From 03dacaa8810bda4ccba3222dcb824410424d9752 Mon Sep 17 00:00:00 2001 From: Zhengyu Gu Date: Wed, 20 Sep 2017 20:54:29 -0400 Subject: [PATCH 01/80] 8187331: VirtualSpaceList tracks free space on wrong node Fixed miscounting of virtual space node's free memory Reviewed-by: shade, coleenp, stuefe --- src/hotspot/share/memory/metaspace.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/hotspot/share/memory/metaspace.cpp b/src/hotspot/share/memory/metaspace.cpp index 4a86e8efcda..b1d90841010 100644 --- a/src/hotspot/share/memory/metaspace.cpp +++ b/src/hotspot/share/memory/metaspace.cpp @@ -1291,7 +1291,7 @@ VirtualSpaceList::VirtualSpaceList(ReservedSpace rs) : } size_t VirtualSpaceList::free_bytes() { - return virtual_space_list()->free_words_in_vs() * BytesPerWord; + return current_virtual_space()->free_words_in_vs() * BytesPerWord; } // Allocate another meta virtual space and add it to the list. From 8969bd19e05e0c6245c7d9bc8e9331ffe7e49b8a Mon Sep 17 00:00:00 2001 From: Zhengyu Gu Date: Mon, 25 Sep 2017 11:56:21 -0400 Subject: [PATCH 02/80] 8187629: NMT: Memory miscounting in compiler (C2) Fixed memory counting in compiler (C2) Reviewed-by: adinn, cjplummer, kvn --- src/hotspot/share/memory/resourceArea.hpp | 6 +++--- src/hotspot/share/opto/chaitin.cpp | 4 ++-- src/hotspot/share/opto/gcm.cpp | 2 +- src/hotspot/share/opto/matcher.cpp | 2 +- 4 files changed, 7 insertions(+), 7 deletions(-) diff --git a/src/hotspot/share/memory/resourceArea.hpp b/src/hotspot/share/memory/resourceArea.hpp index 89ad7457314..72dcddf0f0d 100644 --- a/src/hotspot/share/memory/resourceArea.hpp +++ b/src/hotspot/share/memory/resourceArea.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 1997, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -49,11 +49,11 @@ class ResourceArea: public Arena { debug_only(static int _warned;) // to suppress multiple warnings public: - ResourceArea() : Arena(mtThread) { + ResourceArea(MEMFLAGS flags = mtThread) : Arena(flags) { debug_only(_nesting = 0;) } - ResourceArea(size_t init_size) : Arena(mtThread, init_size) { + ResourceArea(size_t init_size, MEMFLAGS flags = mtThread) : Arena(flags, init_size) { debug_only(_nesting = 0;); } diff --git a/src/hotspot/share/opto/chaitin.cpp b/src/hotspot/share/opto/chaitin.cpp index 901f53023a7..914dc43f64f 100644 --- a/src/hotspot/share/opto/chaitin.cpp +++ b/src/hotspot/share/opto/chaitin.cpp @@ -348,8 +348,8 @@ void PhaseChaitin::Register_Allocate() { _alternate = 0; _matcher._allocation_started = true; - ResourceArea split_arena; // Arena for Split local resources - ResourceArea live_arena; // Arena for liveness & IFG info + ResourceArea split_arena(mtCompiler); // Arena for Split local resources + ResourceArea live_arena(mtCompiler); // Arena for liveness & IFG info ResourceMark rm(&live_arena); // Need live-ness for the IFG; need the IFG for coalescing. If the diff --git a/src/hotspot/share/opto/gcm.cpp b/src/hotspot/share/opto/gcm.cpp index 92cc001f141..50724090270 100644 --- a/src/hotspot/share/opto/gcm.cpp +++ b/src/hotspot/share/opto/gcm.cpp @@ -1424,7 +1424,7 @@ void PhaseCFG::global_code_motion() { // Enabling the scheduler for register pressure plus finding blocks of size to schedule for it // is key to enabling this feature. PhaseChaitin regalloc(C->unique(), *this, _matcher, true); - ResourceArea live_arena; // Arena for liveness + ResourceArea live_arena(mtCompiler); // Arena for liveness ResourceMark rm_live(&live_arena); PhaseLive live(*this, regalloc._lrg_map.names(), &live_arena, true); PhaseIFG ifg(&live_arena); diff --git a/src/hotspot/share/opto/matcher.cpp b/src/hotspot/share/opto/matcher.cpp index b15875ccce1..19cdfb99584 100644 --- a/src/hotspot/share/opto/matcher.cpp +++ b/src/hotspot/share/opto/matcher.cpp @@ -69,7 +69,7 @@ Matcher::Matcher() _register_save_type(register_save_type), _ruleName(ruleName), _allocation_started(false), - _states_arena(Chunk::medium_size), + _states_arena(Chunk::medium_size, mtCompiler), _visited(&_states_arena), _shared(&_states_arena), _dontcare(&_states_arena) { From 80184d351526ba38e4d6ddd6508a3e35ad5844e2 Mon Sep 17 00:00:00 2001 From: John Paul Adrian Glaubitz Date: Tue, 26 Sep 2017 04:52:02 -0400 Subject: [PATCH 03/80] 8187590: Zero runtime can lock-up on linux-alpha Reviewed-by: aph, dholmes --- .../os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp b/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp index 20d851c9234..6bda67d54d6 100644 --- a/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp +++ b/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp @@ -56,8 +56,16 @@ typedef void (__kernel_dmb_t) (void); #else // PPC +#ifdef ALPHA + +#define LIGHT_MEM_BARRIER __sync_synchronize() + +#else // ALPHA + #define LIGHT_MEM_BARRIER __asm __volatile ("":::"memory") +#endif // ALPHA + #endif // PPC #endif // ARM From 2f137ced944469ccc80e419d6f41394405911cf9 Mon Sep 17 00:00:00 2001 From: Thomas Stuefe Date: Tue, 26 Sep 2017 11:25:34 +0200 Subject: [PATCH 04/80] 8187028: [aix] Real thread stack size may be up to 64K smaller than requested one Reviewed-by: goetz --- src/hotspot/os/aix/os_aix.cpp | 19 +++++++++++++++++-- 1 file changed, 17 insertions(+), 2 deletions(-) diff --git a/src/hotspot/os/aix/os_aix.cpp b/src/hotspot/os/aix/os_aix.cpp index 70441018902..ad59ff3b788 100644 --- a/src/hotspot/os/aix/os_aix.cpp +++ b/src/hotspot/os/aix/os_aix.cpp @@ -770,8 +770,15 @@ static void *thread_native_entry(Thread *thread) { const pthread_t pthread_id = ::pthread_self(); const tid_t kernel_thread_id = ::thread_self(); - log_info(os, thread)("Thread is alive (tid: " UINTX_FORMAT ", kernel thread id: " UINTX_FORMAT ").", - os::current_thread_id(), (uintx) kernel_thread_id); + LogTarget(Info, os, thread) lt; + if (lt.is_enabled()) { + address low_address = thread->stack_end(); + address high_address = thread->stack_base(); + lt.print("Thread is alive (tid: " UINTX_FORMAT ", kernel thread id: " UINTX_FORMAT + ", stack [" PTR_FORMAT " - " PTR_FORMAT " (" SIZE_FORMAT "k using %uk pages)).", + os::current_thread_id(), (uintx) kernel_thread_id, low_address, high_address, + (high_address - low_address) / K, os::Aix::query_pagesize(low_address) / K); + } // Normally, pthread stacks on AIX live in the data segment (are allocated with malloc() // by the pthread library). In rare cases, this may not be the case, e.g. when third-party @@ -864,6 +871,14 @@ bool os::create_thread(Thread* thread, ThreadType thr_type, // Calculate stack size if it's not specified by caller. size_t stack_size = os::Posix::get_initial_stack_size(thr_type, req_stack_size); + // JDK-8187028: It was observed that on some configurations (4K backed thread stacks) + // the real thread stack size may be smaller than the requested stack size, by as much as 64K. + // This very much looks like a pthread lib error. As a workaround, increase the stack size + // by 64K for small thread stacks (arbitrarily choosen to be < 4MB) + if (stack_size < 4096 * K) { + stack_size += 64 * K; + } + // On Aix, pthread_attr_setstacksize fails with huge values and leaves the // thread size in attr unchanged. If this is the minimal stack size as set // by pthread_attr_init this leads to crashes after thread creation. E.g. the From 070104325caf4e0e5d17e47749de80cad72cb80c Mon Sep 17 00:00:00 2001 From: Yasumasa Suenaga Date: Tue, 26 Sep 2017 06:53:35 -0400 Subject: [PATCH 05/80] 8187597: WrongTypeException is occurred at CLHSDB jstack after JDK-8186837 Reviewed-by: rehn, cjplummer, dholmes --- .../share/classes/sun/jvm/hotspot/code/NMethod.java | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/NMethod.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/NMethod.java index 84ec0a195ea..880b86b6e3e 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/NMethod.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/NMethod.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2000, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -71,7 +71,7 @@ public class NMethod extends CompiledMethod { stack. An not_entrant method can be removed when there is no more activations, i.e., when the _stack_traversal_mark is less than current sweep traversal index. */ - private static JLongField stackTraversalMarkField; + private static CIntegerField stackTraversalMarkField; private static CIntegerField compLevelField; @@ -105,7 +105,7 @@ public class NMethod extends CompiledMethod { verifiedEntryPointField = type.getAddressField("_verified_entry_point"); osrEntryPointField = type.getAddressField("_osr_entry_point"); lockCountField = type.getJIntField("_lock_count"); - stackTraversalMarkField = type.getJLongField("_stack_traversal_mark"); + stackTraversalMarkField = type.getCIntegerField("_stack_traversal_mark"); compLevelField = type.getCIntegerField("_comp_level"); pcDescSize = db.lookupType("PcDesc").getSize(); } From 2781cf9c38496a01881de083b33a85d237b95f08 Mon Sep 17 00:00:00 2001 From: Harold Seigel Date: Tue, 26 Sep 2017 08:58:04 -0400 Subject: [PATCH 06/80] 8187436: -Xbootclasspath/a causes sanity check assertion with exploded build Fixed asserts to work properly with exploded build Reviewed-by: alanb, jiangli, gtriantafill --- src/hotspot/share/classfile/classLoader.hpp | 3 +- .../GetPackageXbootclasspath.java | 59 +++++++++++++++++++ 2 files changed, 61 insertions(+), 1 deletion(-) create mode 100644 test/hotspot/jtreg/runtime/getSysPackage/GetPackageXbootclasspath.java diff --git a/src/hotspot/share/classfile/classLoader.hpp b/src/hotspot/share/classfile/classLoader.hpp index b5633962008..c3f363c0326 100644 --- a/src/hotspot/share/classfile/classLoader.hpp +++ b/src/hotspot/share/classfile/classLoader.hpp @@ -403,7 +403,8 @@ class ClassLoader: AllStatic { static int compute_Object_vtable(); static ClassPathEntry* classpath_entry(int n) { - assert(n >= 0 && n < _num_entries, "sanity"); + assert(n >= 0, "sanity"); + assert(!has_jrt_entry() || n < _num_entries, "sanity"); if (n == 0) { assert(has_jrt_entry(), "No class path entry at 0 for exploded module builds"); return ClassLoader::_jrt_entry; diff --git a/test/hotspot/jtreg/runtime/getSysPackage/GetPackageXbootclasspath.java b/test/hotspot/jtreg/runtime/getSysPackage/GetPackageXbootclasspath.java new file mode 100644 index 00000000000..5884adfc524 --- /dev/null +++ b/test/hotspot/jtreg/runtime/getSysPackage/GetPackageXbootclasspath.java @@ -0,0 +1,59 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @bug 8187436 + * @summary Test that getPackage() works with a class loaded via -Xbootclasspath/a. + * @library /test/lib + * @run main/othervm GetPackageXbootclasspath + */ + +// This is a regression test for a bug with the exploded build but should pass +// when run with either the normal or exploded build. +import jdk.test.lib.compiler.InMemoryJavaCompiler; +import jdk.test.lib.process.ProcessTools; +import jdk.test.lib.process.OutputAnalyzer; + +public class GetPackageXbootclasspath { + + public static void main(String args[]) throws Exception { + + String Test_src = + "package P; " + + "public class Test { " + + "public static void main(String[] args) throws Exception { " + + "Package p = Test.class.getPackage(); " + + "System.out.println(\"Test Passed\"); " + + "} " + + "}"; + + String test_classes = System.getProperty("test.classes"); + ClassFileInstaller.writeClassToDisk("P/Test", + InMemoryJavaCompiler.compile("P.Test", Test_src), test_classes); + + new OutputAnalyzer(ProcessTools.createJavaProcessBuilder( + "-Xbootclasspath/a:" + test_classes, "P.Test") + .start()).shouldContain("Test Passed"); + } +} From 03d1c13fa3bb76c62d2fc872fa03dbe684e69f7f Mon Sep 17 00:00:00 2001 From: Coleen Phillimore Date: Tue, 26 Sep 2017 10:03:17 -0400 Subject: [PATCH 07/80] 8081323: ConstantPool::_resolved_references is missing in heap dump Add resolved_references and init_lock as hidden static field in class so root is found. Reviewed-by: hseigel, jiangli, sspitsyn --- src/hotspot/share/classfile/vmSymbols.hpp | 2 + src/hotspot/share/oops/constantPool.cpp | 10 +++++ src/hotspot/share/oops/constantPool.hpp | 1 + src/hotspot/share/services/heapDumper.cpp | 50 ++++++++++++++++++++++- 4 files changed, 62 insertions(+), 1 deletion(-) diff --git a/src/hotspot/share/classfile/vmSymbols.hpp b/src/hotspot/share/classfile/vmSymbols.hpp index 6bd7412cfb2..9551124f7df 100644 --- a/src/hotspot/share/classfile/vmSymbols.hpp +++ b/src/hotspot/share/classfile/vmSymbols.hpp @@ -461,6 +461,8 @@ template(getProtectionDomain_signature, "(Ljava/security/CodeSource;)Ljava/security/ProtectionDomain;") \ template(url_code_signer_array_void_signature, "(Ljava/net/URL;[Ljava/security/CodeSigner;)V") \ template(module_entry_name, "module_entry") \ + template(resolved_references_name, "") \ + template(init_lock_name, "") \ \ /* name symbols needed by intrinsics */ \ VM_INTRINSICS_DO(VM_INTRINSIC_IGNORE, VM_SYMBOL_IGNORE, template, VM_SYMBOL_IGNORE, VM_ALIAS_IGNORE) \ diff --git a/src/hotspot/share/oops/constantPool.cpp b/src/hotspot/share/oops/constantPool.cpp index 7e9534baae3..158103c1dc1 100644 --- a/src/hotspot/share/oops/constantPool.cpp +++ b/src/hotspot/share/oops/constantPool.cpp @@ -135,6 +135,16 @@ objArrayOop ConstantPool::resolved_references() const { return (objArrayOop)_cache->resolved_references(); } +// Called from outside constant pool resolution where a resolved_reference array +// may not be present. +objArrayOop ConstantPool::resolved_references_or_null() const { + if (_cache == NULL) { + return NULL; + } else { + return (objArrayOop)_cache->resolved_references(); + } +} + // Create resolved_references array and mapping array for original cp indexes // The ldc bytecode was rewritten to have the resolved reference array index so need a way // to map it back for resolving and some unlikely miscellaneous uses. diff --git a/src/hotspot/share/oops/constantPool.hpp b/src/hotspot/share/oops/constantPool.hpp index 88b772937ce..b2c0fa18f24 100644 --- a/src/hotspot/share/oops/constantPool.hpp +++ b/src/hotspot/share/oops/constantPool.hpp @@ -226,6 +226,7 @@ class ConstantPool : public Metadata { // resolved strings, methodHandles and callsite objects from the constant pool objArrayOop resolved_references() const; + objArrayOop resolved_references_or_null() const; // mapping resolved object array indexes to cp indexes and back. int object_to_cp_index(int index) { return reference_map()->at(index); } int cp_to_object_index(int index); diff --git a/src/hotspot/share/services/heapDumper.cpp b/src/hotspot/share/services/heapDumper.cpp index 18241c22448..3df6d0a8494 100644 --- a/src/hotspot/share/services/heapDumper.cpp +++ b/src/hotspot/share/services/heapDumper.cpp @@ -856,6 +856,29 @@ void DumperSupport::dump_static_fields(DumpWriter* writer, Klass* k) { if (fldc.access_flags().is_static()) field_count++; } + // Add in resolved_references which is referenced by the cpCache + // The resolved_references is an array per InstanceKlass holding the + // strings and other oops resolved from the constant pool. + oop resolved_references = ik->constants()->resolved_references_or_null(); + if (resolved_references != NULL) { + field_count++; + + // Add in the resolved_references of the used previous versions of the class + // in the case of RedefineClasses + InstanceKlass* prev = ik->previous_versions(); + while (prev != NULL && prev->constants()->resolved_references_or_null() != NULL) { + field_count++; + prev = prev->previous_versions(); + } + } + + // Also provide a pointer to the init_lock if present, so there aren't unreferenced int[0] + // arrays. + oop init_lock = ik->init_lock(); + if (init_lock != NULL) { + field_count++; + } + writer->write_u2(field_count); // pass 2 - dump the field descriptors and raw values @@ -873,6 +896,29 @@ void DumperSupport::dump_static_fields(DumpWriter* writer, Klass* k) { dump_field_value(writer, sig->byte_at(0), addr); } } + + // Add resolved_references for each class that has them + if (resolved_references != NULL) { + writer->write_symbolID(vmSymbols::resolved_references_name()); // name + writer->write_u1(sig2tag(vmSymbols::object_array_signature())); // type + writer->write_objectID(resolved_references); + + // Also write any previous versions + InstanceKlass* prev = ik->previous_versions(); + while (prev != NULL && prev->constants()->resolved_references_or_null() != NULL) { + writer->write_symbolID(vmSymbols::resolved_references_name()); // name + writer->write_u1(sig2tag(vmSymbols::object_array_signature())); // type + writer->write_objectID(prev->constants()->resolved_references()); + prev = prev->previous_versions(); + } + } + + // Add init lock to the end if the class is not yet initialized + if (init_lock != NULL) { + writer->write_symbolID(vmSymbols::init_lock_name()); // name + writer->write_u1(sig2tag(vmSymbols::int_array_signature())); // type + writer->write_objectID(init_lock); + } } // dump the raw values of the instance fields of the given object @@ -908,7 +954,7 @@ void DumperSupport::dump_instance_field_descriptors(DumpWriter* writer, Klass* k if (!fld.access_flags().is_static()) { Symbol* sig = fld.signature(); - writer->write_symbolID(fld.name()); // name + writer->write_symbolID(fld.name()); // name writer->write_u1(sig2tag(sig)); // type } } @@ -1822,6 +1868,8 @@ void VM_HeapDumper::doit() { // HPROF_GC_ROOT_JNI_GLOBAL JNIGlobalsDumper jni_dumper(writer()); JNIHandles::oops_do(&jni_dumper); + Universe::oops_do(&jni_dumper); // technically not jni roots, but global roots + // for things like preallocated throwable backtraces check_segment_length(); // HPROF_GC_ROOT_STICKY_CLASS From 6d015ba5025989ca89225c101e7cd49b8168f4f4 Mon Sep 17 00:00:00 2001 From: Lutz Schmidt Date: Tue, 26 Sep 2017 17:06:06 +0200 Subject: [PATCH 08/80] 8187573: [s390] z/Architecture Vector Facility Support Reviewed-by: mdoerr --- src/hotspot/cpu/s390/assembler_s390.hpp | 656 +++++++++++++++++- .../cpu/s390/assembler_s390.inline.hpp | 394 ++++++++++- .../cpu/s390/register_definitions_s390.cpp | 6 +- src/hotspot/cpu/s390/register_s390.cpp | 14 +- src/hotspot/cpu/s390/register_s390.hpp | 203 +++++- 5 files changed, 1239 insertions(+), 34 deletions(-) diff --git a/src/hotspot/cpu/s390/assembler_s390.hpp b/src/hotspot/cpu/s390/assembler_s390.hpp index 8a7ae9d0756..6e2820ce980 100644 --- a/src/hotspot/cpu/s390/assembler_s390.hpp +++ b/src/hotspot/cpu/s390/assembler_s390.hpp @@ -1,6 +1,6 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. - * Copyright (c) 2016 SAP SE. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -250,7 +250,6 @@ class Address VALUE_OBJ_CLASS_SPEC { bool is_RSform() { return has_base() && !has_index() && is_disp12(); } bool is_RSYform() { return has_base() && !has_index() && is_disp20(); } bool is_RXform() { return has_base() && has_index() && is_disp12(); } - bool is_RXEform() { return has_base() && has_index() && is_disp12(); } bool is_RXYform() { return has_base() && has_index() && is_disp20(); } bool uses(Register r) { return _base == r || _index == r; }; @@ -1093,7 +1092,194 @@ class Assembler : public AbstractAssembler { #define TRTT_ZOPC (unsigned int)(0xb9 << 24 | 0x90 << 16) -// Miscellaneous Operations +//--------------------------- +//-- Vector Instructions -- +//--------------------------- + +//---< Vector Support Instructions >--- + +//--- Load (memory) --- + +#define VLM_ZOPC (unsigned long)(0xe7L << 40 | 0x36L << 0) // load full vreg range (n * 128 bit) +#define VL_ZOPC (unsigned long)(0xe7L << 40 | 0x06L << 0) // load full vreg (128 bit) +#define VLEB_ZOPC (unsigned long)(0xe7L << 40 | 0x00L << 0) // load vreg element (8 bit) +#define VLEH_ZOPC (unsigned long)(0xe7L << 40 | 0x01L << 0) // load vreg element (16 bit) +#define VLEF_ZOPC (unsigned long)(0xe7L << 40 | 0x03L << 0) // load vreg element (32 bit) +#define VLEG_ZOPC (unsigned long)(0xe7L << 40 | 0x02L << 0) // load vreg element (64 bit) + +#define VLREP_ZOPC (unsigned long)(0xe7L << 40 | 0x05L << 0) // load and replicate into all vector elements +#define VLLEZ_ZOPC (unsigned long)(0xe7L << 40 | 0x04L << 0) // load logical element and zero. + +// vector register gather +#define VGEF_ZOPC (unsigned long)(0xe7L << 40 | 0x13L << 0) // gather element (32 bit), V1(M3) = [D2(V2(M3),B2)] +#define VGEG_ZOPC (unsigned long)(0xe7L << 40 | 0x12L << 0) // gather element (64 bit), V1(M3) = [D2(V2(M3),B2)] +// vector register scatter +#define VSCEF_ZOPC (unsigned long)(0xe7L << 40 | 0x1bL << 0) // vector scatter element FW +#define VSCEG_ZOPC (unsigned long)(0xe7L << 40 | 0x1aL << 0) // vector scatter element DW + +#define VLBB_ZOPC (unsigned long)(0xe7L << 40 | 0x07L << 0) // load vreg to block boundary (load to alignment). +#define VLL_ZOPC (unsigned long)(0xe7L << 40 | 0x37L << 0) // load vreg with length. + +//--- Load (register) --- + +#define VLR_ZOPC (unsigned long)(0xe7L << 40 | 0x56L << 0) // copy full vreg (128 bit) +#define VLGV_ZOPC (unsigned long)(0xe7L << 40 | 0x21L << 0) // copy vreg element -> GR +#define VLVG_ZOPC (unsigned long)(0xe7L << 40 | 0x22L << 0) // copy GR -> vreg element +#define VLVGP_ZOPC (unsigned long)(0xe7L << 40 | 0x62L << 0) // copy GR2, GR3 (disjoint pair) -> vreg + +// vector register pack: cut in half the size the source vector elements +#define VPK_ZOPC (unsigned long)(0xe7L << 40 | 0x94L << 0) // just cut +#define VPKS_ZOPC (unsigned long)(0xe7L << 40 | 0x97L << 0) // saturate as signed values +#define VPKLS_ZOPC (unsigned long)(0xe7L << 40 | 0x95L << 0) // saturate as unsigned values + +// vector register unpack: double in size the source vector elements +#define VUPH_ZOPC (unsigned long)(0xe7L << 40 | 0xd7L << 0) // signed, left half of the source vector elements +#define VUPLH_ZOPC (unsigned long)(0xe7L << 40 | 0xd5L << 0) // unsigned, left half of the source vector elements +#define VUPL_ZOPC (unsigned long)(0xe7L << 40 | 0xd6L << 0) // signed, right half of the source vector elements +#define VUPLL_ZOPC (unsigned long)(0xe7L << 40 | 0xd4L << 0) // unsigned, right half of the source vector element + +// vector register merge +#define VMRH_ZOPC (unsigned long)(0xe7L << 40 | 0x61L << 0) // register merge high (left half of source registers) +#define VMRL_ZOPC (unsigned long)(0xe7L << 40 | 0x60L << 0) // register merge low (right half of source registers) + +// vector register permute +#define VPERM_ZOPC (unsigned long)(0xe7L << 40 | 0x8cL << 0) // vector permute +#define VPDI_ZOPC (unsigned long)(0xe7L << 40 | 0x84L << 0) // vector permute DW immediate + +// vector register replicate +#define VREP_ZOPC (unsigned long)(0xe7L << 40 | 0x4dL << 0) // vector replicate +#define VREPI_ZOPC (unsigned long)(0xe7L << 40 | 0x45L << 0) // vector replicate immediate +#define VSEL_ZOPC (unsigned long)(0xe7L << 40 | 0x8dL << 0) // vector select + +#define VSEG_ZOPC (unsigned long)(0xe7L << 40 | 0x5fL << 0) // vector sign-extend to DW (rightmost element in each DW). + +//--- Load (immediate) --- + +#define VLEIB_ZOPC (unsigned long)(0xe7L << 40 | 0x40L << 0) // load vreg element (16 bit imm to 8 bit) +#define VLEIH_ZOPC (unsigned long)(0xe7L << 40 | 0x41L << 0) // load vreg element (16 bit imm to 16 bit) +#define VLEIF_ZOPC (unsigned long)(0xe7L << 40 | 0x43L << 0) // load vreg element (16 bit imm to 32 bit) +#define VLEIG_ZOPC (unsigned long)(0xe7L << 40 | 0x42L << 0) // load vreg element (16 bit imm to 64 bit) + +//--- Store --- + +#define VSTM_ZOPC (unsigned long)(0xe7L << 40 | 0x3eL << 0) // store full vreg range (n * 128 bit) +#define VST_ZOPC (unsigned long)(0xe7L << 40 | 0x0eL << 0) // store full vreg (128 bit) +#define VSTEB_ZOPC (unsigned long)(0xe7L << 40 | 0x08L << 0) // store vreg element (8 bit) +#define VSTEH_ZOPC (unsigned long)(0xe7L << 40 | 0x09L << 0) // store vreg element (16 bit) +#define VSTEF_ZOPC (unsigned long)(0xe7L << 40 | 0x0bL << 0) // store vreg element (32 bit) +#define VSTEG_ZOPC (unsigned long)(0xe7L << 40 | 0x0aL << 0) // store vreg element (64 bit) +#define VSTL_ZOPC (unsigned long)(0xe7L << 40 | 0x3fL << 0) // store vreg with length. + +//--- Misc --- + +#define VGM_ZOPC (unsigned long)(0xe7L << 40 | 0x46L << 0) // generate bit mask, [start..end] = '1', else '0' +#define VGBM_ZOPC (unsigned long)(0xe7L << 40 | 0x44L << 0) // generate byte mask, bits(imm16) -> bytes + +//---< Vector Arithmetic Instructions >--- + +// Load +#define VLC_ZOPC (unsigned long)(0xe7L << 40 | 0xdeL << 0) // V1 := -V2, element size = 2**m +#define VLP_ZOPC (unsigned long)(0xe7L << 40 | 0xdfL << 0) // V1 := |V2|, element size = 2**m + +// ADD +#define VA_ZOPC (unsigned long)(0xe7L << 40 | 0xf3L << 0) // V1 := V2 + V3, element size = 2**m +#define VACC_ZOPC (unsigned long)(0xe7L << 40 | 0xf1L << 0) // V1 := carry(V2 + V3), element size = 2**m + +// SUB +#define VS_ZOPC (unsigned long)(0xe7L << 40 | 0xf7L << 0) // V1 := V2 - V3, element size = 2**m +#define VSCBI_ZOPC (unsigned long)(0xe7L << 40 | 0xf5L << 0) // V1 := borrow(V2 - V3), element size = 2**m + +// MUL +#define VML_ZOPC (unsigned long)(0xe7L << 40 | 0xa2L << 0) // V1 := V2 * V3, element size = 2**m +#define VMH_ZOPC (unsigned long)(0xe7L << 40 | 0xa3L << 0) // V1 := V2 * V3, element size = 2**m +#define VMLH_ZOPC (unsigned long)(0xe7L << 40 | 0xa1L << 0) // V1 := V2 * V3, element size = 2**m, unsigned +#define VME_ZOPC (unsigned long)(0xe7L << 40 | 0xa6L << 0) // V1 := V2 * V3, element size = 2**m +#define VMLE_ZOPC (unsigned long)(0xe7L << 40 | 0xa4L << 0) // V1 := V2 * V3, element size = 2**m, unsigned +#define VMO_ZOPC (unsigned long)(0xe7L << 40 | 0xa7L << 0) // V1 := V2 * V3, element size = 2**m +#define VMLO_ZOPC (unsigned long)(0xe7L << 40 | 0xa5L << 0) // V1 := V2 * V3, element size = 2**m, unsigned + +// MUL & ADD +#define VMAL_ZOPC (unsigned long)(0xe7L << 40 | 0xaaL << 0) // V1 := V2 * V3 + V4, element size = 2**m +#define VMAH_ZOPC (unsigned long)(0xe7L << 40 | 0xabL << 0) // V1 := V2 * V3 + V4, element size = 2**m +#define VMALH_ZOPC (unsigned long)(0xe7L << 40 | 0xa9L << 0) // V1 := V2 * V3 + V4, element size = 2**m, unsigned +#define VMAE_ZOPC (unsigned long)(0xe7L << 40 | 0xaeL << 0) // V1 := V2 * V3 + V4, element size = 2**m +#define VMALE_ZOPC (unsigned long)(0xe7L << 40 | 0xacL << 0) // V1 := V2 * V3 + V4, element size = 2**m, unsigned +#define VMAO_ZOPC (unsigned long)(0xe7L << 40 | 0xafL << 0) // V1 := V2 * V3 + V4, element size = 2**m +#define VMALO_ZOPC (unsigned long)(0xe7L << 40 | 0xadL << 0) // V1 := V2 * V3 + V4, element size = 2**m, unsigned + +// Vector SUM +#define VSUM_ZOPC (unsigned long)(0xe7L << 40 | 0x64L << 0) // V1[j] := toFW(sum(V2[i]) + V3[j]), subelements: byte or HW +#define VSUMG_ZOPC (unsigned long)(0xe7L << 40 | 0x65L << 0) // V1[j] := toDW(sum(V2[i]) + V3[j]), subelements: HW or FW +#define VSUMQ_ZOPC (unsigned long)(0xe7L << 40 | 0x67L << 0) // V1[j] := toQW(sum(V2[i]) + V3[j]), subelements: FW or DW + +// Average +#define VAVG_ZOPC (unsigned long)(0xe7L << 40 | 0xf2L << 0) // V1 := (V2+V3+1)/2, signed, element size = 2**m +#define VAVGL_ZOPC (unsigned long)(0xe7L << 40 | 0xf0L << 0) // V1 := (V2+V3+1)/2, unsigned, element size = 2**m + +// VECTOR Galois Field Multiply Sum +#define VGFM_ZOPC (unsigned long)(0xe7L << 40 | 0xb4L << 0) +#define VGFMA_ZOPC (unsigned long)(0xe7L << 40 | 0xbcL << 0) + +//---< Vector Logical Instructions >--- + +// AND +#define VN_ZOPC (unsigned long)(0xe7L << 40 | 0x68L << 0) // V1 := V2 & V3, element size = 2**m +#define VNC_ZOPC (unsigned long)(0xe7L << 40 | 0x69L << 0) // V1 := V2 & ~V3, element size = 2**m + +// XOR +#define VX_ZOPC (unsigned long)(0xe7L << 40 | 0x6dL << 0) // V1 := V2 ^ V3, element size = 2**m + +// NOR +#define VNO_ZOPC (unsigned long)(0xe7L << 40 | 0x6bL << 0) // V1 := !(V2 | V3), element size = 2**m + +// OR +#define VO_ZOPC (unsigned long)(0xe7L << 40 | 0x6aL << 0) // V1 := V2 | V3, element size = 2**m + +// Comparison (element-wise) +#define VCEQ_ZOPC (unsigned long)(0xe7L << 40 | 0xf8L << 0) // V1 := (V2 == V3) ? 0xffff : 0x0000, element size = 2**m +#define VCH_ZOPC (unsigned long)(0xe7L << 40 | 0xfbL << 0) // V1 := (V2 > V3) ? 0xffff : 0x0000, element size = 2**m, signed +#define VCHL_ZOPC (unsigned long)(0xe7L << 40 | 0xf9L << 0) // V1 := (V2 > V3) ? 0xffff : 0x0000, element size = 2**m, unsigned + +// Max/Min (element-wise) +#define VMX_ZOPC (unsigned long)(0xe7L << 40 | 0xffL << 0) // V1 := (V2 > V3) ? V2 : V3, element size = 2**m, signed +#define VMXL_ZOPC (unsigned long)(0xe7L << 40 | 0xfdL << 0) // V1 := (V2 > V3) ? V2 : V3, element size = 2**m, unsigned +#define VMN_ZOPC (unsigned long)(0xe7L << 40 | 0xfeL << 0) // V1 := (V2 < V3) ? V2 : V3, element size = 2**m, signed +#define VMNL_ZOPC (unsigned long)(0xe7L << 40 | 0xfcL << 0) // V1 := (V2 < V3) ? V2 : V3, element size = 2**m, unsigned + +// Leading/Trailing Zeros, population count +#define VCLZ_ZOPC (unsigned long)(0xe7L << 40 | 0x53L << 0) // V1 := leadingzeros(V2), element size = 2**m +#define VCTZ_ZOPC (unsigned long)(0xe7L << 40 | 0x52L << 0) // V1 := trailingzeros(V2), element size = 2**m +#define VPOPCT_ZOPC (unsigned long)(0xe7L << 40 | 0x50L << 0) // V1 := popcount(V2), bytewise!! + +// Rotate/Shift +#define VERLLV_ZOPC (unsigned long)(0xe7L << 40 | 0x73L << 0) // V1 := rotateleft(V2), rotate count in V3 element +#define VERLL_ZOPC (unsigned long)(0xe7L << 40 | 0x33L << 0) // V1 := rotateleft(V3), rotate count from d2(b2). +#define VERIM_ZOPC (unsigned long)(0xe7L << 40 | 0x72L << 0) // Rotate then insert under mask. Read Principles of Operation!! + +#define VESLV_ZOPC (unsigned long)(0xe7L << 40 | 0x70L << 0) // V1 := SLL(V2, V3), unsigned, element-wise +#define VESL_ZOPC (unsigned long)(0xe7L << 40 | 0x30L << 0) // V1 := SLL(V3), unsigned, shift count from d2(b2). + +#define VESRAV_ZOPC (unsigned long)(0xe7L << 40 | 0x7AL << 0) // V1 := SRA(V2, V3), signed, element-wise +#define VESRA_ZOPC (unsigned long)(0xe7L << 40 | 0x3AL << 0) // V1 := SRA(V3), signed, shift count from d2(b2). +#define VESRLV_ZOPC (unsigned long)(0xe7L << 40 | 0x78L << 0) // V1 := SRL(V2, V3), unsigned, element-wise +#define VESRL_ZOPC (unsigned long)(0xe7L << 40 | 0x38L << 0) // V1 := SRL(V3), unsigned, shift count from d2(b2). + +#define VSL_ZOPC (unsigned long)(0xe7L << 40 | 0x74L << 0) // V1 := SLL(V2), unsigned, bit-count +#define VSLB_ZOPC (unsigned long)(0xe7L << 40 | 0x75L << 0) // V1 := SLL(V2), unsigned, byte-count +#define VSLDB_ZOPC (unsigned long)(0xe7L << 40 | 0x77L << 0) // V1 := SLL((V2,V3)), unsigned, byte-count + +#define VSRA_ZOPC (unsigned long)(0xe7L << 40 | 0x7eL << 0) // V1 := SRA(V2), signed, bit-count +#define VSRAB_ZOPC (unsigned long)(0xe7L << 40 | 0x7fL << 0) // V1 := SRA(V2), signed, byte-count +#define VSRL_ZOPC (unsigned long)(0xe7L << 40 | 0x7cL << 0) // V1 := SRL(V2), unsigned, bit-count +#define VSRLB_ZOPC (unsigned long)(0xe7L << 40 | 0x7dL << 0) // V1 := SRL(V2), unsigned, byte-count + +// Test under Mask +#define VTM_ZOPC (unsigned long)(0xe7L << 40 | 0xd8L << 0) // Like TM, set CC according to state of selected bits. + + +//-------------------------------- +//-- Miscellaneous Operations -- +//-------------------------------- // Execute #define EX_ZOPC (unsigned int)(68L << 24) @@ -1280,6 +1466,21 @@ class Assembler : public AbstractAssembler { to_minus_infinity = 7 }; + // Vector Register Element Type. + enum VRegElemType { + VRET_BYTE = 0, + VRET_HW = 1, + VRET_FW = 2, + VRET_DW = 3, + VRET_QW = 4 + }; + + // Vector Operation Condition Code Control. + enum VOpCCC { + VOP_CCIGN = 0, // ignore, don't set CC + VOP_CCSET = 1 // set the CC + }; + // Inverse condition code, i.e. determine "15 - cc" for a given condition code cc. static branch_condition inverse_condition(branch_condition cc); static branch_condition inverse_float_condition(branch_condition cc); @@ -1376,6 +1577,60 @@ class Assembler : public AbstractAssembler { return r; } + static int64_t rsmask_48( Address a) { assert(a.is_RSform(), "bad address format"); return rsmask_48( a.disp12(), a.base()); } + static int64_t rxmask_48( Address a) { if (a.is_RXform()) { return rxmask_48( a.disp12(), a.index(), a.base()); } + else if (a.is_RSform()) { return rsmask_48( a.disp12(), a.base()); } + else { guarantee(false, "bad address format"); return 0; } + } + static int64_t rsymask_48(Address a) { assert(a.is_RSYform(), "bad address format"); return rsymask_48(a.disp20(), a.base()); } + static int64_t rxymask_48(Address a) { if (a.is_RXYform()) { return rxymask_48( a.disp20(), a.index(), a.base()); } + else if (a.is_RSYform()) { return rsymask_48( a.disp20(), a.base()); } + else { guarantee(false, "bad address format"); return 0; } + } + + static int64_t rsmask_48( int64_t d2, Register b2) { return uimm12(d2, 20, 48) | regz(b2, 16, 48); } + static int64_t rxmask_48( int64_t d2, Register x2, Register b2) { return uimm12(d2, 20, 48) | reg(x2, 12, 48) | regz(b2, 16, 48); } + static int64_t rsymask_48(int64_t d2, Register b2) { return simm20(d2) | regz(b2, 16, 48); } + static int64_t rxymask_48(int64_t d2, Register x2, Register b2) { return simm20(d2) | reg(x2, 12, 48) | regz(b2, 16, 48); } + + // Address calculated from d12(vx,b) - vx is vector index register. + static int64_t rvmask_48( int64_t d2, VectorRegister x2, Register b2) { return uimm12(d2, 20, 48) | vreg(x2, 12) | regz(b2, 16, 48); } + + static int64_t vreg_mask(VectorRegister v, int pos) { + return vreg(v, pos) | v->RXB_mask(pos); + } + + // Vector Element Size Control. 4-bit field which indicates the size of the vector elements. + static int64_t vesc_mask(int64_t size, int min_size, int max_size, int pos) { + // min_size - minimum element size. Not all instructions support element sizes beginning with "byte". + // max_size - maximum element size. Not all instructions support element sizes up to "QW". + assert((min_size <= size) && (size <= max_size), "element size control out of range"); + return uimm4(size, pos, 48); + } + + // Vector Element IndeX. 4-bit field which indexes the target vector element. + static int64_t veix_mask(int64_t ix, int el_size, int pos) { + // el_size - size of the vector element. This is a VRegElemType enum value. + // ix - vector element index. + int max_ix = -1; + switch (el_size) { + case VRET_BYTE: max_ix = 15; break; + case VRET_HW: max_ix = 7; break; + case VRET_FW: max_ix = 3; break; + case VRET_DW: max_ix = 1; break; + case VRET_QW: max_ix = 0; break; + default: guarantee(false, "bad vector element size %d", el_size); break; + } + assert((0 <= ix) && (ix <= max_ix), "element size out of range (0 <= %ld <= %d)", ix, max_ix); + return uimm4(ix, pos, 48); + } + + // Vector Operation Condition Code Control. 4-bit field, one bit of which indicates if the condition code is to be set by the operation. + static int64_t vccc_mask(int64_t flag, int pos) { + assert((flag == VOP_CCIGN) || (flag == VOP_CCSET), "VCCC flag value out of range"); + return uimm4(flag, pos, 48); + } + public: //-------------------------------------------------- @@ -1453,6 +1708,8 @@ class Assembler : public AbstractAssembler { static long imm24(int64_t i24, int s, int len) { return imm(i24, 24) << (len-s-24); } static long imm32(int64_t i32, int s, int len) { return imm(i32, 32) << (len-s-32); } + static long vreg(VectorRegister v, int pos) { const int len = 48; return u_field(v->encoding()&0x0f, (len-pos)-1, (len-pos)-4) | v->RXB_mask(pos); } + static long fregt(FloatRegister r, int s, int len) { return freg(r,s,len); } static long freg( FloatRegister r, int s, int len) { return u_field(r->encoding(), (len-s)-1, (len-s)-4); } @@ -2125,6 +2382,397 @@ class Assembler : public AbstractAssembler { inline void z_trtt(Register r1, Register r2, int64_t m3); + //--------------------------- + //-- Vector Instructions -- + //--------------------------- + + //---< Vector Support Instructions >--- + + // Load (transfer from memory) + inline void z_vlm( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vl( VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vleb( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vleh( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vlef( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vleg( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + + // Gather/Scatter + inline void z_vgef( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3); + inline void z_vgeg( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3); + + inline void z_vscef( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3); + inline void z_vsceg( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3); + + // load and replicate + inline void z_vlrep( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vlrepb(VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vlreph(VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vlrepf(VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vlrepg(VectorRegister v1, int64_t d2, Register x2, Register b2); + + inline void z_vllez( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vllezb(VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vllezh(VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vllezf(VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vllezg(VectorRegister v1, int64_t d2, Register x2, Register b2); + + inline void z_vlbb( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vll( VectorRegister v1, Register r3, int64_t d2, Register b2); + + // Load (register to register) + inline void z_vlr( VectorRegister v1, VectorRegister v2); + + inline void z_vlgv( Register r1, VectorRegister v3, int64_t d2, Register b2, int64_t m4); + inline void z_vlgvb( Register r1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vlgvh( Register r1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vlgvf( Register r1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vlgvg( Register r1, VectorRegister v3, int64_t d2, Register b2); + + inline void z_vlvg( VectorRegister v1, Register r3, int64_t d2, Register b2, int64_t m4); + inline void z_vlvgb( VectorRegister v1, Register r3, int64_t d2, Register b2); + inline void z_vlvgh( VectorRegister v1, Register r3, int64_t d2, Register b2); + inline void z_vlvgf( VectorRegister v1, Register r3, int64_t d2, Register b2); + inline void z_vlvgg( VectorRegister v1, Register r3, int64_t d2, Register b2); + + inline void z_vlvgp( VectorRegister v1, Register r2, Register r3); + + // vector register pack + inline void z_vpk( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vpkh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpkf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpkg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + inline void z_vpks( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5); + inline void z_vpksh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpksf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpksg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpkshs(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpksfs(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpksgs(VectorRegister v1, VectorRegister v2, VectorRegister v3); + + inline void z_vpkls( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5); + inline void z_vpklsh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpklsf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpklsg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpklshs(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpklsfs(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vpklsgs(VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // vector register unpack (sign-extended) + inline void z_vuph( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vuphb( VectorRegister v1, VectorRegister v2); + inline void z_vuphh( VectorRegister v1, VectorRegister v2); + inline void z_vuphf( VectorRegister v1, VectorRegister v2); + inline void z_vupl( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vuplb( VectorRegister v1, VectorRegister v2); + inline void z_vuplh( VectorRegister v1, VectorRegister v2); + inline void z_vuplf( VectorRegister v1, VectorRegister v2); + + // vector register unpack (zero-extended) + inline void z_vuplh( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vuplhb( VectorRegister v1, VectorRegister v2); + inline void z_vuplhh( VectorRegister v1, VectorRegister v2); + inline void z_vuplhf( VectorRegister v1, VectorRegister v2); + inline void z_vupll( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vupllb( VectorRegister v1, VectorRegister v2); + inline void z_vupllh( VectorRegister v1, VectorRegister v2); + inline void z_vupllf( VectorRegister v1, VectorRegister v2); + + // vector register merge high/low + inline void z_vmrh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmrhb(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmrhh(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmrhf(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmrhg(VectorRegister v1, VectorRegister v2, VectorRegister v3); + + inline void z_vmrl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmrlb(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmrlh(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmrlf(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmrlg(VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // vector register permute + inline void z_vperm( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4); + inline void z_vpdi( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + + // vector register replicate + inline void z_vrep( VectorRegister v1, VectorRegister v3, int64_t imm2, int64_t m4); + inline void z_vrepb( VectorRegister v1, VectorRegister v3, int64_t imm2); + inline void z_vreph( VectorRegister v1, VectorRegister v3, int64_t imm2); + inline void z_vrepf( VectorRegister v1, VectorRegister v3, int64_t imm2); + inline void z_vrepg( VectorRegister v1, VectorRegister v3, int64_t imm2); + inline void z_vrepi( VectorRegister v1, int64_t imm2, int64_t m3); + inline void z_vrepib(VectorRegister v1, int64_t imm2); + inline void z_vrepih(VectorRegister v1, int64_t imm2); + inline void z_vrepif(VectorRegister v1, int64_t imm2); + inline void z_vrepig(VectorRegister v1, int64_t imm2); + + inline void z_vsel( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4); + inline void z_vseg( VectorRegister v1, VectorRegister v2, int64_t imm3); + + // Load (immediate) + inline void z_vleib( VectorRegister v1, int64_t imm2, int64_t m3); + inline void z_vleih( VectorRegister v1, int64_t imm2, int64_t m3); + inline void z_vleif( VectorRegister v1, int64_t imm2, int64_t m3); + inline void z_vleig( VectorRegister v1, int64_t imm2, int64_t m3); + + // Store + inline void z_vstm( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vst( VectorRegister v1, int64_t d2, Register x2, Register b2); + inline void z_vsteb( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vsteh( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vstef( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vsteg( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3); + inline void z_vstl( VectorRegister v1, Register r3, int64_t d2, Register b2); + + // Misc + inline void z_vgm( VectorRegister v1, int64_t imm2, int64_t imm3, int64_t m4); + inline void z_vgmb( VectorRegister v1, int64_t imm2, int64_t imm3); + inline void z_vgmh( VectorRegister v1, int64_t imm2, int64_t imm3); + inline void z_vgmf( VectorRegister v1, int64_t imm2, int64_t imm3); + inline void z_vgmg( VectorRegister v1, int64_t imm2, int64_t imm3); + + inline void z_vgbm( VectorRegister v1, int64_t imm2); + inline void z_vzero( VectorRegister v1); // preferred method to set vreg to all zeroes + inline void z_vone( VectorRegister v1); // preferred method to set vreg to all ones + + //---< Vector Arithmetic Instructions >--- + + // Load + inline void z_vlc( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vlcb( VectorRegister v1, VectorRegister v2); + inline void z_vlch( VectorRegister v1, VectorRegister v2); + inline void z_vlcf( VectorRegister v1, VectorRegister v2); + inline void z_vlcg( VectorRegister v1, VectorRegister v2); + inline void z_vlp( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vlpb( VectorRegister v1, VectorRegister v2); + inline void z_vlph( VectorRegister v1, VectorRegister v2); + inline void z_vlpf( VectorRegister v1, VectorRegister v2); + inline void z_vlpg( VectorRegister v1, VectorRegister v2); + + // ADD + inline void z_va( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vab( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vah( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vaf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vag( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vaq( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vacc( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vaccb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vacch( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vaccf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vaccg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vaccq( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // SUB + inline void z_vs( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vsb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsq( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vscbi( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vscbib( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vscbih( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vscbif( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vscbig( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vscbiq( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // MULTIPLY + inline void z_vml( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmlh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vme( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmle( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmo( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmlo( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + + // MULTIPLY & ADD + inline void z_vmal( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + inline void z_vmah( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + inline void z_vmalh( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + inline void z_vmae( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + inline void z_vmale( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + inline void z_vmao( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + inline void z_vmalo( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + + // VECTOR SUM + inline void z_vsum( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vsumb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsumh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsumg( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vsumgh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsumgf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsumq( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vsumqf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsumqg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // Average + inline void z_vavg( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vavgb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vavgh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vavgf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vavgg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vavgl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vavglb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vavglh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vavglf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vavglg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // VECTOR Galois Field Multiply Sum + inline void z_vgfm( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vgfmb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vgfmh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vgfmf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vgfmg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + // VECTOR Galois Field Multiply Sum and Accumulate + inline void z_vgfma( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5); + inline void z_vgfmab( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4); + inline void z_vgfmah( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4); + inline void z_vgfmaf( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4); + inline void z_vgfmag( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4); + + //---< Vector Logical Instructions >--- + + // AND + inline void z_vn( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vnc( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // XOR + inline void z_vx( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // NOR + inline void z_vno( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // OR + inline void z_vo( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // Comparison (element-wise) + inline void z_vceq( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5); + inline void z_vceqb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vceqh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vceqf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vceqg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vceqbs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vceqhs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vceqfs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vceqgs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vch( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5); + inline void z_vchb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchbs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchhs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchfs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchgs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5); + inline void z_vchlb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchlh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchlf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchlg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchlbs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchlhs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchlfs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vchlgs( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // Max/Min (element-wise) + inline void z_vmx( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmxb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmxh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmxf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmxg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmxl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmxlb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmxlh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmxlf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmxlg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmn( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmnb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmnh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmnf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmng( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmnl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vmnlb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmnlh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmnlf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vmnlg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // Leading/Trailing Zeros, population count + inline void z_vclz( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vclzb( VectorRegister v1, VectorRegister v2); + inline void z_vclzh( VectorRegister v1, VectorRegister v2); + inline void z_vclzf( VectorRegister v1, VectorRegister v2); + inline void z_vclzg( VectorRegister v1, VectorRegister v2); + inline void z_vctz( VectorRegister v1, VectorRegister v2, int64_t m3); + inline void z_vctzb( VectorRegister v1, VectorRegister v2); + inline void z_vctzh( VectorRegister v1, VectorRegister v2); + inline void z_vctzf( VectorRegister v1, VectorRegister v2); + inline void z_vctzg( VectorRegister v1, VectorRegister v2); + inline void z_vpopct( VectorRegister v1, VectorRegister v2, int64_t m3); + + // Rotate/Shift + inline void z_verllv( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_verllvb(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_verllvh(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_verllvf(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_verllvg(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_verll( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4); + inline void z_verllb( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_verllh( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_verllf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_verllg( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_verim( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t m5); + inline void z_verimb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4); + inline void z_verimh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4); + inline void z_verimf( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4); + inline void z_verimg( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4); + + inline void z_veslv( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_veslvb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_veslvh( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_veslvf( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_veslvg( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesl( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4); + inline void z_veslb( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_veslh( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_veslf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_veslg( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + + inline void z_vesrav( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vesravb(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesravh(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesravf(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesravg(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesra( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4); + inline void z_vesrab( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vesrah( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vesraf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vesrag( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vesrlv( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4); + inline void z_vesrlvb(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesrlvh(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesrlvf(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesrlvg(VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vesrl( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4); + inline void z_vesrlb( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vesrlh( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vesrlf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + inline void z_vesrlg( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2); + + inline void z_vsl( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vslb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsldb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4); + + inline void z_vsra( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsrab( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsrl( VectorRegister v1, VectorRegister v2, VectorRegister v3); + inline void z_vsrlb( VectorRegister v1, VectorRegister v2, VectorRegister v3); + + // Test under Mask + inline void z_vtm( VectorRegister v1, VectorRegister v2); + + // Floatingpoint instructions // ========================== diff --git a/src/hotspot/cpu/s390/assembler_s390.inline.hpp b/src/hotspot/cpu/s390/assembler_s390.inline.hpp index 449d0af0bf3..a9d4c078b38 100644 --- a/src/hotspot/cpu/s390/assembler_s390.inline.hpp +++ b/src/hotspot/cpu/s390/assembler_s390.inline.hpp @@ -1,6 +1,6 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. - * Copyright (c) 2016 SAP SE. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -702,6 +702,396 @@ inline void Assembler::z_cvd(Register r1, int64_t d2, Register x2, Register b2) inline void Assembler::z_cvdg(Register r1, int64_t d2, Register x2, Register b2) { emit_48( CVDG_ZOPC | regt(r1, 8, 48) | reg(x2, 12, 48) | reg(b2, 16, 48) | simm20(d2)); } +//--------------------------- +//-- Vector Instructions -- +//--------------------------- + +//---< Vector Support Instructions >--- + +// Load (transfer from memory) +inline void Assembler::z_vlm( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {emit_48(VLM_ZOPC | vreg(v1, 8) | vreg(v3, 12) | rsmask_48(d2, b2)); } +inline void Assembler::z_vl( VectorRegister v1, int64_t d2, Register x2, Register b2) {emit_48(VL_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2)); } +inline void Assembler::z_vleb( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VLEB_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_BYTE, 32)); } +inline void Assembler::z_vleh( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VLEH_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_HW, 32)); } +inline void Assembler::z_vlef( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VLEF_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_FW, 32)); } +inline void Assembler::z_vleg( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VLEG_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_DW, 32)); } + +// Gather/Scatter +inline void Assembler::z_vgef( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3) {emit_48(VGEF_ZOPC | vreg(v1, 8) | rvmask_48(d2, vx2, b2) | veix_mask(m3, VRET_FW, 32)); } +inline void Assembler::z_vgeg( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3) {emit_48(VGEG_ZOPC | vreg(v1, 8) | rvmask_48(d2, vx2, b2) | veix_mask(m3, VRET_DW, 32)); } + +inline void Assembler::z_vscef( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3) {emit_48(VSCEF_ZOPC | vreg(v1, 8) | rvmask_48(d2, vx2, b2) | veix_mask(m3, VRET_FW, 32)); } +inline void Assembler::z_vsceg( VectorRegister v1, int64_t d2, VectorRegister vx2, Register b2, int64_t m3) {emit_48(VSCEG_ZOPC | vreg(v1, 8) | rvmask_48(d2, vx2, b2) | veix_mask(m3, VRET_DW, 32)); } + +// load and replicate +inline void Assembler::z_vlrep( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VLREP_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vlrepb( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vlrep(v1, d2, x2, b2, VRET_BYTE); }// load byte and replicate to all vector elements of type 'B' +inline void Assembler::z_vlreph( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vlrep(v1, d2, x2, b2, VRET_HW); } // load HW and replicate to all vector elements of type 'H' +inline void Assembler::z_vlrepf( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vlrep(v1, d2, x2, b2, VRET_FW); } // load FW and replicate to all vector elements of type 'F' +inline void Assembler::z_vlrepg( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vlrep(v1, d2, x2, b2, VRET_DW); } // load DW and replicate to all vector elements of type 'G' + +inline void Assembler::z_vllez( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VLLEZ_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vllezb( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vllez(v1, d2, x2, b2, VRET_BYTE); }// load logical byte into left DW of VR, zero all other bit positions. +inline void Assembler::z_vllezh( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vllez(v1, d2, x2, b2, VRET_HW); } // load logical HW into left DW of VR, zero all other bit positions. +inline void Assembler::z_vllezf( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vllez(v1, d2, x2, b2, VRET_FW); } // load logical FW into left DW of VR, zero all other bit positions. +inline void Assembler::z_vllezg( VectorRegister v1, int64_t d2, Register x2, Register b2) {z_vllez(v1, d2, x2, b2, VRET_DW); } // load logical DW into left DW of VR, zero all other bit positions. + +inline void Assembler::z_vlbb( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VLBB_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | uimm4(m3, 32, 48)); } +inline void Assembler::z_vll( VectorRegister v1, Register r3, int64_t d2, Register b2) {emit_48(VLL_ZOPC | vreg(v1, 8) | reg(r3, 12, 48) | rsmask_48(d2, b2)); } + +// Load (register to register) +inline void Assembler::z_vlr ( VectorRegister v1, VectorRegister v2) {emit_48(VLR_ZOPC | vreg(v1, 8) | vreg(v2, 12)); } + +inline void Assembler::z_vlgv( Register r1, VectorRegister v3, int64_t d2, Register b2, int64_t m4) {emit_48(VLGV_ZOPC | reg(r1, 8, 48) | vreg(v3, 12) | rsmask_48(d2, b2) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vlgvb( Register r1, VectorRegister v3, int64_t d2, Register b2) {z_vlgv(r1, v3, d2, b2, VRET_BYTE); } // load byte from VR element (index d2(b2)) into GR (logical) +inline void Assembler::z_vlgvh( Register r1, VectorRegister v3, int64_t d2, Register b2) {z_vlgv(r1, v3, d2, b2, VRET_HW); } // load HW from VR element (index d2(b2)) into GR (logical) +inline void Assembler::z_vlgvf( Register r1, VectorRegister v3, int64_t d2, Register b2) {z_vlgv(r1, v3, d2, b2, VRET_FW); } // load FW from VR element (index d2(b2)) into GR (logical) +inline void Assembler::z_vlgvg( Register r1, VectorRegister v3, int64_t d2, Register b2) {z_vlgv(r1, v3, d2, b2, VRET_DW); } // load DW from VR element (index d2(b2)) into GR. + +inline void Assembler::z_vlvg( VectorRegister v1, Register r3, int64_t d2, Register b2, int64_t m4) {emit_48(VLVG_ZOPC | vreg(v1, 8) | reg(r3, 12, 48) | rsmask_48(d2, b2) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vlvgb( VectorRegister v1, Register r3, int64_t d2, Register b2) {z_vlvg(v1, r3, d2, b2, VRET_BYTE); } +inline void Assembler::z_vlvgh( VectorRegister v1, Register r3, int64_t d2, Register b2) {z_vlvg(v1, r3, d2, b2, VRET_HW); } +inline void Assembler::z_vlvgf( VectorRegister v1, Register r3, int64_t d2, Register b2) {z_vlvg(v1, r3, d2, b2, VRET_FW); } +inline void Assembler::z_vlvgg( VectorRegister v1, Register r3, int64_t d2, Register b2) {z_vlvg(v1, r3, d2, b2, VRET_DW); } + +inline void Assembler::z_vlvgp( VectorRegister v1, Register r2, Register r3) {emit_48(VLVGP_ZOPC | vreg(v1, 8) | reg(r2, 12, 48) | reg(r3, 16, 48)); } + +// vector register pack +inline void Assembler::z_vpk( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VPK_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_DW, 32)); } +inline void Assembler::z_vpkh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpk(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vpkf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpk(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vpkg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpk(v1, v2, v3, VRET_DW); } // vector element type 'G' + +inline void Assembler::z_vpks( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VPKS_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_DW, 32) | vccc_mask(cc5, 24)); } +inline void Assembler::z_vpksh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vpksf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vpksg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vpkshs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', set CC +inline void Assembler::z_vpksfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', set CC +inline void Assembler::z_vpksgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', set CC + +inline void Assembler::z_vpkls( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VPKLS_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_DW, 32) | vccc_mask(cc5, 24)); } +inline void Assembler::z_vpklsh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vpklsf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vpklsg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vpklshs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', set CC +inline void Assembler::z_vpklsfs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', set CC +inline void Assembler::z_vpklsgs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', set CC + +// vector register unpack (sign-extended) +inline void Assembler::z_vuph( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VUPH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vuphb( VectorRegister v1, VectorRegister v2) {z_vuph(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vuphh( VectorRegister v1, VectorRegister v2) {z_vuph(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vuphf( VectorRegister v1, VectorRegister v2) {z_vuph(v1, v2, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vupl( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VUPL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vuplb( VectorRegister v1, VectorRegister v2) {z_vupl(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vuplh( VectorRegister v1, VectorRegister v2) {z_vupl(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vuplf( VectorRegister v1, VectorRegister v2) {z_vupl(v1, v2, VRET_FW); } // vector element type 'F' + +// vector register unpack (zero-extended) +inline void Assembler::z_vuplh( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VUPLH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vuplhb( VectorRegister v1, VectorRegister v2) {z_vuplh(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vuplhh( VectorRegister v1, VectorRegister v2) {z_vuplh(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vuplhf( VectorRegister v1, VectorRegister v2) {z_vuplh(v1, v2, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vupll( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VUPLL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vupllb( VectorRegister v1, VectorRegister v2) {z_vupll(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vupllh( VectorRegister v1, VectorRegister v2) {z_vupll(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vupllf( VectorRegister v1, VectorRegister v2) {z_vupll(v1, v2, VRET_FW); } // vector element type 'F' + +// vector register merge high/low +inline void Assembler::z_vmrh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMRH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vmrhb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vmrhh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vmrhf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vmrhg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_DW); } // vector element type 'G' + +inline void Assembler::z_vmrl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMRL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vmrlb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vmrlh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vmrlf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vmrlg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmrh(v1, v2, v3, VRET_DW); } // vector element type 'G' + +// vector register permute +inline void Assembler::z_vperm( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4) {emit_48(VPERM_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32)); } +inline void Assembler::z_vpdi( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VPDI_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | uimm4(m4, 32, 48)); } + +// vector register replicate +inline void Assembler::z_vrep( VectorRegister v1, VectorRegister v3, int64_t imm2, int64_t m4) {emit_48(VREP_ZOPC | vreg(v1, 8) | vreg(v3, 12) | simm16(imm2, 16, 48) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vrepb( VectorRegister v1, VectorRegister v3, int64_t imm2) {z_vrep(v1, v3, imm2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vreph( VectorRegister v1, VectorRegister v3, int64_t imm2) {z_vrep(v1, v3, imm2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vrepf( VectorRegister v1, VectorRegister v3, int64_t imm2) {z_vrep(v1, v3, imm2, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vrepg( VectorRegister v1, VectorRegister v3, int64_t imm2) {z_vrep(v1, v3, imm2, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vrepi( VectorRegister v1, int64_t imm2, int64_t m3) {emit_48(VREPI_ZOPC | vreg(v1, 8) | simm16(imm2, 16, 48) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vrepib( VectorRegister v1, int64_t imm2) {z_vrepi(v1, imm2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vrepih( VectorRegister v1, int64_t imm2) {z_vrepi(v1, imm2, VRET_HW); } // vector element type 'B' +inline void Assembler::z_vrepif( VectorRegister v1, int64_t imm2) {z_vrepi(v1, imm2, VRET_FW); } // vector element type 'B' +inline void Assembler::z_vrepig( VectorRegister v1, int64_t imm2) {z_vrepi(v1, imm2, VRET_DW); } // vector element type 'B' + +inline void Assembler::z_vsel( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4) {emit_48(VSEL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32)); } +inline void Assembler::z_vseg( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VSEG_ZOPC | vreg(v1, 8) | vreg(v2, 12) | uimm4(m3, 32, 48)); } + +// Load (immediate) +inline void Assembler::z_vleib( VectorRegister v1, int64_t imm2, int64_t m3) {emit_48(VLEIB_ZOPC | vreg(v1, 8) | simm16(imm2, 32, 48) | veix_mask(m3, VRET_BYTE, 32)); } +inline void Assembler::z_vleih( VectorRegister v1, int64_t imm2, int64_t m3) {emit_48(VLEIH_ZOPC | vreg(v1, 8) | simm16(imm2, 32, 48) | veix_mask(m3, VRET_HW, 32)); } +inline void Assembler::z_vleif( VectorRegister v1, int64_t imm2, int64_t m3) {emit_48(VLEIF_ZOPC | vreg(v1, 8) | simm16(imm2, 32, 48) | veix_mask(m3, VRET_FW, 32)); } +inline void Assembler::z_vleig( VectorRegister v1, int64_t imm2, int64_t m3) {emit_48(VLEIG_ZOPC | vreg(v1, 8) | simm16(imm2, 32, 48) | veix_mask(m3, VRET_DW, 32)); } + +// Store +inline void Assembler::z_vstm( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {emit_48(VSTM_ZOPC | vreg(v1, 8) | vreg(v3, 12) | rsmask_48(d2, b2)); } +inline void Assembler::z_vst( VectorRegister v1, int64_t d2, Register x2, Register b2) {emit_48(VST_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2)); } +inline void Assembler::z_vsteb( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VSTEB_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_BYTE, 32)); } +inline void Assembler::z_vsteh( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VSTEH_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_HW, 32)); } +inline void Assembler::z_vstef( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VSTEF_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_FW, 32)); } +inline void Assembler::z_vsteg( VectorRegister v1, int64_t d2, Register x2, Register b2, int64_t m3) {emit_48(VSTEG_ZOPC | vreg(v1, 8) | rxmask_48(d2, x2, b2) | veix_mask(m3, VRET_DW, 32)); } +inline void Assembler::z_vstl( VectorRegister v1, Register r3, int64_t d2, Register b2) {emit_48(VSTL_ZOPC | vreg(v1, 8) | reg(r3, 12, 48) | rsmask_48(d2, b2)); } + +// Misc +inline void Assembler::z_vgm( VectorRegister v1, int64_t imm2, int64_t imm3, int64_t m4) {emit_48(VGM_ZOPC | vreg(v1, 8) | uimm8( imm2, 16, 48) | uimm8(imm3, 24, 48) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vgmb( VectorRegister v1, int64_t imm2, int64_t imm3) {z_vgm(v1, imm2, imm3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vgmh( VectorRegister v1, int64_t imm2, int64_t imm3) {z_vgm(v1, imm2, imm3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vgmf( VectorRegister v1, int64_t imm2, int64_t imm3) {z_vgm(v1, imm2, imm3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vgmg( VectorRegister v1, int64_t imm2, int64_t imm3) {z_vgm(v1, imm2, imm3, VRET_DW); } // vector element type 'G' + +inline void Assembler::z_vgbm( VectorRegister v1, int64_t imm2) {emit_48(VGBM_ZOPC | vreg(v1, 8) | uimm16(imm2, 16, 48)); } +inline void Assembler::z_vzero( VectorRegister v1) {z_vgbm(v1, 0); } // preferred method to set vreg to all zeroes +inline void Assembler::z_vone( VectorRegister v1) {z_vgbm(v1, 0xffff); } // preferred method to set vreg to all ones + +//---< Vector Arithmetic Instructions >--- + +// Load +inline void Assembler::z_vlc( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VLC_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vlcb( VectorRegister v1, VectorRegister v2) {z_vlc(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vlch( VectorRegister v1, VectorRegister v2) {z_vlc(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vlcf( VectorRegister v1, VectorRegister v2) {z_vlc(v1, v2, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vlcg( VectorRegister v1, VectorRegister v2) {z_vlc(v1, v2, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vlp( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VLP_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vlpb( VectorRegister v1, VectorRegister v2) {z_vlp(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vlph( VectorRegister v1, VectorRegister v2) {z_vlp(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vlpf( VectorRegister v1, VectorRegister v2) {z_vlp(v1, v2, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vlpg( VectorRegister v1, VectorRegister v2) {z_vlp(v1, v2, VRET_DW); } // vector element type 'G' + +// ADD +inline void Assembler::z_va( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VA_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_QW, 32)); } +inline void Assembler::z_vab( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_va(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vah( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_va(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vaf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_va(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vag( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_va(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vaq( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_va(v1, v2, v3, VRET_QW); } // vector element type 'Q' +inline void Assembler::z_vacc( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VACC_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_QW, 32)); } +inline void Assembler::z_vaccb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vacc(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vacch( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vacc(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vaccf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vacc(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vaccg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vacc(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vaccq( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vacc(v1, v2, v3, VRET_QW); } // vector element type 'Q' + +// SUB +inline void Assembler::z_vs( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VS_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_QW, 32)); } +inline void Assembler::z_vsb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vs(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vsh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vs(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vsf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vs(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vsg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vs(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vsq( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vs(v1, v2, v3, VRET_QW); } // vector element type 'Q' +inline void Assembler::z_vscbi( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VSCBI_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_QW, 32)); } +inline void Assembler::z_vscbib( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vscbi(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vscbih( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vscbi(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vscbif( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vscbi(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vscbig( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vscbi(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vscbiq( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vscbi(v1, v2, v3, VRET_QW); } // vector element type 'Q' + +// MULTIPLY +inline void Assembler::z_vml( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VML_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vmh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vmlh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMLH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vme( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VME_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vmle( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMLE_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vmo( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMO_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_FW, 32)); } +inline void Assembler::z_vmlo( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMLO_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_FW, 32)); } + +// MULTIPLY & ADD +inline void Assembler::z_vmal( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VMAL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(m5, VRET_BYTE, VRET_FW, 20)); } +inline void Assembler::z_vmah( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VMAH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(m5, VRET_BYTE, VRET_FW, 20)); } +inline void Assembler::z_vmalh( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VMALH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(m5, VRET_BYTE, VRET_FW, 20)); } +inline void Assembler::z_vmae( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VMAE_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(m5, VRET_BYTE, VRET_FW, 20)); } +inline void Assembler::z_vmale( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VMALE_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(m5, VRET_BYTE, VRET_FW, 20)); } +inline void Assembler::z_vmao( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VMAO_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(m5, VRET_BYTE, VRET_FW, 20)); } +inline void Assembler::z_vmalo( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VMALO_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(m5, VRET_BYTE, VRET_FW, 20)); } + +// VECTOR SUM +inline void Assembler::z_vsum( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VSUM_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_HW, 32)); } +inline void Assembler::z_vsumb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vsum(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vsumh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vsum(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vsumg( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VSUMG_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_FW, 32)); } +inline void Assembler::z_vsumgh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vsumg(v1, v2, v3, VRET_HW); } // vector element type 'B' +inline void Assembler::z_vsumgf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vsumg(v1, v2, v3, VRET_FW); } // vector element type 'H' +inline void Assembler::z_vsumq( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VSUMQ_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_FW, VRET_DW, 32)); } +inline void Assembler::z_vsumqf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vsumq(v1, v2, v3, VRET_FW); } // vector element type 'B' +inline void Assembler::z_vsumqg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vsumq(v1, v2, v3, VRET_DW); } // vector element type 'H' + +// Average +inline void Assembler::z_vavg( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VAVG_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vavgb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavg(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vavgh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavg(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vavgf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavg(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vavgg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavg(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vavgl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VAVGL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vavglb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavgl(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vavglh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavgl(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vavglf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavgl(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vavglg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vavgl(v1, v2, v3, VRET_DW); } // vector element type 'G' + +// VECTOR Galois Field Multiply Sum +inline void Assembler::z_vgfm( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VGFM_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vgfmb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vgfm(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vgfmh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vgfm(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vgfmf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vgfm(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vgfmg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vgfm(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vgfma( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t m5) {emit_48(VGFMA_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v3, 16) | vesc_mask(m5, VRET_BYTE, VRET_DW, 20)); } +inline void Assembler::z_vgfmab( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4) {z_vgfma(v1, v2, v3, v4, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vgfmah( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4) {z_vgfma(v1, v2, v3, v4, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vgfmaf( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4) {z_vgfma(v1, v2, v3, v4, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vgfmag( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4) {z_vgfma(v1, v2, v3, v4, VRET_DW); } // vector element type 'G' + +//---< Vector Logical Instructions >--- + +// AND +inline void Assembler::z_vn( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VN_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } +inline void Assembler::z_vnc( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VNC_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } + +// XOR +inline void Assembler::z_vx( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VX_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } + +// NOR +inline void Assembler::z_vno( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VNO_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } + +// OR +inline void Assembler::z_vo( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VO_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } + +// Comparison (element-wise) +inline void Assembler::z_vceq( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCEQ_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | vccc_mask(cc5, 24)); } +inline void Assembler::z_vceqb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_BYTE, VOP_CCIGN); } // vector element type 'B', don't set CC +inline void Assembler::z_vceqh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vceqf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vceqg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vceqbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_BYTE, VOP_CCSET); } // vector element type 'B', don't set CC +inline void Assembler::z_vceqhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', don't set CC +inline void Assembler::z_vceqfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', don't set CC +inline void Assembler::z_vceqgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', don't set CC +inline void Assembler::z_vch( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | vccc_mask(cc5, 24)); } +inline void Assembler::z_vchb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_BYTE, VOP_CCIGN); } // vector element type 'B', don't set CC +inline void Assembler::z_vchh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vchf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vchg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vchbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_BYTE, VOP_CCSET); } // vector element type 'B', don't set CC +inline void Assembler::z_vchhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', don't set CC +inline void Assembler::z_vchfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', don't set CC +inline void Assembler::z_vchgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', don't set CC +inline void Assembler::z_vchl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCHL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | vccc_mask(cc5, 24)); } +inline void Assembler::z_vchlb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_BYTE, VOP_CCIGN); } // vector element type 'B', don't set CC +inline void Assembler::z_vchlh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vchlf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vchlg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vchlbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_BYTE, VOP_CCSET); } // vector element type 'B', don't set CC +inline void Assembler::z_vchlhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', don't set CC +inline void Assembler::z_vchlfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', don't set CC +inline void Assembler::z_vchlgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', don't set CC + +// Max/Min (element-wise) +inline void Assembler::z_vmx( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMX_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vmxb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmx(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vmxh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmx(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vmxf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmx(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vmxg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmx(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vmxl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMXL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vmxlb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmxl(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vmxlh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmxl(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vmxlf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmxl(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vmxlg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmxl(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vmn( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMN_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vmnb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmn(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vmnh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmn(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vmnf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmn(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vmng( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmn(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vmnl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMNL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vmnlb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmnl(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vmnlh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmnl(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vmnlf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmnl(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vmnlg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vmnl(v1, v2, v3, VRET_DW); } // vector element type 'G' + +// Leading/Trailing Zeros, population count +inline void Assembler::z_vclz( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VCLZ_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vclzb( VectorRegister v1, VectorRegister v2) {z_vclz(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vclzh( VectorRegister v1, VectorRegister v2) {z_vclz(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vclzf( VectorRegister v1, VectorRegister v2) {z_vclz(v1, v2, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vclzg( VectorRegister v1, VectorRegister v2) {z_vclz(v1, v2, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vctz( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VCTZ_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vctzb( VectorRegister v1, VectorRegister v2) {z_vctz(v1, v2, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vctzh( VectorRegister v1, VectorRegister v2) {z_vctz(v1, v2, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vctzf( VectorRegister v1, VectorRegister v2) {z_vctz(v1, v2, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vctzg( VectorRegister v1, VectorRegister v2) {z_vctz(v1, v2, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vpopct( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VPOPCT_ZOPC| vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_DW, 32)); } + +// Rotate/Shift +inline void Assembler::z_verllv( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VERLLV_ZOPC| vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_verllvb(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_verllv(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_verllvh(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_verllv(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_verllvf(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_verllv(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_verllvg(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_verllv(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_verll( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4) {emit_48(VERLL_ZOPC | vreg(v1, 8) | vreg(v3, 12) | rsmask_48(d2, b2) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_verllb( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_verll(v1, v3, d2, b2, VRET_BYTE);}// vector element type 'B' +inline void Assembler::z_verllh( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_verll(v1, v3, d2, b2, VRET_HW);} // vector element type 'H' +inline void Assembler::z_verllf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_verll(v1, v3, d2, b2, VRET_FW);} // vector element type 'F' +inline void Assembler::z_verllg( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_verll(v1, v3, d2, b2, VRET_DW);} // vector element type 'G' +inline void Assembler::z_verim( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t m5) {emit_48(VERLL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | uimm8(imm4, 24, 48) | vesc_mask(m5, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_verimb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4) {z_verim(v1, v2, v3, imm4, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_verimh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4) {z_verim(v1, v2, v3, imm4, VRET_HW); } // vector element type 'H' +inline void Assembler::z_verimf( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4) {z_verim(v1, v2, v3, imm4, VRET_FW); } // vector element type 'F' +inline void Assembler::z_verimg( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4) {z_verim(v1, v2, v3, imm4, VRET_DW); } // vector element type 'G' + +inline void Assembler::z_veslv( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VESLV_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_veslvb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_veslv(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_veslvh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_veslv(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_veslvf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_veslv(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_veslvg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_veslv(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vesl( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4) {emit_48(VESL_ZOPC | vreg(v1, 8) | vreg(v3, 12) | rsmask_48(d2, b2) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_veslb( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesl(v1, v3, d2, b2, VRET_BYTE);} // vector element type 'B' +inline void Assembler::z_veslh( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesl(v1, v3, d2, b2, VRET_HW);} // vector element type 'H' +inline void Assembler::z_veslf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesl(v1, v3, d2, b2, VRET_FW);} // vector element type 'F' +inline void Assembler::z_veslg( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesl(v1, v3, d2, b2, VRET_DW);} // vector element type 'G' + +inline void Assembler::z_vesrav( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VESRAV_ZOPC| vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vesravb(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrav(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vesravh(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrav(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vesravf(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrav(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vesravg(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrav(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vesra( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4) {emit_48(VESRA_ZOPC | vreg(v1, 8) | vreg(v3, 12) | rsmask_48(d2, b2) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vesrab( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesra(v1, v3, d2, b2, VRET_BYTE);}// vector element type 'B' +inline void Assembler::z_vesrah( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesra(v1, v3, d2, b2, VRET_HW);} // vector element type 'H' +inline void Assembler::z_vesraf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesra(v1, v3, d2, b2, VRET_FW);} // vector element type 'F' +inline void Assembler::z_vesrag( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesra(v1, v3, d2, b2, VRET_DW);} // vector element type 'G' +inline void Assembler::z_vesrlv( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VESRLV_ZOPC| vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vesrlvb(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrlv(v1, v2, v3, VRET_BYTE); } // vector element type 'B' +inline void Assembler::z_vesrlvh(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrlv(v1, v2, v3, VRET_HW); } // vector element type 'H' +inline void Assembler::z_vesrlvf(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrlv(v1, v2, v3, VRET_FW); } // vector element type 'F' +inline void Assembler::z_vesrlvg(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vesrlv(v1, v2, v3, VRET_DW); } // vector element type 'G' +inline void Assembler::z_vesrl( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2, int64_t m4) {emit_48(VESRL_ZOPC | vreg(v1, 8) | vreg(v3, 12) | rsmask_48(d2, b2) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } +inline void Assembler::z_vesrlb( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesrl(v1, v3, d2, b2, VRET_BYTE);}// vector element type 'B' +inline void Assembler::z_vesrlh( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesrl(v1, v3, d2, b2, VRET_HW);} // vector element type 'H' +inline void Assembler::z_vesrlf( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesrl(v1, v3, d2, b2, VRET_FW);} // vector element type 'F' +inline void Assembler::z_vesrlg( VectorRegister v1, VectorRegister v3, int64_t d2, Register b2) {z_vesrl(v1, v3, d2, b2, VRET_DW);} // vector element type 'G' + +inline void Assembler::z_vsl( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VSL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } +inline void Assembler::z_vslb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VSLB_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } +inline void Assembler::z_vsldb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4) {emit_48(VSLDB_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | uimm8(imm4, 24, 48)); } + +inline void Assembler::z_vsra( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VSRA_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } +inline void Assembler::z_vsrab( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VSRAB_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } +inline void Assembler::z_vsrl( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VSRL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } +inline void Assembler::z_vsrlb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VSRLB_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } + +// Test under Mask +inline void Assembler::z_vtm( VectorRegister v1, VectorRegister v2) {emit_48(VTM_ZOPC | vreg(v1, 8) | vreg(v2, 12)); } + + //------------------------------- // FLOAT INSTRUCTIONS //------------------------------- diff --git a/src/hotspot/cpu/s390/register_definitions_s390.cpp b/src/hotspot/cpu/s390/register_definitions_s390.cpp index 99116f5399b..2378d513799 100644 --- a/src/hotspot/cpu/s390/register_definitions_s390.cpp +++ b/src/hotspot/cpu/s390/register_definitions_s390.cpp @@ -1,6 +1,6 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. - * Copyright (c) 2016 SAP SE. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -35,3 +35,5 @@ REGISTER_DEFINITION(Register, noreg); REGISTER_DEFINITION(FloatRegister, fnoreg); + +REGISTER_DEFINITION(VectorRegister, vnoreg); diff --git a/src/hotspot/cpu/s390/register_s390.cpp b/src/hotspot/cpu/s390/register_s390.cpp index 1746da9f150..853b5642470 100644 --- a/src/hotspot/cpu/s390/register_s390.cpp +++ b/src/hotspot/cpu/s390/register_s390.cpp @@ -1,6 +1,6 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. - * Copyright (c) 2016 SAP SE. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -46,3 +46,13 @@ const char* FloatRegisterImpl::name() const { }; return is_valid() ? names[encoding()] : "fnoreg"; } + +const char* VectorRegisterImpl::name() const { + const char* names[number_of_registers] = { + "Z_V0", "Z_V1", "Z_V2", "Z_V3", "Z_V4", "Z_V5", "Z_V6", "Z_V7", + "Z_V8", "Z_V9", "Z_V10", "Z_V11", "Z_V12", "Z_V13", "Z_V14", "Z_V15", + "Z_V16", "Z_V17", "Z_V18", "Z_V19", "Z_V20", "Z_V21", "Z_V22", "Z_V23", + "Z_V24", "Z_V25", "Z_V26", "Z_V27", "Z_V28", "Z_V29", "Z_V30", "Z_V31" + }; + return is_valid() ? names[encoding()] : "fnoreg"; +} diff --git a/src/hotspot/cpu/s390/register_s390.hpp b/src/hotspot/cpu/s390/register_s390.hpp index 4c61174a613..f8f218e1dd6 100644 --- a/src/hotspot/cpu/s390/register_s390.hpp +++ b/src/hotspot/cpu/s390/register_s390.hpp @@ -1,6 +1,6 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. - * Copyright (c) 2016 SAP SE. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -34,11 +34,6 @@ class VMRegImpl; typedef VMRegImpl* VMReg; -// Use Register as shortcut. -class RegisterImpl; -typedef RegisterImpl* Register; - -// The implementation of integer registers for z/Architecture. // z/Architecture registers, see "LINUX for zSeries ELF ABI Supplement", IBM March 2001 // @@ -57,6 +52,17 @@ typedef RegisterImpl* Register; // f1,f3,f5,f7 General purpose (volatile) // f8-f15 General purpose (nonvolatile) + +//=========================== +//=== Integer Registers === +//=========================== + +// Use Register as shortcut. +class RegisterImpl; +typedef RegisterImpl* Register; + +// The implementation of integer registers for z/Architecture. + inline Register as_Register(int encoding) { return (Register)(long)encoding; } @@ -110,6 +116,11 @@ CONSTANT_REGISTER_DECLARATION(Register, Z_R13, (13)); CONSTANT_REGISTER_DECLARATION(Register, Z_R14, (14)); CONSTANT_REGISTER_DECLARATION(Register, Z_R15, (15)); + +//============================= +//=== Condition Registers === +//============================= + // Use ConditionRegister as shortcut class ConditionRegisterImpl; typedef ConditionRegisterImpl* ConditionRegister; @@ -159,7 +170,7 @@ CONSTANT_REGISTER_DECLARATION(ConditionRegister, Z_CR, (0)); // dangers of defines. // If a particular file has a problem with these defines then it's possible // to turn them off in that file by defining -// DONT_USE_REGISTER_DEFINES. Register_definition_s390.cpp does that +// DONT_USE_REGISTER_DEFINES. Register_definitions_s390.cpp does that // so that it's able to provide real definitions of these registers // for use in debuggers and such. @@ -186,6 +197,11 @@ CONSTANT_REGISTER_DECLARATION(ConditionRegister, Z_CR, (0)); #define Z_CR ((ConditionRegister)(Z_CR_ConditionRegisterEnumValue)) #endif // DONT_USE_REGISTER_DEFINES + +//========================= +//=== Float Registers === +//========================= + // Use FloatRegister as shortcut class FloatRegisterImpl; typedef FloatRegisterImpl* FloatRegister; @@ -263,22 +279,6 @@ CONSTANT_REGISTER_DECLARATION(FloatRegister, Z_F15, (15)); #define Z_F15 ((FloatRegister)( Z_F15_FloatRegisterEnumValue)) #endif // DONT_USE_REGISTER_DEFINES -// Need to know the total number of registers of all sorts for SharedInfo. -// Define a class that exports it. - -class ConcreteRegisterImpl : public AbstractRegisterImpl { - public: - enum { - number_of_registers = - (RegisterImpl::number_of_registers + - FloatRegisterImpl::number_of_registers) - * 2 // register halves - + 1 // condition code register - }; - static const int max_gpr; - static const int max_fpr; -}; - // Single, Double and Quad fp reg classes. These exist to map the ADLC // encoding for a floating point register, to the FloatRegister number // desired by the macroassembler. A FloatRegister is a number between @@ -329,6 +329,161 @@ class QuadFloatRegisterImpl { }; +//========================== +//=== Vector Registers === +//========================== + +// Use VectorRegister as shortcut +class VectorRegisterImpl; +typedef VectorRegisterImpl* VectorRegister; + +// The implementation of vector registers for z/Architecture. + +inline VectorRegister as_VectorRegister(int encoding) { + return (VectorRegister)(long)encoding; +} + +class VectorRegisterImpl: public AbstractRegisterImpl { + public: + enum { + number_of_registers = 32, + number_of_arg_registers = 0 + }; + + // construction + inline friend VectorRegister as_VectorRegister(int encoding); + + inline VMReg as_VMReg(); + + // accessors + int encoding() const { + assert(is_valid(), "invalid register"); return value(); + } + + bool is_valid() const { return 0 <= value() && value() < number_of_registers; } + bool is_volatile() const { return true; } + bool is_nonvolatile() const { return false; } + + // Register fields in z/Architecture instructions are 4 bits wide, restricting the + // addressable register set size to 16. + // The vector register set size is 32, requiring an extension, by one bit, of the + // register encoding. This is accomplished by the introduction of a RXB field in the + // instruction. RXB = Register eXtension Bits. + // The RXB field contains the MSBs (most significant bit) of the vector register numbers + // used for this instruction. Assignment of MSB in RBX is by bit position of the + // register field in the instruction. + // Example: + // The register field starting at bit position 12 in the instruction is assigned RXB bit 0b0100. + int64_t RXB_mask(int pos) { + if (encoding() >= number_of_registers/2) { + switch (pos) { + case 8: return ((int64_t)0b1000) << 8; // actual bit pos: 36 + case 12: return ((int64_t)0b0100) << 8; // actual bit pos: 37 + case 16: return ((int64_t)0b0010) << 8; // actual bit pos: 38 + case 32: return ((int64_t)0b0001) << 8; // actual bit pos: 39 + default: + ShouldNotReachHere(); + } + } + return 0; + } + + const char* name() const; + + VectorRegister successor() const { return as_VectorRegister(encoding() + 1); } +}; + +// The Vector registers of z/Architecture. + +CONSTANT_REGISTER_DECLARATION(VectorRegister, vnoreg, (-1)); + +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V0, (0)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V1, (1)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V2, (2)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V3, (3)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V4, (4)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V5, (5)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V6, (6)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V7, (7)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V8, (8)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V9, (9)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V10, (10)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V11, (11)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V12, (12)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V13, (13)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V14, (14)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V15, (15)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V16, (16)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V17, (17)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V18, (18)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V19, (19)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V20, (20)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V21, (21)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V22, (22)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V23, (23)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V24, (24)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V25, (25)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V26, (26)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V27, (27)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V28, (28)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V29, (29)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V30, (30)); +CONSTANT_REGISTER_DECLARATION(VectorRegister, Z_V31, (31)); + +#ifndef DONT_USE_REGISTER_DEFINES +#define vnoreg ((VectorRegister)(vnoreg_VectorRegisterEnumValue)) +#define Z_V0 ((VectorRegister)( Z_V0_VectorRegisterEnumValue)) +#define Z_V1 ((VectorRegister)( Z_V1_VectorRegisterEnumValue)) +#define Z_V2 ((VectorRegister)( Z_V2_VectorRegisterEnumValue)) +#define Z_V3 ((VectorRegister)( Z_V3_VectorRegisterEnumValue)) +#define Z_V4 ((VectorRegister)( Z_V4_VectorRegisterEnumValue)) +#define Z_V5 ((VectorRegister)( Z_V5_VectorRegisterEnumValue)) +#define Z_V6 ((VectorRegister)( Z_V6_VectorRegisterEnumValue)) +#define Z_V7 ((VectorRegister)( Z_V7_VectorRegisterEnumValue)) +#define Z_V8 ((VectorRegister)( Z_V8_VectorRegisterEnumValue)) +#define Z_V9 ((VectorRegister)( Z_V9_VectorRegisterEnumValue)) +#define Z_V10 ((VectorRegister)( Z_V10_VectorRegisterEnumValue)) +#define Z_V11 ((VectorRegister)( Z_V11_VectorRegisterEnumValue)) +#define Z_V12 ((VectorRegister)( Z_V12_VectorRegisterEnumValue)) +#define Z_V13 ((VectorRegister)( Z_V13_VectorRegisterEnumValue)) +#define Z_V14 ((VectorRegister)( Z_V14_VectorRegisterEnumValue)) +#define Z_V15 ((VectorRegister)( Z_V15_VectorRegisterEnumValue)) +#define Z_V16 ((VectorRegister)( Z_V16_VectorRegisterEnumValue)) +#define Z_V17 ((VectorRegister)( Z_V17_VectorRegisterEnumValue)) +#define Z_V18 ((VectorRegister)( Z_V18_VectorRegisterEnumValue)) +#define Z_V19 ((VectorRegister)( Z_V19_VectorRegisterEnumValue)) +#define Z_V20 ((VectorRegister)( Z_V20_VectorRegisterEnumValue)) +#define Z_V21 ((VectorRegister)( Z_V21_VectorRegisterEnumValue)) +#define Z_V22 ((VectorRegister)( Z_V22_VectorRegisterEnumValue)) +#define Z_V23 ((VectorRegister)( Z_V23_VectorRegisterEnumValue)) +#define Z_V24 ((VectorRegister)( Z_V24_VectorRegisterEnumValue)) +#define Z_V25 ((VectorRegister)( Z_V25_VectorRegisterEnumValue)) +#define Z_V26 ((VectorRegister)( Z_V26_VectorRegisterEnumValue)) +#define Z_V27 ((VectorRegister)( Z_V27_VectorRegisterEnumValue)) +#define Z_V28 ((VectorRegister)( Z_V28_VectorRegisterEnumValue)) +#define Z_V29 ((VectorRegister)( Z_V29_VectorRegisterEnumValue)) +#define Z_V30 ((VectorRegister)( Z_V30_VectorRegisterEnumValue)) +#define Z_V31 ((VectorRegister)( Z_V31_VectorRegisterEnumValue)) +#endif // DONT_USE_REGISTER_DEFINES + + +// Need to know the total number of registers of all sorts for SharedInfo. +// Define a class that exports it. + +class ConcreteRegisterImpl : public AbstractRegisterImpl { + public: + enum { + number_of_registers = + (RegisterImpl::number_of_registers + + FloatRegisterImpl::number_of_registers) + * 2 // register halves + + 1 // condition code register + }; + static const int max_gpr; + static const int max_fpr; +}; + + // Common register declarations used in assembler code. REGISTER_DECLARATION(Register, Z_EXC_OOP, Z_R2); REGISTER_DECLARATION(Register, Z_EXC_PC, Z_R3); From 737c0cd7a53bd1e0d8315bdd9f32c4e1991197ce Mon Sep 17 00:00:00 2001 From: Chris Plummer Date: Tue, 26 Sep 2017 10:09:54 -0700 Subject: [PATCH 09/80] 8179498: attach in linux should be relative to /proc/pid/root and namespace aware Map pid to namespace pid so proper tmp file name is used. Reviewed-by: sspitsyn, dholmes --- .../sun/tools/attach/VirtualMachineImpl.java | 72 ++++++++++++++++--- 1 file changed, 63 insertions(+), 9 deletions(-) diff --git a/src/jdk.attach/linux/classes/sun/tools/attach/VirtualMachineImpl.java b/src/jdk.attach/linux/classes/sun/tools/attach/VirtualMachineImpl.java index 4a5fbdd1294..5b021b58c88 100644 --- a/src/jdk.attach/linux/classes/sun/tools/attach/VirtualMachineImpl.java +++ b/src/jdk.attach/linux/classes/sun/tools/attach/VirtualMachineImpl.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2005, 2014, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2005, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -32,6 +32,10 @@ import com.sun.tools.attach.spi.AttachProvider; import java.io.InputStream; import java.io.IOException; import java.io.File; +import java.nio.charset.StandardCharsets; +import java.nio.file.Path; +import java.nio.file.Paths; +import java.nio.file.Files; /* * Linux implementation of HotSpotVirtualMachine @@ -63,12 +67,15 @@ public class VirtualMachineImpl extends HotSpotVirtualMachine { throw new AttachNotSupportedException("Invalid process identifier"); } + // Try to resolve to the "inner most" pid namespace + int ns_pid = getNamespacePid(pid); + // Find the socket file. If not found then we attempt to start the // attach mechanism in the target VM by sending it a QUIT signal. // Then we attempt to find the socket file again. - path = findSocketFile(pid); + path = findSocketFile(pid, ns_pid); if (path == null) { - File f = createAttachFile(pid); + File f = createAttachFile(pid, ns_pid); try { sendQuitTo(pid); @@ -83,7 +90,7 @@ public class VirtualMachineImpl extends HotSpotVirtualMachine { try { Thread.sleep(delay); } catch (InterruptedException x) { } - path = findSocketFile(pid); + path = findSocketFile(pid, ns_pid); time_spend += delay; if (time_spend > timeout/2 && path == null) { @@ -262,8 +269,12 @@ public class VirtualMachineImpl extends HotSpotVirtualMachine { } // Return the socket file for the given process. - private String findSocketFile(int pid) { - File f = new File(tmpdir, ".java_pid" + pid); + private String findSocketFile(int pid, int ns_pid) { + // A process may not exist in the same mount namespace as the caller. + // Instead, attach relative to the target root filesystem as exposed by + // procfs regardless of namespaces. + String root = "/proc/" + pid + "/root/" + tmpdir; + File f = new File(root, ".java_pid" + ns_pid); if (!f.exists()) { return null; } @@ -274,14 +285,23 @@ public class VirtualMachineImpl extends HotSpotVirtualMachine { // if not already started. The client creates a .attach_pid file in the // target VM's working directory (or temp directory), and the SIGQUIT handler // checks for the file. - private File createAttachFile(int pid) throws IOException { - String fn = ".attach_pid" + pid; + private File createAttachFile(int pid, int ns_pid) throws IOException { + String fn = ".attach_pid" + ns_pid; String path = "/proc/" + pid + "/cwd/" + fn; File f = new File(path); try { f.createNewFile(); } catch (IOException x) { - f = new File(tmpdir, fn); + String root; + if (pid != ns_pid) { + // A process may not exist in the same mount namespace as the caller. + // Instead, attach relative to the target root filesystem as exposed by + // procfs regardless of namespaces. + root = "/proc/" + pid + "/root/" + tmpdir; + } else { + root = tmpdir; + } + f = new File(root, fn); f.createNewFile(); } return f; @@ -307,6 +327,40 @@ public class VirtualMachineImpl extends HotSpotVirtualMachine { } + // Return the inner most namespaced PID if there is one, + // otherwise return the original PID. + private int getNamespacePid(int pid) throws AttachNotSupportedException, IOException { + // Assuming a real procfs sits beneath, reading this doesn't block + // nor will it consume a lot of memory. + String statusFile = "/proc/" + pid + "/status"; + File f = new File(statusFile); + if (!f.exists()) { + return pid; // Likely a bad pid, but this is properly handled later. + } + + Path statusPath = Paths.get(statusFile); + + try { + for (String line : Files.readAllLines(statusPath, StandardCharsets.UTF_8)) { + String[] parts = line.split(":"); + if (parts.length == 2 && parts[0].trim().equals("NSpid")) { + parts = parts[1].trim().split("\\s+"); + // The last entry represents the PID the JVM "thinks" it is. + // Even in non-namespaced pids these entries should be + // valid. You could refer to it as the inner most pid. + int ns_pid = Integer.parseInt(parts[parts.length - 1]); + return ns_pid; + } + } + // Old kernels may not have NSpid field (i.e. 3.10). + // Fallback to original pid in the event we cannot deduce. + return pid; + } catch (NumberFormatException | IOException x) { + throw new AttachNotSupportedException("Unable to parse namespace"); + } + } + + //-- native methods static native void sendQuitToChildrenOf(int pid) throws IOException; From 2a93b38ee95ef635c2736d1637a710f0fed702de Mon Sep 17 00:00:00 2001 From: Calvin Cheung Date: Tue, 26 Sep 2017 19:31:06 -0700 Subject: [PATCH 10/80] 8187124: [TESTBUG] TestInterpreterMethodEntries.java: Unable to create shared archive file Added the current timestamp into the shared archive file name Reviewed-by: mseledtsov, gtriantafill --- test/lib/jdk/test/lib/cds/CDSTestUtils.java | 16 +++++++++++++++- 1 file changed, 15 insertions(+), 1 deletion(-) diff --git a/test/lib/jdk/test/lib/cds/CDSTestUtils.java b/test/lib/jdk/test/lib/cds/CDSTestUtils.java index 16a32056ff3..8d0f9ef4bcb 100644 --- a/test/lib/jdk/test/lib/cds/CDSTestUtils.java +++ b/test/lib/jdk/test/lib/cds/CDSTestUtils.java @@ -26,7 +26,9 @@ import java.io.IOException; import java.io.File; import java.io.FileOutputStream; import java.io.PrintStream; +import java.text.SimpleDateFormat; import java.util.ArrayList; +import java.util.Date; import jdk.test.lib.Utils; import jdk.test.lib.process.OutputAnalyzer; import jdk.test.lib.process.ProcessTools; @@ -60,6 +62,8 @@ public class CDSTestUtils { public static OutputAnalyzer createArchive(CDSOptions opts) throws Exception { + startNewArchiveName(); + ArrayList cmd = new ArrayList(); for (String p : opts.prefix) cmd.add(p); @@ -328,9 +332,19 @@ public class CDSTestUtils { return testName; } + private static final SimpleDateFormat timeStampFormat = + new SimpleDateFormat("HH'h'mm'm'ss's'SSS"); + + private static String defaultArchiveName; + + // Call this method to start new archive with new unique name + public static void startNewArchiveName() { + defaultArchiveName = getTestName() + + timeStampFormat.format(new Date()) + ".jsa"; + } public static String getDefaultArchiveName() { - return getTestName() + ".jsa"; + return defaultArchiveName; } From 52c73dd8a99cf8d29fe9541e5bcdfd8c7a848637 Mon Sep 17 00:00:00 2001 From: Stefan Johansson Date: Thu, 21 Sep 2017 14:32:05 +0200 Subject: [PATCH 11/80] 8184286: print_tracing_info() does not use Unified Logging for output Reviewed-by: ehelin, sangheki --- .../gc/parallel/parallelScavengeHeap.cpp | 14 ++++--------- src/hotspot/share/gc/parallel/psMarkSweep.cpp | 8 ++++++-- .../share/gc/parallel/psParallelCompact.cpp | 6 ++++-- src/hotspot/share/gc/parallel/psScavenge.cpp | 8 ++++++-- .../share/gc/shared/genCollectedHeap.cpp | 9 ++++----- src/hotspot/share/gc/shared/generation.cpp | 20 ++++++------------- src/hotspot/share/gc/shared/generation.hpp | 3 +-- src/hotspot/share/runtime/globals.hpp | 6 ------ 8 files changed, 31 insertions(+), 43 deletions(-) diff --git a/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp b/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp index dba08b5a92a..d3f960dfaae 100644 --- a/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp +++ b/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2001, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2001, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -574,16 +574,10 @@ void ParallelScavengeHeap::print_gc_threads_on(outputStream* st) const { } void ParallelScavengeHeap::print_tracing_info() const { - if (TraceYoungGenTime) { - double time = PSScavenge::accumulated_time()->seconds(); - tty->print_cr("[Accumulated GC generation 0 time %3.7f secs]", time); - } - if (TraceOldGenTime) { - double time = UseParallelOldGC ? PSParallelCompact::accumulated_time()->seconds() : PSMarkSweep::accumulated_time()->seconds(); - tty->print_cr("[Accumulated GC generation 1 time %3.7f secs]", time); - } - AdaptiveSizePolicyOutput::print(); + log_debug(gc, heap, exit)("Accumulated young generation GC time %3.7f secs", PSScavenge::accumulated_time()->seconds()); + log_debug(gc, heap, exit)("Accumulated old generation GC time %3.7f secs", + UseParallelOldGC ? PSParallelCompact::accumulated_time()->seconds() : PSMarkSweep::accumulated_time()->seconds()); } diff --git a/src/hotspot/share/gc/parallel/psMarkSweep.cpp b/src/hotspot/share/gc/parallel/psMarkSweep.cpp index 76f0d444f6f..3991d20674b 100644 --- a/src/hotspot/share/gc/parallel/psMarkSweep.cpp +++ b/src/hotspot/share/gc/parallel/psMarkSweep.cpp @@ -173,7 +173,9 @@ bool PSMarkSweep::invoke_no_policy(bool clear_all_softrefs) { TraceCollectorStats tcs(counters()); TraceMemoryManagerStats tms(true /* Full GC */,gc_cause); - if (TraceOldGenTime) accumulated_time()->start(); + if (log_is_enabled(Debug, gc, heap, exit)) { + accumulated_time()->start(); + } // Let the size policy know we're starting size_policy->major_collection_begin(); @@ -342,7 +344,9 @@ bool PSMarkSweep::invoke_no_policy(bool clear_all_softrefs) { // We collected the heap, recalculate the metaspace capacity MetaspaceGC::compute_new_size(); - if (TraceOldGenTime) accumulated_time()->stop(); + if (log_is_enabled(Debug, gc, heap, exit)) { + accumulated_time()->stop(); + } young_gen->print_used_change(young_gen_prev_used); old_gen->print_used_change(old_gen_prev_used); diff --git a/src/hotspot/share/gc/parallel/psParallelCompact.cpp b/src/hotspot/share/gc/parallel/psParallelCompact.cpp index ae04316cb3e..0678ee5b65b 100644 --- a/src/hotspot/share/gc/parallel/psParallelCompact.cpp +++ b/src/hotspot/share/gc/parallel/psParallelCompact.cpp @@ -1778,7 +1778,9 @@ bool PSParallelCompact::invoke_no_policy(bool maximum_heap_compaction) { TraceCollectorStats tcs(counters()); TraceMemoryManagerStats tms(true /* Full GC */,gc_cause); - if (TraceOldGenTime) accumulated_time()->start(); + if (log_is_enabled(Debug, gc, heap, exit)) { + accumulated_time()->start(); + } // Let the size policy know we're starting size_policy->major_collection_begin(); @@ -1897,7 +1899,7 @@ bool PSParallelCompact::invoke_no_policy(bool maximum_heap_compaction) { // Resize the metaspace capacity after a collection MetaspaceGC::compute_new_size(); - if (TraceOldGenTime) { + if (log_is_enabled(Debug, gc, heap, exit)) { accumulated_time()->stop(); } diff --git a/src/hotspot/share/gc/parallel/psScavenge.cpp b/src/hotspot/share/gc/parallel/psScavenge.cpp index db50e7bcf7b..0db1dee2061 100644 --- a/src/hotspot/share/gc/parallel/psScavenge.cpp +++ b/src/hotspot/share/gc/parallel/psScavenge.cpp @@ -306,7 +306,9 @@ bool PSScavenge::invoke_no_policy() { TraceCollectorStats tcs(counters()); TraceMemoryManagerStats tms(false /* not full GC */,gc_cause); - if (TraceYoungGenTime) accumulated_time()->start(); + if (log_is_enabled(Debug, gc, heap, exit)) { + accumulated_time()->start(); + } // Let the size policy know we're starting size_policy->minor_collection_begin(); @@ -607,7 +609,9 @@ bool PSScavenge::invoke_no_policy() { CardTableExtension::verify_all_young_refs_imprecise(); } - if (TraceYoungGenTime) accumulated_time()->stop(); + if (log_is_enabled(Debug, gc, heap, exit)) { + accumulated_time()->stop(); + } young_gen->print_used_change(pre_gc_values.young_gen_used()); old_gen->print_used_change(pre_gc_values.old_gen_used()); diff --git a/src/hotspot/share/gc/shared/genCollectedHeap.cpp b/src/hotspot/share/gc/shared/genCollectedHeap.cpp index eb98e3f2595..139fc32f2a6 100644 --- a/src/hotspot/share/gc/shared/genCollectedHeap.cpp +++ b/src/hotspot/share/gc/shared/genCollectedHeap.cpp @@ -1157,11 +1157,10 @@ void GenCollectedHeap::print_on_error(outputStream* st) const { } void GenCollectedHeap::print_tracing_info() const { - if (TraceYoungGenTime) { - _young_gen->print_summary_info(); - } - if (TraceOldGenTime) { - _old_gen->print_summary_info(); + if (log_is_enabled(Debug, gc, heap, exit)) { + LogStreamHandle(Debug, gc, heap, exit) lsh; + _young_gen->print_summary_info_on(&lsh); + _old_gen->print_summary_info_on(&lsh); } } diff --git a/src/hotspot/share/gc/shared/generation.cpp b/src/hotspot/share/gc/shared/generation.cpp index d86103ae077..68c92230729 100644 --- a/src/hotspot/share/gc/shared/generation.cpp +++ b/src/hotspot/share/gc/shared/generation.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 1997, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -94,22 +94,14 @@ void Generation::print_on(outputStream* st) const { p2i(_virtual_space.high_boundary())); } -void Generation::print_summary_info() { print_summary_info_on(tty); } - void Generation::print_summary_info_on(outputStream* st) { StatRecord* sr = stat_record(); double time = sr->accumulated_time.seconds(); - // I didn't want to change the logging when removing the level concept, - // but I guess this logging could say young/old or something instead of 0/1. - uint level; - if (GenCollectedHeap::heap()->is_young_gen(this)) { - level = 0; - } else { - level = 1; - } - st->print_cr("[Accumulated GC generation %d time %3.7f secs, " - "%u GC's, avg GC time %3.7f]", - level, time, sr->invocations, + st->print_cr("Accumulated %s generation GC time %3.7f secs, " + "%u GC's, avg GC time %3.7f", + GenCollectedHeap::heap()->is_young_gen(this) ? "young" : "old" , + time, + sr->invocations, sr->invocations > 0 ? time / sr->invocations : 0.0); } diff --git a/src/hotspot/share/gc/shared/generation.hpp b/src/hotspot/share/gc/shared/generation.hpp index 7507e7763b3..00d17a22a33 100644 --- a/src/hotspot/share/gc/shared/generation.hpp +++ b/src/hotspot/share/gc/shared/generation.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 1997, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -549,7 +549,6 @@ private: public: StatRecord* stat_record() { return &_stat_record; } - virtual void print_summary_info(); virtual void print_summary_info_on(outputStream* st); // Performance Counter support diff --git a/src/hotspot/share/runtime/globals.hpp b/src/hotspot/share/runtime/globals.hpp index 7e9dc8768f3..d5cd34f9434 100644 --- a/src/hotspot/share/runtime/globals.hpp +++ b/src/hotspot/share/runtime/globals.hpp @@ -2344,12 +2344,6 @@ public: range(30*K, max_uintx/BytesPerWord) \ constraint(InitialBootClassLoaderMetaspaceSizeConstraintFunc, AfterErgo)\ \ - product(bool, TraceYoungGenTime, false, \ - "Trace accumulated time for young collection") \ - \ - product(bool, TraceOldGenTime, false, \ - "Trace accumulated time for old collection") \ - \ product(bool, PrintHeapAtSIGBREAK, true, \ "Print heap layout in response to SIGBREAK") \ \ From da300604af06cecef50fcb85e7af8cbf8b35ee51 Mon Sep 17 00:00:00 2001 From: John Paul Adrian Glaubitz Date: Wed, 27 Sep 2017 17:01:34 +0200 Subject: [PATCH 12/80] 8186578: Zero fails to build on linux-sparc due to sparc-specific code Reviewed-by: kbarrett, ihse, coleenp --- make/hotspot/lib/JvmFeatures.gmk | 3 +++ src/hotspot/share/compiler/oopMap.cpp | 5 +---- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/make/hotspot/lib/JvmFeatures.gmk b/make/hotspot/lib/JvmFeatures.gmk index 3880e685fe3..e7c4e1c1840 100644 --- a/make/hotspot/lib/JvmFeatures.gmk +++ b/make/hotspot/lib/JvmFeatures.gmk @@ -47,6 +47,9 @@ endif ifeq ($(call check-jvm-feature, zero), true) JVM_CFLAGS_FEATURES += -DZERO -DCC_INTERP -DZERO_LIBARCH='"$(OPENJDK_TARGET_CPU_LEGACY_LIB)"' $(LIBFFI_CFLAGS) JVM_LIBS_FEATURES += $(LIBFFI_LIBS) + ifeq ($(OPENJDK_TARGET_CPU), sparcv9) + BUILD_LIBJVM_EXTRA_FILES := $(TOPDIR)/src/hotspot/cpu/sparc/memset_with_concurrent_readers_sparc.cpp + endif endif ifeq ($(call check-jvm-feature, shark), true) diff --git a/src/hotspot/share/compiler/oopMap.cpp b/src/hotspot/share/compiler/oopMap.cpp index 7759615c4ce..e218a2d045e 100644 --- a/src/hotspot/share/compiler/oopMap.cpp +++ b/src/hotspot/share/compiler/oopMap.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 1998, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1998, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -40,9 +40,6 @@ #ifdef COMPILER2 #include "opto/optoreg.hpp" #endif -#ifdef SPARC -#include "vmreg_sparc.inline.hpp" -#endif // OopMapStream From 92ad2630a12ef81877ad5dbae2ac012c13dea63f Mon Sep 17 00:00:00 2001 From: Jiangli Zhou Date: Wed, 27 Sep 2017 17:55:20 -0400 Subject: [PATCH 13/80] 8068314: "Java fields that are currently set during shared space dumping" comment is incorrect CDS dump time should also initialize preallocated out_of_memory error messages. Reviewed-by: iklam, hseigel --- src/hotspot/share/memory/universe.cpp | 56 +++++++++++++-------------- 1 file changed, 26 insertions(+), 30 deletions(-) diff --git a/src/hotspot/share/memory/universe.cpp b/src/hotspot/share/memory/universe.cpp index 5d3a57b59fe..335df28fe79 100644 --- a/src/hotspot/share/memory/universe.cpp +++ b/src/hotspot/share/memory/universe.cpp @@ -1064,44 +1064,40 @@ bool universe_post_init() { Universe::_vm_exception = InstanceKlass::cast(k)->allocate_instance(CHECK_false); - if (!DumpSharedSpaces) { - // These are the only Java fields that are currently set during shared space dumping. - // We prefer to not handle this generally, so we always reinitialize these detail messages. - Handle msg = java_lang_String::create_from_str("Java heap space", CHECK_false); - java_lang_Throwable::set_message(Universe::_out_of_memory_error_java_heap, msg()); + Handle msg = java_lang_String::create_from_str("Java heap space", CHECK_false); + java_lang_Throwable::set_message(Universe::_out_of_memory_error_java_heap, msg()); - msg = java_lang_String::create_from_str("Metaspace", CHECK_false); - java_lang_Throwable::set_message(Universe::_out_of_memory_error_metaspace, msg()); - msg = java_lang_String::create_from_str("Compressed class space", CHECK_false); - java_lang_Throwable::set_message(Universe::_out_of_memory_error_class_metaspace, msg()); + msg = java_lang_String::create_from_str("Metaspace", CHECK_false); + java_lang_Throwable::set_message(Universe::_out_of_memory_error_metaspace, msg()); + msg = java_lang_String::create_from_str("Compressed class space", CHECK_false); + java_lang_Throwable::set_message(Universe::_out_of_memory_error_class_metaspace, msg()); - msg = java_lang_String::create_from_str("Requested array size exceeds VM limit", CHECK_false); - java_lang_Throwable::set_message(Universe::_out_of_memory_error_array_size, msg()); + msg = java_lang_String::create_from_str("Requested array size exceeds VM limit", CHECK_false); + java_lang_Throwable::set_message(Universe::_out_of_memory_error_array_size, msg()); - msg = java_lang_String::create_from_str("GC overhead limit exceeded", CHECK_false); - java_lang_Throwable::set_message(Universe::_out_of_memory_error_gc_overhead_limit, msg()); + msg = java_lang_String::create_from_str("GC overhead limit exceeded", CHECK_false); + java_lang_Throwable::set_message(Universe::_out_of_memory_error_gc_overhead_limit, msg()); - msg = java_lang_String::create_from_str("Java heap space: failed reallocation of scalar replaced objects", CHECK_false); - java_lang_Throwable::set_message(Universe::_out_of_memory_error_realloc_objects, msg()); + msg = java_lang_String::create_from_str("Java heap space: failed reallocation of scalar replaced objects", CHECK_false); + java_lang_Throwable::set_message(Universe::_out_of_memory_error_realloc_objects, msg()); - msg = java_lang_String::create_from_str("/ by zero", CHECK_false); - java_lang_Throwable::set_message(Universe::_arithmetic_exception_instance, msg()); + msg = java_lang_String::create_from_str("/ by zero", CHECK_false); + java_lang_Throwable::set_message(Universe::_arithmetic_exception_instance, msg()); - // Setup the array of errors that have preallocated backtrace - k = Universe::_out_of_memory_error_java_heap->klass(); - assert(k->name() == vmSymbols::java_lang_OutOfMemoryError(), "should be out of memory error"); - ik = InstanceKlass::cast(k); + // Setup the array of errors that have preallocated backtrace + k = Universe::_out_of_memory_error_java_heap->klass(); + assert(k->name() == vmSymbols::java_lang_OutOfMemoryError(), "should be out of memory error"); + ik = InstanceKlass::cast(k); - int len = (StackTraceInThrowable) ? (int)PreallocatedOutOfMemoryErrorCount : 0; - Universe::_preallocated_out_of_memory_error_array = oopFactory::new_objArray(ik, len, CHECK_false); - for (int i=0; iallocate_instance(CHECK_false); - Handle err_h = Handle(THREAD, err); - java_lang_Throwable::allocate_backtrace(err_h, CHECK_false); - Universe::preallocated_out_of_memory_errors()->obj_at_put(i, err_h()); - } - Universe::_preallocated_out_of_memory_error_avail_count = (jint)len; + int len = (StackTraceInThrowable) ? (int)PreallocatedOutOfMemoryErrorCount : 0; + Universe::_preallocated_out_of_memory_error_array = oopFactory::new_objArray(ik, len, CHECK_false); + for (int i=0; iallocate_instance(CHECK_false); + Handle err_h = Handle(THREAD, err); + java_lang_Throwable::allocate_backtrace(err_h, CHECK_false); + Universe::preallocated_out_of_memory_errors()->obj_at_put(i, err_h()); } + Universe::_preallocated_out_of_memory_error_avail_count = (jint)len; Universe::initialize_known_methods(CHECK_false); From ba16fabd204928e611e8b7a37cb5c667a1a79e46 Mon Sep 17 00:00:00 2001 From: Jiangli Zhou Date: Wed, 27 Sep 2017 20:40:33 -0400 Subject: [PATCH 14/80] 8186789: CDS dump crashes at ConstantPool::resolve_class_constants ConstantPool::resolve_class_constants needs to check for NULL _cache. Reviewed-by: sspitsyn, coleenp, iklam --- src/hotspot/share/oops/constantPool.cpp | 38 ++++++++++++++----------- src/hotspot/share/oops/constantPool.hpp | 2 +- 2 files changed, 23 insertions(+), 17 deletions(-) diff --git a/src/hotspot/share/oops/constantPool.cpp b/src/hotspot/share/oops/constantPool.cpp index 158103c1dc1..9106e55b710 100644 --- a/src/hotspot/share/oops/constantPool.cpp +++ b/src/hotspot/share/oops/constantPool.cpp @@ -294,6 +294,28 @@ void ConstantPool::archive_resolved_references(Thread* THREAD) { set_resolved_references(NULL); } } + +void ConstantPool::resolve_class_constants(TRAPS) { + assert(DumpSharedSpaces, "used during dump time only"); + // The _cache may be NULL if the _pool_holder klass fails verification + // at dump time due to missing dependencies. + if (cache() == NULL || reference_map() == NULL) { + return; // nothing to do + } + + constantPoolHandle cp(THREAD, this); + for (int index = 1; index < length(); index++) { // Index 0 is unused + if (tag_at(index).is_string()) { + Symbol* sym = cp->unresolved_string_at(index); + // Look up only. Only resolve references to already interned strings. + oop str = StringTable::lookup(sym); + if (str != NULL) { + int cache_index = cp->cp_to_object_index(index); + cp->string_at_put(index, cache_index, str); + } + } + } +} #endif // CDS support. Create a new resolved_references array. @@ -722,22 +744,6 @@ void ConstantPool::resolve_string_constants_impl(const constantPoolHandle& this_ } } -bool ConstantPool::resolve_class_constants(TRAPS) { - constantPoolHandle cp(THREAD, this); - for (int index = 1; index < length(); index++) { // Index 0 is unused - if (tag_at(index).is_string()) { - Symbol* sym = cp->unresolved_string_at(index); - // Look up only. Only resolve references to already interned strings. - oop str = StringTable::lookup(sym); - if (str != NULL) { - int cache_index = cp->cp_to_object_index(index); - cp->string_at_put(index, cache_index, str); - } - } - } - return true; -} - Symbol* ConstantPool::exception_message(const constantPoolHandle& this_cp, int which, constantTag tag, oop pending_exception) { // Dig out the detailed message to reuse if possible Symbol* message = java_lang_Throwable::detail_message(pending_exception); diff --git a/src/hotspot/share/oops/constantPool.hpp b/src/hotspot/share/oops/constantPool.hpp index b2c0fa18f24..f71b22af412 100644 --- a/src/hotspot/share/oops/constantPool.hpp +++ b/src/hotspot/share/oops/constantPool.hpp @@ -717,9 +717,9 @@ class ConstantPool : public Metadata { // CDS support void archive_resolved_references(Thread *THREAD) NOT_CDS_JAVA_HEAP_RETURN; + void resolve_class_constants(TRAPS) NOT_CDS_JAVA_HEAP_RETURN; void remove_unshareable_info(); void restore_unshareable_info(TRAPS); - bool resolve_class_constants(TRAPS); // The ConstantPool vtable is restored by this call when the ConstantPool is // in the shared archive. See patch_klass_vtables() in metaspaceShared.cpp for // all the gory details. SA, dtrace and pstack helpers distinguish metadata From e840fdf6941597357b8fc2a8cc2e6bb2285bf45b Mon Sep 17 00:00:00 2001 From: Tobias Hartmann Date: Thu, 28 Sep 2017 11:02:55 +0200 Subject: [PATCH 15/80] 8187780: VM crashes while generating replay compilation file Fixed two problems with generation of replay file. Reviewed-by: kvn --- src/hotspot/share/ci/ciInstanceKlass.cpp | 5 +- src/hotspot/share/opto/bytecodeInfo.cpp | 3 +- .../compiler/ciReplay/TestDumpReplay.java | 73 +++++++++++++++++++ 3 files changed, 77 insertions(+), 4 deletions(-) create mode 100644 test/hotspot/jtreg/compiler/ciReplay/TestDumpReplay.java diff --git a/src/hotspot/share/ci/ciInstanceKlass.cpp b/src/hotspot/share/ci/ciInstanceKlass.cpp index e0b910cc2d3..00f4a3f14dd 100644 --- a/src/hotspot/share/ci/ciInstanceKlass.cpp +++ b/src/hotspot/share/ci/ciInstanceKlass.cpp @@ -665,9 +665,8 @@ class StaticFinalFieldPrinter : public FieldClosure { _out->print_cr("null"); } else if (value->is_instance()) { if (value->is_a(SystemDictionary::String_klass())) { - _out->print("\""); - _out->print_raw(java_lang_String::as_quoted_ascii(value)); - _out->print_cr("\""); + const char* ascii_value = java_lang_String::as_quoted_ascii(value); + _out->print("\"%s\"", (ascii_value != NULL) ? ascii_value : ""); } else { const char* klass_name = value->klass()->name()->as_quoted_ascii(); _out->print_cr("%s", klass_name); diff --git a/src/hotspot/share/opto/bytecodeInfo.cpp b/src/hotspot/share/opto/bytecodeInfo.cpp index 8071d76b95c..2558c77e0e4 100644 --- a/src/hotspot/share/opto/bytecodeInfo.cpp +++ b/src/hotspot/share/opto/bytecodeInfo.cpp @@ -644,7 +644,8 @@ InlineTree *InlineTree::build_inline_tree_for_callee( ciMethod* callee_method, J C->log()->elem("inline_level_discount caller='%d' callee='%d'", id1, id2); } } - InlineTree* ilt = new InlineTree(C, this, callee_method, caller_jvms, caller_bci, recur_frequency, _max_inline_level + max_inline_level_adjust); + // Allocate in the comp_arena to make sure the InlineTree is live when dumping a replay compilation file + InlineTree* ilt = new (C->comp_arena()) InlineTree(C, this, callee_method, caller_jvms, caller_bci, recur_frequency, _max_inline_level + max_inline_level_adjust); _subtrees.append(ilt); NOT_PRODUCT( _count_inlines += 1; ) diff --git a/test/hotspot/jtreg/compiler/ciReplay/TestDumpReplay.java b/test/hotspot/jtreg/compiler/ciReplay/TestDumpReplay.java new file mode 100644 index 00000000000..d1f03a8429e --- /dev/null +++ b/test/hotspot/jtreg/compiler/ciReplay/TestDumpReplay.java @@ -0,0 +1,73 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @library /test/lib + * @modules java.base/jdk.internal.misc:+open + * @build sun.hotspot.WhiteBox + * @run main ClassFileInstaller sun.hotspot.WhiteBox + * @run main/othervm -Xbootclasspath/a:. -XX:+UnlockDiagnosticVMOptions -XX:+WhiteBoxAPI + * -Xbatch -XX:-TieredCompilation -XX:+AlwaysIncrementalInline + * -XX:CompileCommand=compileonly,compiler.ciReplay.TestDumpReplay::* + * compiler.ciReplay.TestDumpReplay + */ + +package compiler.ciReplay; + +import sun.hotspot.WhiteBox; + +public class TestDumpReplay { + private static final WhiteBox WHITE_BOX = WhiteBox.getWhiteBox(); + + private static final String emptyString; + + static { + emptyString = ""; + } + + public static void m1() { + m2(); + } + + public static void m2() { + m3(); + } + + public static void m3() { + + } + + public static void main(String[] args) { + // Add compiler control directive to force generation of replay file + String directive = "[{ match: \"*.*\", DumpReplay: true }]"; + if (WHITE_BOX.addCompilerDirective(directive) != 1) { + throw new RuntimeException("Failed to add compiler directive"); + } + + // Trigger compilation of m1 + for (int i = 0; i < 10_000; ++i) { + m1(); + } + } +} From 394e6a8318e3d72044705e82d7bc135aac1633ba Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Erik=20=C3=96sterlund?= Date: Tue, 26 Sep 2017 14:05:27 +0200 Subject: [PATCH 16/80] 8186838: Generalize Atomic::inc/dec with templates Reviewed-by: kbarrett, coleenp, dholmes --- src/hotspot/os/windows/os_windows.cpp | 4 +- src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp | 77 ------- src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp | 40 ---- .../os_cpu/bsd_zero/atomic_bsd_zero.hpp | 24 -- .../linux_aarch64/atomic_linux_aarch64.hpp | 30 --- .../os_cpu/linux_arm/atomic_linux_arm.hpp | 25 -- .../os_cpu/linux_ppc/atomic_linux_ppc.hpp | 78 ------- .../os_cpu/linux_s390/atomic_linux_s390.hpp | 213 ------------------ .../os_cpu/linux_sparc/atomic_linux_sparc.hpp | 8 - .../os_cpu/linux_x86/atomic_linux_x86.hpp | 40 ---- .../os_cpu/linux_zero/atomic_linux_zero.hpp | 24 -- .../solaris_sparc/atomic_solaris_sparc.hpp | 9 - .../os_cpu/solaris_x86/atomic_solaris_x86.hpp | 8 - .../os_cpu/windows_x86/atomic_windows_x86.hpp | 56 ----- .../gc/cms/concurrentMarkSweepGeneration.cpp | 4 +- src/hotspot/share/gc/cms/parNewGeneration.cpp | 2 +- .../share/gc/g1/g1StringDedupQueue.cpp | 4 +- .../share/gc/parallel/parMarkBitMap.cpp | 4 +- .../share/gc/parallel/psParallelCompact.cpp | 2 +- .../share/gc/parallel/psParallelCompact.hpp | 2 +- src/hotspot/share/runtime/atomic.hpp | 56 ++--- 21 files changed, 39 insertions(+), 671 deletions(-) diff --git a/src/hotspot/os/windows/os_windows.cpp b/src/hotspot/os/windows/os_windows.cpp index 5c464768eea..dd4402dd83a 100644 --- a/src/hotspot/os/windows/os_windows.cpp +++ b/src/hotspot/os/windows/os_windows.cpp @@ -428,7 +428,7 @@ static unsigned __stdcall thread_native_entry(Thread* thread) { // When the VMThread gets here, the main thread may have already exited // which frees the CodeHeap containing the Atomic::add code if (thread != VMThread::vm_thread() && VMThread::vm_thread() != NULL) { - Atomic::dec_ptr((intptr_t*)&os::win32::_os_thread_count); + Atomic::dec(&os::win32::_os_thread_count); } // If a thread has not deleted itself ("delete this") as part of its @@ -634,7 +634,7 @@ bool os::create_thread(Thread* thread, ThreadType thr_type, return NULL; } - Atomic::inc_ptr((intptr_t*)&os::win32::_os_thread_count); + Atomic::inc(&os::win32::_os_thread_count); // Store info on the Win32 thread into the OSThread osthread->set_thread_handle(thread_handle); diff --git a/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp b/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp index cbf54b82c0b..455a301456f 100644 --- a/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp +++ b/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp @@ -149,83 +149,6 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co } -inline void Atomic::inc (volatile jint* dest) { - - unsigned int temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: lwarx %0, 0, %2 \n" - " addic %0, %0, 1 \n" - " stwcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - - long temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: ldarx %0, 0, %2 \n" - " addic %0, %0, 1 \n" - " stdcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::inc_ptr(volatile void* dest) { - inc_ptr((volatile intptr_t*)dest); -} - - -inline void Atomic::dec (volatile jint* dest) { - - unsigned int temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: lwarx %0, 0, %2 \n" - " addic %0, %0, -1 \n" - " stwcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - - long temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: ldarx %0, 0, %2 \n" - " addic %0, %0, -1 \n" - " stdcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::dec_ptr(volatile void* dest) { - dec_ptr((volatile intptr_t*)dest); -} - inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { // Note that xchg_ptr doesn't necessarily do an acquire diff --git a/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp b/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp index 77528598d15..fc825ce9a1c 100644 --- a/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp +++ b/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp @@ -61,24 +61,6 @@ inline D Atomic::PlatformAdd<4>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline void Atomic::inc (volatile jint* dest) { - __asm__ volatile ( "lock addl $1,(%0)" : - : "r" (dest) : "cc", "memory"); -} - -inline void Atomic::inc_ptr(volatile void* dest) { - inc_ptr((volatile intptr_t*)dest); -} - -inline void Atomic::dec (volatile jint* dest) { - __asm__ volatile ( "lock subl $1,(%0)" : - : "r" (dest) : "cc", "memory"); -} - -inline void Atomic::dec_ptr(volatile void* dest) { - dec_ptr((volatile intptr_t*)dest); -} - inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { __asm__ volatile ( "xchgl (%2),%0" : "=r" (exchange_value) @@ -136,20 +118,6 @@ inline D Atomic::PlatformAdd<8>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - __asm__ __volatile__ ( "lock addq $1,(%0)" - : - : "r" (dest) - : "cc", "memory"); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - __asm__ __volatile__ ( "lock subq $1,(%0)" - : - : "r" (dest) - : "cc", "memory"); -} - inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { __asm__ __volatile__ ("xchgq (%2),%0" : "=r" (exchange_value) @@ -176,14 +144,6 @@ inline jlong Atomic::load(const volatile jlong* src) { return *src; } #else // !AMD64 -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - inc((volatile jint*)dest); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - dec((volatile jint*)dest); -} - inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { return (intptr_t)xchg((jint)exchange_value, (volatile jint*)dest); } diff --git a/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp b/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp index 7fcaf785f9a..235427ea40f 100644 --- a/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp +++ b/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp @@ -207,30 +207,6 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return __sync_add_and_fetch(dest, add_value); } -inline void Atomic::inc(volatile jint* dest) { - add(1, dest); -} - -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - add_ptr(1, dest); -} - -inline void Atomic::inc_ptr(volatile void* dest) { - add_ptr(1, dest); -} - -inline void Atomic::dec(volatile jint* dest) { - add(-1, dest); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - add_ptr(-1, dest); -} - -inline void Atomic::dec_ptr(volatile void* dest) { - add_ptr(-1, dest); -} - inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { #ifdef ARM return arm_lock_test_and_set(dest, exchange_value); diff --git a/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp b/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp index 4074df4fe5a..72a2f3b6555 100644 --- a/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp +++ b/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp @@ -57,26 +57,6 @@ struct Atomic::PlatformAdd } }; -inline void Atomic::inc(volatile jint* dest) -{ - add(1, dest); -} - -inline void Atomic::inc_ptr(volatile void* dest) -{ - add_ptr(1, dest); -} - -inline void Atomic::dec (volatile jint* dest) -{ - add(-1, dest); -} - -inline void Atomic::dec_ptr(volatile void* dest) -{ - add_ptr(-1, dest); -} - inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { jint res = __sync_lock_test_and_set (dest, exchange_value); @@ -110,16 +90,6 @@ inline T Atomic::PlatformCmpxchg::operator()(T exchange_value, inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline void Atomic::inc_ptr(volatile intptr_t* dest) -{ - add_ptr(1, dest); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) -{ - add_ptr(-1, dest); -} - inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { intptr_t res = __sync_lock_test_and_set (dest, exchange_value); diff --git a/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp b/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp index fcd7e1f9ba2..76c7b69076a 100644 --- a/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp +++ b/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp @@ -122,14 +122,6 @@ inline D Atomic::PlatformAdd<4>::add_and_fetch(I add_value, D volatile* dest) co #endif } -inline void Atomic::inc(volatile jint* dest) { - Atomic::add(1, (volatile jint *)dest); -} - -inline void Atomic::dec(volatile jint* dest) { - Atomic::add(-1, (volatile jint *)dest); -} - #ifdef AARCH64 template<> template @@ -151,23 +143,6 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co } #endif // AARCH64 -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - Atomic::add_ptr(1, dest); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - Atomic::add_ptr(-1, dest); -} - -inline void Atomic::inc_ptr(volatile void* dest) { - inc_ptr((volatile intptr_t*)dest); -} - -inline void Atomic::dec_ptr(volatile void* dest) { - dec_ptr((volatile intptr_t*)dest); -} - - inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { #ifdef AARCH64 jint old_val; diff --git a/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp b/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp index a5a0f7d3124..82bf9c2d3c4 100644 --- a/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp +++ b/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp @@ -146,84 +146,6 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return result; } - -inline void Atomic::inc (volatile jint* dest) { - - unsigned int temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: lwarx %0, 0, %2 \n" - " addic %0, %0, 1 \n" - " stwcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - - long temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: ldarx %0, 0, %2 \n" - " addic %0, %0, 1 \n" - " stdcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::inc_ptr(volatile void* dest) { - inc_ptr((volatile intptr_t*)dest); -} - - -inline void Atomic::dec (volatile jint* dest) { - - unsigned int temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: lwarx %0, 0, %2 \n" - " addic %0, %0, -1 \n" - " stwcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - - long temp; - - __asm__ __volatile__ ( - strasm_nobarrier - "1: ldarx %0, 0, %2 \n" - " addic %0, %0, -1 \n" - " stdcx. %0, 0, %2 \n" - " bne- 1b \n" - strasm_nobarrier - : /*%0*/"=&r" (temp), "=m" (*dest) - : /*%2*/"r" (dest), "m" (*dest) - : "cc" strasm_nobarrier_clobber_memory); - -} - -inline void Atomic::dec_ptr(volatile void* dest) { - dec_ptr((volatile intptr_t*)dest); -} - inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { // Note that xchg_ptr doesn't necessarily do an acquire diff --git a/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp b/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp index e7c436bdd6e..ef9391db80c 100644 --- a/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp +++ b/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp @@ -192,219 +192,6 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I inc, D volatile* dest) const { } -//------------ -// Atomic::inc -//------------ -// These methods force the value in memory to be incremented (augmented by 1). -// Both, memory value and increment, are treated as 32bit signed binary integers. -// No overflow exceptions are recognized, and the condition code does not hold -// information about the value in memory. -// -// The value in memory is updated by using a compare-and-swap instruction. The -// instruction is retried as often as required. - -inline void Atomic::inc(volatile jint* dest) { - unsigned int old, upd; - - if (VM_Version::has_LoadAndALUAtomicV1()) { -// tty->print_cr("Atomic::inc called... dest @%p", dest); - __asm__ __volatile__ ( - " LGHI 2,1 \n\t" // load increment - " LA 3,%[mem] \n\t" // force data address into ARG2 -// " LAA %[upd],%[inc],%[mem] \n\t" // increment and get old value -// " LAA 2,2,0(3) \n\t" // actually coded instruction - " .byte 0xeb \n\t" // LAA main opcode - " .byte 0x22 \n\t" // R1,R3 - " .byte 0x30 \n\t" // R2,disp1 - " .byte 0x00 \n\t" // disp2,disp3 - " .byte 0x00 \n\t" // disp4,disp5 - " .byte 0xf8 \n\t" // LAA minor opcode - " AGHI 2,1 \n\t" // calc new value in register - " LR %[upd],2 \n\t" // move to result register - //---< outputs >--- - : [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : -// : [inc] "a" (inc) // read-only. - //---< clobbered >--- - : "cc", "r2", "r3", "memory" - ); - } else { - __asm__ __volatile__ ( - " LLGF %[old],%[mem] \n\t" // get old value - "0: LA %[upd],1(,%[old]) \n\t" // calc result - " CS %[old],%[upd],%[mem] \n\t" // try to xchg res with mem - " JNE 0b \n\t" // no success? -> retry - //---< outputs >--- - : [old] "=&a" (old) // write-only, old counter value - , [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : - //---< clobbered >--- - : "cc", "memory" - ); - } -} - -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - unsigned long old, upd; - - if (VM_Version::has_LoadAndALUAtomicV1()) { - __asm__ __volatile__ ( - " LGHI 2,1 \n\t" // load increment - " LA 3,%[mem] \n\t" // force data address into ARG2 -// " LAAG %[upd],%[inc],%[mem] \n\t" // increment and get old value -// " LAAG 2,2,0(3) \n\t" // actually coded instruction - " .byte 0xeb \n\t" // LAA main opcode - " .byte 0x22 \n\t" // R1,R3 - " .byte 0x30 \n\t" // R2,disp1 - " .byte 0x00 \n\t" // disp2,disp3 - " .byte 0x00 \n\t" // disp4,disp5 - " .byte 0xe8 \n\t" // LAA minor opcode - " AGHI 2,1 \n\t" // calc new value in register - " LR %[upd],2 \n\t" // move to result register - //---< outputs >--- - : [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : -// : [inc] "a" (inc) // read-only. - //---< clobbered >--- - : "cc", "r2", "r3", "memory" - ); - } else { - __asm__ __volatile__ ( - " LG %[old],%[mem] \n\t" // get old value - "0: LA %[upd],1(,%[old]) \n\t" // calc result - " CSG %[old],%[upd],%[mem] \n\t" // try to xchg res with mem - " JNE 0b \n\t" // no success? -> retry - //---< outputs >--- - : [old] "=&a" (old) // write-only, old counter value - , [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : - //---< clobbered >--- - : "cc", "memory" - ); - } -} - -inline void Atomic::inc_ptr(volatile void* dest) { - inc_ptr((volatile intptr_t*)dest); -} - -//------------ -// Atomic::dec -//------------ -// These methods force the value in memory to be decremented (augmented by -1). -// Both, memory value and decrement, are treated as 32bit signed binary integers. -// No overflow exceptions are recognized, and the condition code does not hold -// information about the value in memory. -// -// The value in memory is updated by using a compare-and-swap instruction. The -// instruction is retried as often as required. - -inline void Atomic::dec(volatile jint* dest) { - unsigned int old, upd; - - if (VM_Version::has_LoadAndALUAtomicV1()) { - __asm__ __volatile__ ( - " LGHI 2,-1 \n\t" // load increment - " LA 3,%[mem] \n\t" // force data address into ARG2 -// " LAA %[upd],%[inc],%[mem] \n\t" // increment and get old value -// " LAA 2,2,0(3) \n\t" // actually coded instruction - " .byte 0xeb \n\t" // LAA main opcode - " .byte 0x22 \n\t" // R1,R3 - " .byte 0x30 \n\t" // R2,disp1 - " .byte 0x00 \n\t" // disp2,disp3 - " .byte 0x00 \n\t" // disp4,disp5 - " .byte 0xf8 \n\t" // LAA minor opcode - " AGHI 2,-1 \n\t" // calc new value in register - " LR %[upd],2 \n\t" // move to result register - //---< outputs >--- - : [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : -// : [inc] "a" (inc) // read-only. - //---< clobbered >--- - : "cc", "r2", "r3", "memory" - ); - } else { - __asm__ __volatile__ ( - " LLGF %[old],%[mem] \n\t" // get old value - // LAY not supported by inline assembler - // "0: LAY %[upd],-1(,%[old]) \n\t" // calc result - "0: LR %[upd],%[old] \n\t" // calc result - " AHI %[upd],-1 \n\t" - " CS %[old],%[upd],%[mem] \n\t" // try to xchg res with mem - " JNE 0b \n\t" // no success? -> retry - //---< outputs >--- - : [old] "=&a" (old) // write-only, old counter value - , [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : - //---< clobbered >--- - : "cc", "memory" - ); - } -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - unsigned long old, upd; - - if (VM_Version::has_LoadAndALUAtomicV1()) { - __asm__ __volatile__ ( - " LGHI 2,-1 \n\t" // load increment - " LA 3,%[mem] \n\t" // force data address into ARG2 -// " LAAG %[upd],%[inc],%[mem] \n\t" // increment and get old value -// " LAAG 2,2,0(3) \n\t" // actually coded instruction - " .byte 0xeb \n\t" // LAA main opcode - " .byte 0x22 \n\t" // R1,R3 - " .byte 0x30 \n\t" // R2,disp1 - " .byte 0x00 \n\t" // disp2,disp3 - " .byte 0x00 \n\t" // disp4,disp5 - " .byte 0xe8 \n\t" // LAA minor opcode - " AGHI 2,-1 \n\t" // calc new value in register - " LR %[upd],2 \n\t" // move to result register - //---< outputs >--- - : [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : -// : [inc] "a" (inc) // read-only. - //---< clobbered >--- - : "cc", "r2", "r3", "memory" - ); - } else { - __asm__ __volatile__ ( - " LG %[old],%[mem] \n\t" // get old value -// LAY not supported by inline assembler -// "0: LAY %[upd],-1(,%[old]) \n\t" // calc result - "0: LGR %[upd],%[old] \n\t" // calc result - " AGHI %[upd],-1 \n\t" - " CSG %[old],%[upd],%[mem] \n\t" // try to xchg res with mem - " JNE 0b \n\t" // no success? -> retry - //---< outputs >--- - : [old] "=&a" (old) // write-only, old counter value - , [upd] "=&d" (upd) // write-only, updated counter value - , [mem] "+Q" (*dest) // read/write, memory to be updated atomically - //---< inputs >--- - : - //---< clobbered >--- - : "cc", "memory" - ); - } -} - -inline void Atomic::dec_ptr(volatile void* dest) { - dec_ptr((volatile intptr_t*)dest); -} - //------------- // Atomic::xchg //------------- diff --git a/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp b/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp index 3ea20f8789d..1b40854558a 100644 --- a/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp +++ b/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp @@ -41,14 +41,6 @@ inline void Atomic::store (jlong store_value, volatile jlong* dest) { * inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } -inline void Atomic::inc (volatile jint* dest) { (void)add (1, dest); } -inline void Atomic::inc_ptr(volatile intptr_t* dest) { (void)add_ptr(1, dest); } -inline void Atomic::inc_ptr(volatile void* dest) { (void)add_ptr(1, dest); } - -inline void Atomic::dec (volatile jint* dest) { (void)add (-1, dest); } -inline void Atomic::dec_ptr(volatile intptr_t* dest) { (void)add_ptr(-1, dest); } -inline void Atomic::dec_ptr(volatile void* dest) { (void)add_ptr(-1, dest); } - inline jlong Atomic::load(const volatile jlong* src) { return *src; } template diff --git a/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp b/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp index f19bfa767a9..51ed87f3dd8 100644 --- a/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp +++ b/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp @@ -61,24 +61,6 @@ inline D Atomic::PlatformAdd<4>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline void Atomic::inc (volatile jint* dest) { - __asm__ volatile ( "lock addl $1,(%0)" : - : "r" (dest) : "cc", "memory"); -} - -inline void Atomic::inc_ptr(volatile void* dest) { - inc_ptr((volatile intptr_t*)dest); -} - -inline void Atomic::dec (volatile jint* dest) { - __asm__ volatile ( "lock subl $1,(%0)" : - : "r" (dest) : "cc", "memory"); -} - -inline void Atomic::dec_ptr(volatile void* dest) { - dec_ptr((volatile intptr_t*)dest); -} - inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { __asm__ volatile ( "xchgl (%2),%0" : "=r" (exchange_value) @@ -136,20 +118,6 @@ inline D Atomic::PlatformAdd<8>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - __asm__ __volatile__ ("lock addq $1,(%0)" - : - : "r" (dest) - : "cc", "memory"); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - __asm__ __volatile__ ("lock subq $1,(%0)" - : - : "r" (dest) - : "cc", "memory"); -} - inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { __asm__ __volatile__ ("xchgq (%2),%0" : "=r" (exchange_value) @@ -176,14 +144,6 @@ inline jlong Atomic::load(const volatile jlong* src) { return *src; } #else // !AMD64 -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - inc((volatile jint*)dest); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - dec((volatile jint*)dest); -} - inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { return (intptr_t)xchg((jint)exchange_value, (volatile jint*)dest); } diff --git a/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp b/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp index 22af8a7fbb8..97c6ed1b2b7 100644 --- a/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp +++ b/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp @@ -201,30 +201,6 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return __sync_add_and_fetch(dest, add_value); } -inline void Atomic::inc(volatile jint* dest) { - add(1, dest); -} - -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - add_ptr(1, dest); -} - -inline void Atomic::inc_ptr(volatile void* dest) { - add_ptr(1, dest); -} - -inline void Atomic::dec(volatile jint* dest) { - add(-1, dest); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - add_ptr(-1, dest); -} - -inline void Atomic::dec_ptr(volatile void* dest) { - add_ptr(-1, dest); -} - inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { #ifdef ARM return arm_lock_test_and_set(dest, exchange_value); diff --git a/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp b/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp index 5314e931cf9..5a1a470ae58 100644 --- a/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp +++ b/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp @@ -39,15 +39,6 @@ inline void Atomic::store (jint store_value, volatile jint* dest) { * inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } -inline void Atomic::inc (volatile jint* dest) { (void)add (1, dest); } -inline void Atomic::inc_ptr(volatile intptr_t* dest) { (void)add_ptr(1, dest); } -inline void Atomic::inc_ptr(volatile void* dest) { (void)add_ptr(1, dest); } - -inline void Atomic::dec (volatile jint* dest) { (void)add (-1, dest); } -inline void Atomic::dec_ptr(volatile intptr_t* dest) { (void)add_ptr(-1, dest); } -inline void Atomic::dec_ptr(volatile void* dest) { (void)add_ptr(-1, dest); } - - inline void Atomic::store(jlong store_value, jlong* dest) { *dest = store_value; } inline void Atomic::store(jlong store_value, volatile jlong* dest) { *dest = store_value; } inline jlong Atomic::load(const volatile jlong* src) { return *src; } diff --git a/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp b/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp index c6919fbf38b..310592eadb9 100644 --- a/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp +++ b/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp @@ -39,14 +39,6 @@ inline void Atomic::store (jint store_value, volatile jint* dest) { * inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } -inline void Atomic::inc (volatile jint* dest) { (void)add (1, dest); } -inline void Atomic::inc_ptr(volatile intptr_t* dest) { (void)add_ptr(1, dest); } -inline void Atomic::inc_ptr(volatile void* dest) { (void)add_ptr(1, dest); } - -inline void Atomic::dec (volatile jint* dest) { (void)add (-1, dest); } -inline void Atomic::dec_ptr(volatile intptr_t* dest) { (void)add_ptr(-1, dest); } -inline void Atomic::dec_ptr(volatile void* dest) { (void)add_ptr(-1, dest); } - // For Sun Studio - implementation is in solaris_x86_64.il. extern "C" { diff --git a/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp b/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp index abf266917a1..e1ba4f45235 100644 --- a/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp +++ b/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp @@ -81,30 +81,6 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return add_using_helper(os::atomic_add_ptr_func, add_value, dest); } -inline void Atomic::inc (volatile jint* dest) { - (void)add (1, dest); -} - -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - (void)add_ptr(1, dest); -} - -inline void Atomic::inc_ptr(volatile void* dest) { - (void)add_ptr(1, dest); -} - -inline void Atomic::dec (volatile jint* dest) { - (void)add (-1, dest); -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - (void)add_ptr(-1, dest); -} - -inline void Atomic::dec_ptr(volatile void* dest) { - (void)add_ptr(-1, dest); -} - inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { return (jint)(*os::atomic_xchg_func)(exchange_value, dest); } @@ -152,38 +128,6 @@ inline D Atomic::PlatformAdd<4>::add_and_fetch(I add_value, D volatile* dest) co } } -inline void Atomic::inc (volatile jint* dest) { - // alternative for InterlockedIncrement - __asm { - mov edx, dest; - lock add dword ptr [edx], 1; - } -} - -inline void Atomic::inc_ptr(volatile intptr_t* dest) { - inc((volatile jint*)dest); -} - -inline void Atomic::inc_ptr(volatile void* dest) { - inc((volatile jint*)dest); -} - -inline void Atomic::dec (volatile jint* dest) { - // alternative for InterlockedDecrement - __asm { - mov edx, dest; - lock sub dword ptr [edx], 1; - } -} - -inline void Atomic::dec_ptr(volatile intptr_t* dest) { - dec((volatile jint*)dest); -} - -inline void Atomic::dec_ptr(volatile void* dest) { - dec((volatile jint*)dest); -} - inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { // alternative for InterlockedExchange __asm { diff --git a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp index 22d5030ba72..e9a2fe8123b 100644 --- a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp +++ b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp @@ -1075,7 +1075,7 @@ ConcurrentMarkSweepGeneration::par_promote(int thread_num, obj_ptr, old->is_objArray(), word_sz); NOT_PRODUCT( - Atomic::inc_ptr(&_numObjectsPromoted); + Atomic::inc(&_numObjectsPromoted); Atomic::add_ptr(alloc_sz, &_numWordsPromoted); ) @@ -7974,7 +7974,7 @@ void CMSCollector::push_on_overflow_list(oop p) { // Multi-threaded; use CAS to prepend to overflow list void CMSCollector::par_push_on_overflow_list(oop p) { - NOT_PRODUCT(Atomic::inc_ptr(&_num_par_pushes);) + NOT_PRODUCT(Atomic::inc(&_num_par_pushes);) assert(oopDesc::is_oop(p), "Not an oop"); par_preserve_mark_if_necessary(p); oop observed_overflow_list = _overflow_list; diff --git a/src/hotspot/share/gc/cms/parNewGeneration.cpp b/src/hotspot/share/gc/cms/parNewGeneration.cpp index 5d651e0507e..873fad0b251 100644 --- a/src/hotspot/share/gc/cms/parNewGeneration.cpp +++ b/src/hotspot/share/gc/cms/parNewGeneration.cpp @@ -1281,7 +1281,7 @@ void ParNewGeneration::push_on_overflow_list(oop from_space_obj, ParScanThreadSt // XXX This is horribly inefficient when a promotion failure occurs // and should be fixed. XXX FIX ME !!! #ifndef PRODUCT - Atomic::inc_ptr(&_num_par_pushes); + Atomic::inc(&_num_par_pushes); assert(_num_par_pushes > 0, "Tautology"); #endif if (from_space_obj->forwardee() == from_space_obj) { diff --git a/src/hotspot/share/gc/g1/g1StringDedupQueue.cpp b/src/hotspot/share/gc/g1/g1StringDedupQueue.cpp index b029c3f2b40..546f33d9120 100644 --- a/src/hotspot/share/gc/g1/g1StringDedupQueue.cpp +++ b/src/hotspot/share/gc/g1/g1StringDedupQueue.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2014, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2014, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -90,7 +90,7 @@ void G1StringDedupQueue::push(uint worker_id, oop java_string) { } } else { // Queue is full, drop the string and update the statistics - Atomic::inc_ptr(&_queue->_dropped); + Atomic::inc(&_queue->_dropped); } } diff --git a/src/hotspot/share/gc/parallel/parMarkBitMap.cpp b/src/hotspot/share/gc/parallel/parMarkBitMap.cpp index 8696160c880..83f8af7335e 100644 --- a/src/hotspot/share/gc/parallel/parMarkBitMap.cpp +++ b/src/hotspot/share/gc/parallel/parMarkBitMap.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2005, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2005, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -89,7 +89,7 @@ ParMarkBitMap::mark_obj(HeapWord* addr, size_t size) const idx_t end_bit = addr_to_bit(addr + size - 1); bool end_bit_ok = _end_bits.par_set_bit(end_bit); assert(end_bit_ok, "concurrency problem"); - DEBUG_ONLY(Atomic::inc_ptr(&mark_bitmap_count)); + DEBUG_ONLY(Atomic::inc(&mark_bitmap_count)); DEBUG_ONLY(Atomic::add_ptr(size, &mark_bitmap_size)); return true; } diff --git a/src/hotspot/share/gc/parallel/psParallelCompact.cpp b/src/hotspot/share/gc/parallel/psParallelCompact.cpp index 0678ee5b65b..8ed22f4ab2a 100644 --- a/src/hotspot/share/gc/parallel/psParallelCompact.cpp +++ b/src/hotspot/share/gc/parallel/psParallelCompact.cpp @@ -520,7 +520,7 @@ void ParallelCompactData::add_obj(HeapWord* addr, size_t len) const size_t beg_region = obj_ofs >> Log2RegionSize; const size_t end_region = (obj_ofs + len - 1) >> Log2RegionSize; - DEBUG_ONLY(Atomic::inc_ptr(&add_obj_count);) + DEBUG_ONLY(Atomic::inc(&add_obj_count);) DEBUG_ONLY(Atomic::add_ptr(len, &add_obj_size);) if (beg_region == end_region) { diff --git a/src/hotspot/share/gc/parallel/psParallelCompact.hpp b/src/hotspot/share/gc/parallel/psParallelCompact.hpp index 6bf8270d7fd..abc5019f652 100644 --- a/src/hotspot/share/gc/parallel/psParallelCompact.hpp +++ b/src/hotspot/share/gc/parallel/psParallelCompact.hpp @@ -517,7 +517,7 @@ ParallelCompactData::RegionData::set_blocks_filled() OrderAccess::release(); _blocks_filled = true; // Debug builds count the number of times the table was filled. - DEBUG_ONLY(Atomic::inc_ptr(&_blocks_filled_count)); + DEBUG_ONLY(Atomic::inc(&_blocks_filled_count)); } inline void diff --git a/src/hotspot/share/runtime/atomic.hpp b/src/hotspot/share/runtime/atomic.hpp index 108c841ed96..a34d7f389f8 100644 --- a/src/hotspot/share/runtime/atomic.hpp +++ b/src/hotspot/share/runtime/atomic.hpp @@ -97,21 +97,21 @@ class Atomic : AllStatic { return add(add_value, reinterpret_cast(dest)); } - // Atomically increment location. inc*() provide: + // Atomically increment location. inc() provide: // increment-dest - inline static void inc (volatile jint* dest); - inline static void inc (volatile jshort* dest); - inline static void inc (volatile size_t* dest); - inline static void inc_ptr(volatile intptr_t* dest); - inline static void inc_ptr(volatile void* dest); + // The type D may be either a pointer type, or an integral + // type. If it is a pointer type, then the increment is + // scaled to the size of the type pointed to by the pointer. + template + inline static void inc(D volatile* dest); - // Atomically decrement a location. dec*() provide: + // Atomically decrement a location. dec() provide: // decrement-dest - inline static void dec (volatile jint* dest); - inline static void dec (volatile jshort* dest); - inline static void dec (volatile size_t* dest); - inline static void dec_ptr(volatile intptr_t* dest); - inline static void dec_ptr(volatile void* dest); + // The type D may be either a pointer type, or an integral + // type. If it is a pointer type, then the decrement is + // scaled to the size of the type pointed to by the pointer. + template + inline static void dec(D volatile* dest); // Performs atomic exchange of *dest with exchange_value. Returns old // prior value of *dest. xchg*() provide: @@ -312,6 +312,22 @@ struct Atomic::AddAndFetch VALUE_OBJ_CLASS_SPEC { D operator()(I add_value, D volatile* dest) const; }; +template +inline void Atomic::inc(D volatile* dest) { + STATIC_ASSERT(IsPointer::value || IsIntegral::value); + typedef typename Conditional::value, ptrdiff_t, D>::type I; + Atomic::add(I(1), dest); +} + +template +inline void Atomic::dec(D volatile* dest) { + STATIC_ASSERT(IsPointer::value || IsIntegral::value); + typedef typename Conditional::value, ptrdiff_t, D>::type I; + // Assumes two's complement integer representation. + #pragma warning(suppress: 4146) + Atomic::add(I(-1), dest); +} + // Define the class before including platform file, which may specialize // the operator definition. No generic definition of specializations // of the operator template are provided, nor are there any generic @@ -437,14 +453,6 @@ inline D Atomic::add_using_helper(Fn fn, I add_value, D volatile* dest) { reinterpret_cast(dest))); } -inline void Atomic::inc(volatile size_t* dest) { - inc_ptr((volatile intptr_t*) dest); -} - -inline void Atomic::dec(volatile size_t* dest) { - dec_ptr((volatile intptr_t*) dest); -} - template inline D Atomic::cmpxchg(T exchange_value, D volatile* dest, @@ -591,12 +599,4 @@ inline unsigned Atomic::xchg(unsigned int exchange_value, volatile unsigned int* return (unsigned int)Atomic::xchg((jint)exchange_value, (volatile jint*)dest); } -inline void Atomic::inc(volatile jshort* dest) { - (void)add(jshort(1), dest); -} - -inline void Atomic::dec(volatile jshort* dest) { - (void)add(jshort(-1), dest); -} - #endif // SHARE_VM_RUNTIME_ATOMIC_HPP From c4ba1b52b377c65842c5f6300aa5ad891664a4fe Mon Sep 17 00:00:00 2001 From: Zhengyu Gu Date: Thu, 28 Sep 2017 09:56:54 -0400 Subject: [PATCH 17/80] 8186770: NMT: Report metadata information in NMT summary Added metadata statistics in NMT summary report Reviewed-by: adinn, coleenp --- src/hotspot/share/memory/metaspace.cpp | 2 +- src/hotspot/share/memory/metaspace.hpp | 2 +- src/hotspot/share/services/memBaseline.cpp | 1 + src/hotspot/share/services/memBaseline.hpp | 5 + src/hotspot/share/services/memReporter.cpp | 118 ++++++++++++++++-- src/hotspot/share/services/memReporter.hpp | 12 +- .../share/services/virtualMemoryTracker.cpp | 35 +++++- .../share/services/virtualMemoryTracker.hpp | 28 ++++- 8 files changed, 191 insertions(+), 12 deletions(-) diff --git a/src/hotspot/share/memory/metaspace.cpp b/src/hotspot/share/memory/metaspace.cpp index b1d90841010..c4c306aae84 100644 --- a/src/hotspot/share/memory/metaspace.cpp +++ b/src/hotspot/share/memory/metaspace.cpp @@ -2718,7 +2718,7 @@ void SpaceManager::dump(outputStream* const out) const { size_t MetaspaceAux::_capacity_words[] = {0, 0}; -size_t MetaspaceAux::_used_words[] = {0, 0}; +volatile size_t MetaspaceAux::_used_words[] = {0, 0}; size_t MetaspaceAux::free_bytes(Metaspace::MetadataType mdtype) { VirtualSpaceList* list = Metaspace::get_space_list(mdtype); diff --git a/src/hotspot/share/memory/metaspace.hpp b/src/hotspot/share/memory/metaspace.hpp index 879388e7f32..81ad7288676 100644 --- a/src/hotspot/share/memory/metaspace.hpp +++ b/src/hotspot/share/memory/metaspace.hpp @@ -273,7 +273,7 @@ class MetaspaceAux : AllStatic { // Running sum of space in all Metachunks that // are being used for metadata. One for each // type of Metadata. - static size_t _used_words[Metaspace:: MetadataTypeCount]; + static volatile size_t _used_words[Metaspace:: MetadataTypeCount]; public: // Decrement and increment _allocated_capacity_words diff --git a/src/hotspot/share/services/memBaseline.cpp b/src/hotspot/share/services/memBaseline.cpp index f580aada254..f2d6c36188c 100644 --- a/src/hotspot/share/services/memBaseline.cpp +++ b/src/hotspot/share/services/memBaseline.cpp @@ -144,6 +144,7 @@ class VirtualMemoryAllocationWalker : public VirtualMemoryWalker { bool MemBaseline::baseline_summary() { MallocMemorySummary::snapshot(&_malloc_memory_snapshot); VirtualMemorySummary::snapshot(&_virtual_memory_snapshot); + MetaspaceSnapshot::snapshot(_metaspace_snapshot); return true; } diff --git a/src/hotspot/share/services/memBaseline.hpp b/src/hotspot/share/services/memBaseline.hpp index 238d29d82fe..9040306aca4 100644 --- a/src/hotspot/share/services/memBaseline.hpp +++ b/src/hotspot/share/services/memBaseline.hpp @@ -65,6 +65,7 @@ class MemBaseline VALUE_OBJ_CLASS_SPEC { // Summary information MallocMemorySnapshot _malloc_memory_snapshot; VirtualMemorySnapshot _virtual_memory_snapshot; + MetaspaceSnapshot _metaspace_snapshot; size_t _class_count; @@ -103,6 +104,10 @@ class MemBaseline VALUE_OBJ_CLASS_SPEC { return &_virtual_memory_snapshot; } + MetaspaceSnapshot* metaspace_snapshot() { + return &_metaspace_snapshot; + } + MallocSiteIterator malloc_sites(SortingOrder order); VirtualMemorySiteIterator virtual_memory_sites(SortingOrder order); diff --git a/src/hotspot/share/services/memReporter.cpp b/src/hotspot/share/services/memReporter.cpp index 8199ee0aa68..77abb49833d 100644 --- a/src/hotspot/share/services/memReporter.cpp +++ b/src/hotspot/share/services/memReporter.cpp @@ -175,12 +175,44 @@ void MemSummaryReporter::report_summary_of_type(MEMFLAGS flag, amount_in_current_scale(_malloc_snapshot->malloc_overhead()->size()) > 0) { out->print_cr("%27s (tracking overhead=" SIZE_FORMAT "%s)", " ", amount_in_current_scale(_malloc_snapshot->malloc_overhead()->size()), scale); + } else if (flag == mtClass) { + // Metadata information + report_metadata(Metaspace::NonClassType); + if (Metaspace::using_class_space()) { + report_metadata(Metaspace::ClassType); + } } - out->print_cr(" "); } } +void MemSummaryReporter::report_metadata(Metaspace::MetadataType type) const { + assert(type == Metaspace::NonClassType || type == Metaspace::ClassType, + "Invalid metadata type"); + const char* name = (type == Metaspace::NonClassType) ? + "Metadata: " : "Class space:"; + + outputStream* out = output(); + const char* scale = current_scale(); + size_t committed = MetaspaceAux::committed_bytes(type); + size_t used = MetaspaceAux::used_bytes(type); + size_t free = (MetaspaceAux::capacity_bytes(type) - used) + + MetaspaceAux::free_chunks_total_bytes(type) + + MetaspaceAux::free_bytes(type); + + assert(committed >= used + free, "Sanity"); + size_t waste = committed - (used + free); + + out->print_cr("%27s ( %s)", " ", name); + out->print("%27s ( ", " "); + print_total(MetaspaceAux::reserved_bytes(type), committed); + out->print_cr(")"); + out->print_cr("%27s ( used=" SIZE_FORMAT "%s)", " ", amount_in_current_scale(used), scale); + out->print_cr("%27s ( free=" SIZE_FORMAT "%s)", " ", amount_in_current_scale(free), scale); + out->print_cr("%27s ( waste=" SIZE_FORMAT "%s =%2.2f%%)", " ", amount_in_current_scale(waste), + scale, ((float)waste * 100)/committed); +} + void MemDetailReporter::report_detail() { // Start detail report outputStream* out = output(); @@ -305,9 +337,13 @@ void MemSummaryDiffReporter::report_diff() { MEMFLAGS flag = NMTUtil::index_to_flag(index); // thread stack is reported as part of thread category if (flag == mtThreadStack) continue; - diff_summary_of_type(flag, _early_baseline.malloc_memory(flag), - _early_baseline.virtual_memory(flag), _current_baseline.malloc_memory(flag), - _current_baseline.virtual_memory(flag)); + diff_summary_of_type(flag, + _early_baseline.malloc_memory(flag), + _early_baseline.virtual_memory(flag), + _early_baseline.metaspace_snapshot(), + _current_baseline.malloc_memory(flag), + _current_baseline.virtual_memory(flag), + _current_baseline.metaspace_snapshot()); } } @@ -367,9 +403,11 @@ void MemSummaryDiffReporter::print_virtual_memory_diff(size_t current_reserved, } -void MemSummaryDiffReporter::diff_summary_of_type(MEMFLAGS flag, const MallocMemory* early_malloc, - const VirtualMemory* early_vm, const MallocMemory* current_malloc, - const VirtualMemory* current_vm) const { +void MemSummaryDiffReporter::diff_summary_of_type(MEMFLAGS flag, + const MallocMemory* early_malloc, const VirtualMemory* early_vm, + const MetaspaceSnapshot* early_ms, + const MallocMemory* current_malloc, const VirtualMemory* current_vm, + const MetaspaceSnapshot* current_ms) const { outputStream* out = output(); const char* scale = current_scale(); @@ -486,11 +524,77 @@ void MemSummaryDiffReporter::diff_summary_of_type(MEMFLAGS flag, const MallocMem out->print(" %+ld%s", overhead_diff, scale); } out->print_cr(")"); + } else if (flag == mtClass) { + assert(current_ms != NULL && early_ms != NULL, "Sanity"); + print_metaspace_diff(current_ms, early_ms); } out->print_cr(" "); } } +void MemSummaryDiffReporter::print_metaspace_diff(const MetaspaceSnapshot* current_ms, + const MetaspaceSnapshot* early_ms) const { + print_metaspace_diff(Metaspace::NonClassType, current_ms, early_ms); + if (Metaspace::using_class_space()) { + print_metaspace_diff(Metaspace::ClassType, current_ms, early_ms); + } +} + +void MemSummaryDiffReporter::print_metaspace_diff(Metaspace::MetadataType type, + const MetaspaceSnapshot* current_ms, + const MetaspaceSnapshot* early_ms) const { + const char* name = (type == Metaspace::NonClassType) ? + "Metadata: " : "Class space:"; + + outputStream* out = output(); + const char* scale = current_scale(); + + out->print_cr("%27s ( %s)", " ", name); + out->print("%27s ( ", " "); + print_virtual_memory_diff(current_ms->reserved_in_bytes(type), + current_ms->committed_in_bytes(type), + early_ms->reserved_in_bytes(type), + early_ms->committed_in_bytes(type)); + out->print_cr(")"); + + long diff_used = diff_in_current_scale(current_ms->used_in_bytes(type), + early_ms->used_in_bytes(type)); + long diff_free = diff_in_current_scale(current_ms->free_in_bytes(type), + early_ms->free_in_bytes(type)); + + size_t current_waste = current_ms->committed_in_bytes(type) + - (current_ms->used_in_bytes(type) + current_ms->free_in_bytes(type)); + size_t early_waste = early_ms->committed_in_bytes(type) + - (early_ms->used_in_bytes(type) + early_ms->free_in_bytes(type)); + long diff_waste = diff_in_current_scale(current_waste, early_waste); + + // Diff used + out->print("%27s ( used=" SIZE_FORMAT "%s", " ", + amount_in_current_scale(current_ms->used_in_bytes(type)), scale); + if (diff_used != 0) { + out->print(" %+ld%s", diff_used, scale); + } + out->print_cr(")"); + + // Diff free + out->print("%27s ( free=" SIZE_FORMAT "%s", " ", + amount_in_current_scale(current_ms->free_in_bytes(type)), scale); + if (diff_free != 0) { + out->print(" %+ld%s", diff_free, scale); + } + out->print_cr(")"); + + + // Diff waste + out->print("%27s ( waste=" SIZE_FORMAT "%s =%2.2f%%", " ", + amount_in_current_scale(current_waste), scale, + ((float)current_waste * 100) / current_ms->committed_in_bytes(type)); + if (diff_waste != 0) { + out->print(" %+ld%s", diff_waste, scale); + } + out->print_cr(")"); +} + void MemDetailDiffReporter::report_diff() { MemSummaryDiffReporter::report_diff(); diff_malloc_sites(); diff --git a/src/hotspot/share/services/memReporter.hpp b/src/hotspot/share/services/memReporter.hpp index 9b83f8ce4f0..f244ad55248 100644 --- a/src/hotspot/share/services/memReporter.hpp +++ b/src/hotspot/share/services/memReporter.hpp @@ -27,6 +27,7 @@ #if INCLUDE_NMT +#include "memory/metaspace.hpp" #include "oops/instanceKlass.hpp" #include "services/memBaseline.hpp" #include "services/nmtCommon.hpp" @@ -110,6 +111,8 @@ class MemSummaryReporter : public MemReporterBase { // Report summary for each memory type void report_summary_of_type(MEMFLAGS type, MallocMemory* malloc_memory, VirtualMemory* virtual_memory); + + void report_metadata(Metaspace::MetadataType type) const; }; /* @@ -170,7 +173,9 @@ class MemSummaryDiffReporter : public MemReporterBase { // report the comparison of each memory type void diff_summary_of_type(MEMFLAGS type, const MallocMemory* early_malloc, const VirtualMemory* early_vm, - const MallocMemory* current_malloc, const VirtualMemory* current_vm) const; + const MetaspaceSnapshot* early_ms, + const MallocMemory* current_malloc, const VirtualMemory* current_vm, + const MetaspaceSnapshot* current_ms) const; protected: void print_malloc_diff(size_t current_amount, size_t current_count, @@ -179,6 +184,11 @@ class MemSummaryDiffReporter : public MemReporterBase { size_t early_reserved, size_t early_committed) const; void print_arena_diff(size_t current_amount, size_t current_count, size_t early_amount, size_t early_count) const; + + void print_metaspace_diff(const MetaspaceSnapshot* current_ms, + const MetaspaceSnapshot* early_ms) const; + void print_metaspace_diff(Metaspace::MetadataType type, + const MetaspaceSnapshot* current_ms, const MetaspaceSnapshot* early_ms) const; }; /* diff --git a/src/hotspot/share/services/virtualMemoryTracker.cpp b/src/hotspot/share/services/virtualMemoryTracker.cpp index c21aa542b2d..97bc9d5ef7c 100644 --- a/src/hotspot/share/services/virtualMemoryTracker.cpp +++ b/src/hotspot/share/services/virtualMemoryTracker.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2013, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2013, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -23,6 +23,7 @@ */ #include "precompiled.hpp" +#include "memory/metaspace.hpp" #include "runtime/atomic.hpp" #include "runtime/os.hpp" #include "runtime/threadCritical.hpp" @@ -492,3 +493,35 @@ bool VirtualMemoryTracker::transition(NMT_TrackingLevel from, NMT_TrackingLevel return true; } + +// Metaspace Support +MetaspaceSnapshot::MetaspaceSnapshot() { + for (int index = (int)Metaspace::ClassType; index < (int)Metaspace::MetadataTypeCount; index ++) { + Metaspace::MetadataType type = (Metaspace::MetadataType)index; + assert_valid_metadata_type(type); + _reserved_in_bytes[type] = 0; + _committed_in_bytes[type] = 0; + _used_in_bytes[type] = 0; + _free_in_bytes[type] = 0; + } +} + +void MetaspaceSnapshot::snapshot(Metaspace::MetadataType type, MetaspaceSnapshot& mss) { + assert_valid_metadata_type(type); + + mss._reserved_in_bytes[type] = MetaspaceAux::reserved_bytes(type); + mss._committed_in_bytes[type] = MetaspaceAux::committed_bytes(type); + mss._used_in_bytes[type] = MetaspaceAux::used_bytes(type); + + size_t free_in_bytes = (MetaspaceAux::capacity_bytes(type) - MetaspaceAux::used_bytes(type)) + + MetaspaceAux::free_chunks_total_bytes(type) + + MetaspaceAux::free_bytes(type); + mss._free_in_bytes[type] = free_in_bytes; +} + +void MetaspaceSnapshot::snapshot(MetaspaceSnapshot& mss) { + snapshot(Metaspace::ClassType, mss); + if (Metaspace::using_class_space()) { + snapshot(Metaspace::NonClassType, mss); + } +} diff --git a/src/hotspot/share/services/virtualMemoryTracker.hpp b/src/hotspot/share/services/virtualMemoryTracker.hpp index 02d21bd53bb..9a02676ade0 100644 --- a/src/hotspot/share/services/virtualMemoryTracker.hpp +++ b/src/hotspot/share/services/virtualMemoryTracker.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2013, 2014, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2013, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -28,6 +28,7 @@ #if INCLUDE_NMT #include "memory/allocation.hpp" +#include "memory/metaspace.hpp" #include "services/allocationSite.hpp" #include "services/nmtCommon.hpp" #include "utilities/linkedlist.hpp" @@ -419,6 +420,31 @@ class VirtualMemoryTracker : AllStatic { }; +class MetaspaceSnapshot : public ResourceObj { +private: + size_t _reserved_in_bytes[Metaspace::MetadataTypeCount]; + size_t _committed_in_bytes[Metaspace::MetadataTypeCount]; + size_t _used_in_bytes[Metaspace::MetadataTypeCount]; + size_t _free_in_bytes[Metaspace::MetadataTypeCount]; + +public: + MetaspaceSnapshot(); + size_t reserved_in_bytes(Metaspace::MetadataType type) const { assert_valid_metadata_type(type); return _reserved_in_bytes[type]; } + size_t committed_in_bytes(Metaspace::MetadataType type) const { assert_valid_metadata_type(type); return _committed_in_bytes[type]; } + size_t used_in_bytes(Metaspace::MetadataType type) const { assert_valid_metadata_type(type); return _used_in_bytes[type]; } + size_t free_in_bytes(Metaspace::MetadataType type) const { assert_valid_metadata_type(type); return _free_in_bytes[type]; } + + static void snapshot(MetaspaceSnapshot& s); + +private: + static void snapshot(Metaspace::MetadataType type, MetaspaceSnapshot& s); + + static void assert_valid_metadata_type(Metaspace::MetadataType type) { + assert(type == Metaspace::ClassType || type == Metaspace::NonClassType, + "Invalid metadata type"); + } +}; + #endif // INCLUDE_NMT #endif // SHARE_VM_SERVICES_VIRTUAL_MEMORY_TRACKER_HPP From 87e30fd80172c5bd6748f140ddf6cd19adb62764 Mon Sep 17 00:00:00 2001 From: Harold Seigel Date: Thu, 28 Sep 2017 13:01:24 -0400 Subject: [PATCH 18/80] 8186092: Unnecessary loader constraints produced when there are multiple defaults Do not check loader constraints for overpass methods Reviewed-by: dholmes, acorn --- .../share/classfile/defaultMethods.cpp | 16 ++-- src/hotspot/share/oops/klassVtable.cpp | 80 ++++++++++--------- .../runtime/LoaderConstraints/common/C.jasm | 37 +++++++++ .../runtime/LoaderConstraints/common/Foo.java | 24 ++++++ .../runtime/LoaderConstraints/common/J.java | 26 ++++++ .../common/PreemptingClassLoader.java | 59 ++++++++++++++ .../LoaderConstraints/itableICCE/I.java | 26 ++++++ .../LoaderConstraints/itableICCE/Task.java | 31 +++++++ .../LoaderConstraints/itableICCE/Test.java | 59 ++++++++++++++ .../itableLdrConstraint/I.java | 26 ++++++ .../itableLdrConstraint/Task.java | 31 +++++++ .../itableLdrConstraint/Test.java | 60 ++++++++++++++ .../LoaderConstraints/vtableAME/I.java | 26 ++++++ .../LoaderConstraints/vtableAME/Task.java | 24 ++++++ .../LoaderConstraints/vtableAME/Test.java | 66 +++++++++++++++ .../vtableLdrConstraint/I.java | 25 ++++++ .../vtableLdrConstraint/Task.java | 30 +++++++ .../vtableLdrConstraint/Test.java | 63 +++++++++++++++ 18 files changed, 666 insertions(+), 43 deletions(-) create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/common/C.jasm create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/common/Foo.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/common/J.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/common/PreemptingClassLoader.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/I.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Task.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Test.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/I.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Task.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Test.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/I.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Task.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Test.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/I.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Task.java create mode 100644 test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Test.java diff --git a/src/hotspot/share/classfile/defaultMethods.cpp b/src/hotspot/share/classfile/defaultMethods.cpp index 596b567db49..b09d552bcf4 100644 --- a/src/hotspot/share/classfile/defaultMethods.cpp +++ b/src/hotspot/share/classfile/defaultMethods.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2012, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2012, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -767,15 +767,14 @@ static void create_default_methods( InstanceKlass* klass, // This is the guts of the default methods implementation. This is called just // after the classfile has been parsed if some ancestor has default methods. // -// First if finds any name/signature slots that need any implementation (either +// First it finds any name/signature slots that need any implementation (either // because they are miranda or a superclass's implementation is an overpass // itself). For each slot, iterate over the hierarchy, to see if they contain a // signature that matches the slot we are looking at. // -// For each slot filled, we generate an overpass method that either calls the -// unique default method candidate using invokespecial, or throws an exception -// (in the case of no default method candidates, or more than one valid -// candidate). These methods are then added to the class's method list. +// For each slot filled, we either record the default method candidate in the +// klass default_methods list or, only to handle exception cases, we create an +// overpass method that throws an exception and add it to the klass methods list. // The JVM does not create bridges nor handle generic signatures here. void DefaultMethods::generate_default_methods( InstanceKlass* klass, const GrowableArray* mirandas, TRAPS) { @@ -901,6 +900,11 @@ static void switchover_constant_pool(BytecodeConstantPool* bpool, // This allows virtual methods to override the overpass, but ensures // that a local method search will find the exception rather than an abstract // or default method that is not a valid candidate. +// +// Note that if overpass method are ever created that are not exception +// throwing methods then the loader constraint checking logic for vtable and +// itable creation needs to be changed to check loader constraints for the +// overpass methods that do not throw exceptions. static void create_defaults_and_exceptions( GrowableArray* slots, InstanceKlass* klass, TRAPS) { diff --git a/src/hotspot/share/oops/klassVtable.cpp b/src/hotspot/share/oops/klassVtable.cpp index bb6966cdfe5..6ebf6988b43 100644 --- a/src/hotspot/share/oops/klassVtable.cpp +++ b/src/hotspot/share/oops/klassVtable.cpp @@ -479,13 +479,15 @@ bool klassVtable::update_inherited_vtable(InstanceKlass* klass, const methodHand allocate_new = false; } - if (checkconstraints) { - // Override vtable entry if passes loader constraint check - // if loader constraint checking requested - // No need to visit his super, since he and his super - // have already made any needed loader constraints. - // Since loader constraints are transitive, it is enough - // to link to the first super, and we get all the others. + // Do not check loader constraints for overpass methods because overpass + // methods are created by the jvm to throw exceptions. + if (checkconstraints && !target_method()->is_overpass()) { + // Override vtable entry if passes loader constraint check + // if loader constraint checking requested + // No need to visit his super, since he and his super + // have already made any needed loader constraints. + // Since loader constraints are transitive, it is enough + // to link to the first super, and we get all the others. Handle super_loader(THREAD, super_klass->class_loader()); if (target_loader() != super_loader()) { @@ -495,21 +497,23 @@ bool klassVtable::update_inherited_vtable(InstanceKlass* klass, const methodHand super_loader, true, CHECK_(false)); if (failed_type_symbol != NULL) { - const char* msg = "loader constraint violation: when resolving " - "overridden method \"%s\" the class loader (instance" - " of %s) of the current class, %s, and its superclass loader " - "(instance of %s), have different Class objects for the type " - "%s used in the signature"; + const char* msg = "loader constraint violation for class %s: when selecting " + "overriding method \"%s\" the class loader (instance of %s) of the " + "selected method's type %s, and the class loader (instance of %s) for its super " + "type %s have different Class objects for the type %s used in the signature"; + char* curr_class = klass->name()->as_C_string(); char* sig = target_method()->name_and_sig_as_C_string(); const char* loader1 = SystemDictionary::loader_name(target_loader()); - char* current = target_klass->name()->as_C_string(); + char* sel_class = target_klass->name()->as_C_string(); const char* loader2 = SystemDictionary::loader_name(super_loader()); + char* super_class = super_klass->name()->as_C_string(); char* failed_type_name = failed_type_symbol->as_C_string(); - size_t buflen = strlen(msg) + strlen(sig) + strlen(loader1) + - strlen(current) + strlen(loader2) + strlen(failed_type_name); + size_t buflen = strlen(msg) + strlen(curr_class) + strlen(sig) + + strlen(loader1) + strlen(sel_class) + strlen(loader2) + + strlen(super_class) + strlen(failed_type_name); char* buf = NEW_RESOURCE_ARRAY_IN_THREAD(THREAD, char, buflen); - jio_snprintf(buf, buflen, msg, sig, loader1, current, loader2, - failed_type_name); + jio_snprintf(buf, buflen, msg, curr_class, sig, loader1, sel_class, loader2, + super_class, failed_type_name); THROW_MSG_(vmSymbols::java_lang_LinkageError(), buf, false); } } @@ -1193,13 +1197,15 @@ void klassItable::initialize_itable_for_interface(int method_table_offset, Klass // to correctly enforce loader constraints for interface method inheritance target = LinkResolver::lookup_instance_method_in_klasses(_klass, m->name(), m->signature(), CHECK); } - if (target == NULL || !target->is_public() || target->is_abstract()) { - // Entry does not resolve. Leave it empty for AbstractMethodError. - if (!(target == NULL) && !target->is_public()) { - // Stuff an IllegalAccessError throwing method in there instead. - itableOffsetEntry::method_entry(_klass, method_table_offset)[m->itable_index()]. - initialize(Universe::throw_illegal_access_error()); - } + if (target == NULL || !target->is_public() || target->is_abstract() || target->is_overpass()) { + assert(target == NULL || !target->is_overpass() || target->is_public(), + "Non-public overpass method!"); + // Entry does not resolve. Leave it empty for AbstractMethodError or other error. + if (!(target == NULL) && !target->is_public()) { + // Stuff an IllegalAccessError throwing method in there instead. + itableOffsetEntry::method_entry(_klass, method_table_offset)[m->itable_index()]. + initialize(Universe::throw_illegal_access_error()); + } } else { // Entry did resolve, check loader constraints before initializing // if checkconstraints requested @@ -1213,24 +1219,24 @@ void klassItable::initialize_itable_for_interface(int method_table_offset, Klass interface_loader, true, CHECK); if (failed_type_symbol != NULL) { - const char* msg = "loader constraint violation in interface " - "itable initialization: when resolving method \"%s\" the class" - " loader (instance of %s) of the current class, %s, " - "and the class loader (instance of %s) for interface " - "%s have different Class objects for the type %s " - "used in the signature"; - char* sig = target()->name_and_sig_as_C_string(); - const char* loader1 = SystemDictionary::loader_name(method_holder_loader()); + const char* msg = "loader constraint violation in interface itable" + " initialization for class %s: when selecting method \"%s\" the" + " class loader (instance of %s) for super interface %s, and the class" + " loader (instance of %s) of the selected method's type, %s have" + " different Class objects for the type %s used in the signature"; char* current = _klass->name()->as_C_string(); - const char* loader2 = SystemDictionary::loader_name(interface_loader()); + char* sig = m->name_and_sig_as_C_string(); + const char* loader1 = SystemDictionary::loader_name(interface_loader()); char* iface = InstanceKlass::cast(interf)->name()->as_C_string(); + const char* loader2 = SystemDictionary::loader_name(method_holder_loader()); + char* mclass = target()->method_holder()->name()->as_C_string(); char* failed_type_name = failed_type_symbol->as_C_string(); - size_t buflen = strlen(msg) + strlen(sig) + strlen(loader1) + - strlen(current) + strlen(loader2) + strlen(iface) + + size_t buflen = strlen(msg) + strlen(current) + strlen(sig) + + strlen(loader1) + strlen(iface) + strlen(loader2) + strlen(mclass) + strlen(failed_type_name); char* buf = NEW_RESOURCE_ARRAY_IN_THREAD(THREAD, char, buflen); - jio_snprintf(buf, buflen, msg, sig, loader1, current, loader2, - iface, failed_type_name); + jio_snprintf(buf, buflen, msg, current, sig, loader1, iface, + loader2, mclass, failed_type_name); THROW_MSG(vmSymbols::java_lang_LinkageError(), buf); } } diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/common/C.jasm b/test/hotspot/jtreg/runtime/LoaderConstraints/common/C.jasm new file mode 100644 index 00000000000..a7d3f94dffd --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/common/C.jasm @@ -0,0 +1,37 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +// If this file was written in java then some of the tests would fail during +// compilation with errors such as: +// class C inherits unrelated defaults for m() from types I and J +// C is not abstract and does not override abstract method m() in I + +super public class C implements I, J version 52:0 { + + public Method "":"()V" stack 1 locals 1 { + aload_0; + invokespecial Method java/lang/Object."":"()V"; + return; + } + +} // end Class C diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/common/Foo.java b/test/hotspot/jtreg/runtime/LoaderConstraints/common/Foo.java new file mode 100644 index 00000000000..1a82277ad34 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/common/Foo.java @@ -0,0 +1,24 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public class Foo {} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/common/J.java b/test/hotspot/jtreg/runtime/LoaderConstraints/common/J.java new file mode 100644 index 00000000000..e9f58ca2777 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/common/J.java @@ -0,0 +1,26 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public interface J { + public default Foo m() { return null; } +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/common/PreemptingClassLoader.java b/test/hotspot/jtreg/runtime/LoaderConstraints/common/PreemptingClassLoader.java new file mode 100644 index 00000000000..2cc8db0b3ec --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/common/PreemptingClassLoader.java @@ -0,0 +1,59 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +import java.util.*; +import java.io.*; + +public class PreemptingClassLoader extends ClassLoader { + + private final Set names = new HashSet<>(); + + public PreemptingClassLoader(String... names) { + for (String n : names) this.names.add(n); + } + + protected Class loadClass(String name, boolean resolve) throws ClassNotFoundException { + if (!names.contains(name)) return super.loadClass(name, resolve); + Class result = findLoadedClass(name); + if (result == null) { + String filename = name.replace('.', '/') + ".class"; + try (InputStream data = getResourceAsStream(filename)) { + if (data == null) throw new ClassNotFoundException(); + try (ByteArrayOutputStream buffer = new ByteArrayOutputStream()) { + int b; + do { + b = data.read(); + if (b >= 0) buffer.write(b); + } while (b >= 0); + byte[] bytes = buffer.toByteArray(); + result = defineClass(name, bytes, 0, bytes.length); + } + } catch (IOException e) { + throw new ClassNotFoundException("Error reading class file", e); + } + } + if (resolve) resolveClass(result); + return result; + } + +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/I.java b/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/I.java new file mode 100644 index 00000000000..25a6c63acfc --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/I.java @@ -0,0 +1,26 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public interface I { + public default Foo m() { return null; } +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Task.java b/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Task.java new file mode 100644 index 00000000000..144d8514010 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Task.java @@ -0,0 +1,31 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public class Task implements Runnable { + + public void run() { + Class c = Foo.class; // forces PreemptingClassLoader to load Foo + C x = new C(); // should not trigger loader constraints exception + x.m(); + } +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Test.java b/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Test.java new file mode 100644 index 00000000000..3cc83b2351b --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/itableICCE/Test.java @@ -0,0 +1,59 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @bug 8186092 + * @compile ../common/Foo.java + * I.java + * ../common/J.java + * ../common/C.jasm + * Task.java + * ../common/PreemptingClassLoader.java + * @run main/othervm Test + */ + +public class Test { + + // Test that LinkageError exceptions are not thrown during itable creation, + // for loader constraint errors, if the target method is an overpass method. + // + // In this test, during itable creation for class C, method "m()LFoo;" for + // C's super interface I has a different class Foo than the selected method's + // type J. But, the selected method is an overpass method (that throws an + // ICCE). So, no LinkageError exception should be thrown because the loader + // constraint check that would cause the LinkageError should not be done. + public static void main(String... args) throws Exception { + Class c = Foo.class; // forces standard class loader to load Foo + ClassLoader l = new PreemptingClassLoader("Task", "Foo", "C", "I"); + Runnable r = (Runnable) l.loadClass("Task").newInstance(); + try { + r.run(); // Cause an ICCE because both I and J define m()LFoo; + throw new RuntimeException("Expected ICCE exception not thrown"); + } catch (IncompatibleClassChangeError e) { + if (!e.getMessage().contains("Conflicting default methods: I.m J.m")) { + throw new RuntimeException("Wrong ICCE exception thrown: " + e.getMessage()); + } + } + } +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/I.java b/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/I.java new file mode 100644 index 00000000000..97fdaa8830b --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/I.java @@ -0,0 +1,26 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public interface I { + public Foo m(); +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Task.java b/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Task.java new file mode 100644 index 00000000000..6d409023eec --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Task.java @@ -0,0 +1,31 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public class Task implements Runnable { + + public void run() { + Class c = Foo.class; // forces PreemptingClassLoader to load Foo + C x = new C(); // triggers overloading constraints + x.m(); + } +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Test.java b/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Test.java new file mode 100644 index 00000000000..3f2793934c7 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/itableLdrConstraint/Test.java @@ -0,0 +1,60 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @bug 8186092 + * @compile ../common/Foo.java + * ../common/J.java + * I.java + * ../common/C.jasm + * Task.java + * ../common/PreemptingClassLoader.java + * @run main/othervm Test + */ + +public class Test { + + // Test that the error message is correct when a loader constraint error is + // detected during itable creation. + // + // In this test, during itable creation for class C, method "m()LFoo;" for + // C's super interface I has a different class Foo than the selected method's + // type super interface J. The selected method is not an overpass method nor + // otherwise excluded from loader constraint checking. So, a LinkageError + // exception should be thrown because the loader constraint check will fail. + public static void main(String... args) throws Exception { + Class c = Foo.class; // forces standard class loader to load Foo + ClassLoader l = new PreemptingClassLoader("Task", "Foo", "C", "I"); + Runnable r = (Runnable) l.loadClass("Task").newInstance(); + try { + r.run(); + throw new RuntimeException("Expected LinkageError exception not thrown"); + } catch (LinkageError e) { + if (!e.getMessage().contains( + "loader constraint violation in interface itable initialization for class C:")) { + throw new RuntimeException("Wrong LinkageError exception thrown: " + e.getMessage()); + } + } + } +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/I.java b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/I.java new file mode 100644 index 00000000000..f6e47464837 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/I.java @@ -0,0 +1,26 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public interface I extends J { + public Foo m(); +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Task.java b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Task.java new file mode 100644 index 00000000000..ffc2acd8223 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Task.java @@ -0,0 +1,24 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public class Task extends C { } diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Test.java b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Test.java new file mode 100644 index 00000000000..83a5a7f01e7 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableAME/Test.java @@ -0,0 +1,66 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @bug 8186092 + * @compile ../common/Foo.java + * ../common/J.java + * I.java + * ../common/C.jasm + * Task.java + * ../common/PreemptingClassLoader.java + * @run main/othervm Test + */ + +import java.io.PrintStream; +import java.lang.reflect.*; + +public class Test { + + // Test that LinkageError exceptions are not thrown during vtable creation, + // for loader constraint errors, if the target method is an overpass method. + // + // In this test, during vtable creation for class Task, the target method + // "Task.m()LFoo;" is an overpass method (that throws an AME). So, even + // though it is inheriting the method from its super class C, and Task has + // a different class Foo than C, no LinkageError exception should be thrown + // because the loader constraint check that would cause the LinkageError + // should not be done. + public static void main(String args[]) throws Exception { + Class c = Foo.class; // forces standard class loader to load Foo + ClassLoader l = new PreemptingClassLoader("Task", "Foo", "I", "J"); + l.loadClass("Foo"); + l.loadClass("Task").newInstance(); + Task t = new Task(); + try { + t.m(); // Should get AME + throw new RuntimeException("Missing AbstractMethodError exception"); + } catch (AbstractMethodError e) { + if (!e.getMessage().contains("Method Task.m()LFoo; is abstract")) { + throw new RuntimeException("Wrong AME exception thrown: " + e.getMessage()); + } + } + } + +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/I.java b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/I.java new file mode 100644 index 00000000000..f6db30fe83b --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/I.java @@ -0,0 +1,25 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public interface I extends J { +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Task.java b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Task.java new file mode 100644 index 00000000000..d59a7a4fc76 --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Task.java @@ -0,0 +1,30 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public class Task extends C { + + public Foo m() { + return null; + } + +} diff --git a/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Test.java b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Test.java new file mode 100644 index 00000000000..e474c1ee16d --- /dev/null +++ b/test/hotspot/jtreg/runtime/LoaderConstraints/vtableLdrConstraint/Test.java @@ -0,0 +1,63 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @bug 8186092 + * @compile ../common/Foo.java + * ../common/J.java + * I.java + * ../common/C.jasm + * Task.java + * ../common/PreemptingClassLoader.java + * @run main/othervm Test + */ + +public class Test { + + // Test that the error message is correct when a loader constraint error is + // detected during vtable creation. + // + // In this test, during vtable creation for class Task, method "Task.m()LFoo;" + // overrides "J.m()LFoo;". But, Task's class Foo and super type J's class Foo + // are different. So, a LinkageError exception should be thrown because the + // loader constraint check will fail. + public static void main(String args[]) throws Exception { + Class c = Foo.class; // forces standard class loader to load Foo + ClassLoader l = new PreemptingClassLoader("Task", "Foo", "I"); + l.loadClass("Foo"); + try { + l.loadClass("Task").newInstance(); + throw new RuntimeException("Expected LinkageError exception not thrown"); + } catch (LinkageError e) { + if (!e.getMessage().contains( + "loader constraint violation for class Task: when selecting overriding method") || + !e.getMessage().contains( + "for its super type J have different Class objects for the type Foo")) { + throw new RuntimeException("Wrong LinkageError exception thrown: " + e.getMessage()); + } + } + } + +} + From c56b6c1c4f0e601b219b26b08da27157572a6c70 Mon Sep 17 00:00:00 2001 From: Sangheon Kim Date: Thu, 28 Sep 2017 12:13:57 -0700 Subject: [PATCH 19/80] 8186465: Each j.l.Reference elapsed time log is incorrect Fixed wrongly referencing variable and updated regression test to compare each elapsed time vs. sum of those Reviewed-by: stefank, tschatzl --- .../shared/referenceProcessorPhaseTimes.cpp | 2 +- .../jtreg/gc/logging/TestPrintReferences.java | 150 ++++++++++++++---- 2 files changed, 121 insertions(+), 31 deletions(-) diff --git a/src/hotspot/share/gc/shared/referenceProcessorPhaseTimes.cpp b/src/hotspot/share/gc/shared/referenceProcessorPhaseTimes.cpp index 2a026d15275..f0dc927339a 100644 --- a/src/hotspot/share/gc/shared/referenceProcessorPhaseTimes.cpp +++ b/src/hotspot/share/gc/shared/referenceProcessorPhaseTimes.cpp @@ -272,7 +272,7 @@ ReferenceProcessorPhaseTimes::~ReferenceProcessorPhaseTimes() { double ReferenceProcessorPhaseTimes::ref_proc_time_ms(ReferenceType ref_type) const { ASSERT_REF_TYPE(ref_type); - return _par_phase_time_ms[ref_type_2_index(ref_type)]; + return _ref_proc_time_ms[ref_type_2_index(ref_type)]; } void ReferenceProcessorPhaseTimes::set_ref_proc_time_ms(ReferenceType ref_type, diff --git a/test/hotspot/jtreg/gc/logging/TestPrintReferences.java b/test/hotspot/jtreg/gc/logging/TestPrintReferences.java index 2a1bb194b6d..f6ab7de5cfe 100644 --- a/test/hotspot/jtreg/gc/logging/TestPrintReferences.java +++ b/test/hotspot/jtreg/gc/logging/TestPrintReferences.java @@ -23,7 +23,7 @@ /* * @test TestPrintReferences - * @bug 8136991 8186402 + * @bug 8136991 8186402 8186465 * @summary Validate the reference processing logging * @key gc * @library /test/lib @@ -36,36 +36,58 @@ import java.util.ArrayList; import jdk.test.lib.process.OutputAnalyzer; import jdk.test.lib.process.ProcessTools; +import java.util.regex.Pattern; +import java.util.regex.Matcher; public class TestPrintReferences { + static String output; + static final String doubleRegex = "[0-9]+[.,][0-9]+"; + static final String referenceProcessing = "Reference Processing"; + static final String softReference = "SoftReference"; + static final String weakReference = "WeakReference"; + static final String finalReference = "FinalReference"; + static final String phantomReference = "PhantomReference"; + static final String phase1 = "Phase1"; + static final String phase2 = "Phase2"; + static final String phase3 = "Phase3"; + static final String gcLogTimeRegex = ".* GC\\([0-9]+\\) "; + public static void main(String[] args) throws Exception { ProcessBuilder pb_enabled = ProcessTools.createJavaProcessBuilder("-Xlog:gc+phases+ref=debug", "-XX:+UseG1GC", - "-Xmx10M", + "-Xmx32M", // Explicit thread setting is required to avoid using only 1 thread "-XX:ParallelGCThreads=2", GCTest.class.getName()); OutputAnalyzer output = new OutputAnalyzer(pb_enabled.start()); - String indent_4 = " "; - String indent_6 = " "; - String indent_8 = " "; - String gcLogTimeRegex = ".* GC\\([0-9]+\\) "; + checkLogFormat(output); + checkLogValue(output); + + output.shouldHaveExitValue(0); + } + + static String indent(int count) { + return " {" + count + "}"; + } + + // Find the first Reference Processing log and check its format. + public static void checkLogFormat(OutputAnalyzer output) { String countRegex = "[0-9]+"; - String timeRegex = "[0-9]+[.,][0-9]+ms"; - String totalRegex = gcLogTimeRegex + indent_4 + "Reference Processing: " + timeRegex + "\n"; - String balanceRegex = gcLogTimeRegex + indent_8 + "Balance queues: " + timeRegex + "\n"; - String softRefRegex = gcLogTimeRegex + indent_6 + "SoftReference: " + timeRegex + "\n"; - String weakRefRegex = gcLogTimeRegex + indent_6 + "WeakReference: " + timeRegex + "\n"; - String finalRefRegex = gcLogTimeRegex + indent_6 + "FinalReference: " + timeRegex + "\n"; - String phantomRefRegex = gcLogTimeRegex + indent_6 + "PhantomReference: " + timeRegex + "\n"; - String refDetailRegex = gcLogTimeRegex + indent_8 + "Phase2: " + timeRegex + "\n" + - gcLogTimeRegex + indent_8 + "Phase3: " + timeRegex + "\n" + - gcLogTimeRegex + indent_8 + "Discovered: " + countRegex + "\n" + - gcLogTimeRegex + indent_8 + "Cleared: " + countRegex + "\n"; - String softRefDetailRegex = gcLogTimeRegex + indent_8 + "Phase1: " + timeRegex + "\n" + refDetailRegex; - String enqueueRegex = gcLogTimeRegex + indent_4 + "Reference Enqueuing: " + timeRegex + "\n"; - String enqueueDetailRegex = gcLogTimeRegex + indent_6 + "Reference Counts: Soft: " + countRegex + + String timeRegex = doubleRegex + "ms"; + String totalRegex = gcLogTimeRegex + indent(4) + referenceProcessing + ": " + timeRegex + "\n"; + String balanceRegex = gcLogTimeRegex + indent(8) + "Balance queues: " + timeRegex + "\n"; + String softRefRegex = gcLogTimeRegex + indent(6) + softReference + ": " + timeRegex + "\n"; + String weakRefRegex = gcLogTimeRegex + indent(6) + weakReference + ": " + timeRegex + "\n"; + String finalRefRegex = gcLogTimeRegex + indent(6) + finalReference + ": " + timeRegex + "\n"; + String phantomRefRegex = gcLogTimeRegex + indent(6) + phantomReference + ": " + timeRegex + "\n"; + String refDetailRegex = gcLogTimeRegex + indent(8) + phase2 + ": " + timeRegex + "\n" + + gcLogTimeRegex + indent(8) + phase3 + ": " + timeRegex + "\n" + + gcLogTimeRegex + indent(8) + "Discovered: " + countRegex + "\n" + + gcLogTimeRegex + indent(8) + "Cleared: " + countRegex + "\n"; + String softRefDetailRegex = gcLogTimeRegex + indent(8) + phase1 + ": " + timeRegex + "\n" + refDetailRegex; + String enqueueRegex = gcLogTimeRegex + indent(4) + "Reference Enqueuing: " + timeRegex + "\n"; + String enqueueDetailRegex = gcLogTimeRegex + indent(6) + "Reference Counts: Soft: " + countRegex + " Weak: " + countRegex + " Final: " + countRegex + " Phantom: " + countRegex + "\n"; output.shouldMatch(/* Total Reference processing time */ @@ -83,22 +105,90 @@ public class TestPrintReferences { /* Enqueued Stats */ enqueueDetailRegex ); + } - output.shouldHaveExitValue(0); + // After getting time value, update 'output' for next use. + public static double getTimeValue(String name, int indentCount) { + // Pattern of 'name', 'value' and some extra strings. + String patternString = gcLogTimeRegex + indent(indentCount) + name + ": " + "(" + doubleRegex + ")"; + Matcher m = Pattern.compile(patternString).matcher(output); + if (!m.find()) { + throw new RuntimeException("Could not find time log for " + patternString); + } + + String match = m.group(); + String value = m.group(1); + + double result = Double.parseDouble(value); + + int index = output.indexOf(match); + if (index != -1) { + output = output.substring(index, output.length()); + } + + return result; + } + + // Reference log is printing 1 decimal place of elapsed time. + // So sum of each sub-phases could be slightly larger than the enclosing phase in some cases. + // As the maximum of sub-phases is 3, allow 0.1 of TOLERANCE. + // e.g. Actual value: SoftReference(5.55) = phase1(1.85) + phase2(1.85) + phase3(1.85) + // Log value: SoftReference(5.6) = phase1(1.9) + phase2(1.9) + phase3(1.9) + // When checked: 5.6 < 5.7 (sum of phase1~3) + public static boolean approximatelyEqual(double a, double b) { + final double TOLERANCE = 0.1; + + return Math.abs(a - b) <= TOLERANCE; + } + + // Return false, if 'total' is larger and not approximately equal to 'refTime'. + public static boolean compare(double refTime, double total) { + return (refTime < total) && (!approximatelyEqual(refTime, total)); + } + + public static double checkRefTime(String refType) { + double refTime = getTimeValue(refType, 2); + double total = 0.0; + + if (softReference.equals(refType)) { + total += getTimeValue(phase1, 4); + } + total += getTimeValue(phase2, 4); + total += getTimeValue(phase3, 4); + + if (compare(refTime, total)) { + throw new RuntimeException(refType +" time(" + refTime + + "ms) is less than the sum(" + total + "ms) of each phases"); + } + + return refTime; + } + + // Find the first concurrent Reference Processing log and compare sub-time vs. total. + public static void checkLogValue(OutputAnalyzer out) { + output = out.getStdout(); + + double refProcTime = getTimeValue(referenceProcessing, 0); + + double total = 0.0; + total += checkRefTime(softReference); + total += checkRefTime(weakReference); + total += checkRefTime(finalReference); + total += checkRefTime(phantomReference); + + if (compare(refProcTime, total)) { + throw new RuntimeException("Reference Processing time(" + refProcTime + "ms) is less than the sum(" + + total + "ms) of each phases"); + } } static class GCTest { - static final int M = 1024 * 1024; + static final int SIZE = 512 * 1024; + static Object[] dummy = new Object[SIZE]; public static void main(String [] args) { - - ArrayList arrSoftRefs = new ArrayList(); - - // Populate to triger GC and then Reference related logs will be printed. - for (int i = 0; i < 10; i++) { - byte[] tmp = new byte[M]; - - arrSoftRefs.add(new SoftReference(tmp)); + for (int i = 0; i < SIZE; i++) { + dummy[i] = new SoftReference<>(new Object()); } } } From d72e093a748c25bc50792d8457b0786c987c72dc Mon Sep 17 00:00:00 2001 From: Jaroslav Tulach Date: Thu, 28 Sep 2017 13:52:15 -0700 Subject: [PATCH 20/80] 8182701: Modify JVMCI to allow Graal Compiler to expose platform MBean Reviewed-by: dnsimon, kvn, alanb, mchung, dfuchs --- make/common/Modules.gmk | 2 + .../share/classes/module-info.java | 3 +- .../share/classes/module-info.java | 3 + .../share/classes/module-info.java | 41 +++++++++ .../compiler/hotspot/jmx/GraalMBeans.java | 91 +++++++++++++++++++ .../share/classes/module-info.java | 4 +- .../hotspot/HotSpotGraalCompiler.java | 7 ++ .../compiler/hotspot/HotSpotGraalRuntime.java | 4 + 8 files changed, 153 insertions(+), 2 deletions(-) create mode 100644 src/jdk.internal.vm.compiler.management/share/classes/module-info.java create mode 100644 src/jdk.internal.vm.compiler.management/share/classes/org/graalvm/compiler/hotspot/jmx/GraalMBeans.java diff --git a/make/common/Modules.gmk b/make/common/Modules.gmk index ee697971a2d..736e0607725 100644 --- a/make/common/Modules.gmk +++ b/make/common/Modules.gmk @@ -113,6 +113,7 @@ PLATFORM_MODULES += \ jdk.crypto.ec \ jdk.dynalink \ jdk.incubator.httpclient \ + jdk.internal.vm.compiler.management \ jdk.jsobject \ jdk.localedata \ jdk.naming.dns \ @@ -215,6 +216,7 @@ endif ifeq ($(INCLUDE_GRAAL), false) MODULES_FILTER += jdk.internal.vm.compiler + MODULES_FILTER += jdk.internal.vm.compiler.management endif ################################################################################ diff --git a/src/java.management/share/classes/module-info.java b/src/java.management/share/classes/module-info.java index 2b2054cb724..26f34ba21b9 100644 --- a/src/java.management/share/classes/module-info.java +++ b/src/java.management/share/classes/module-info.java @@ -64,7 +64,8 @@ module java.management { exports sun.management.counter.perf to jdk.management.agent; exports sun.management.spi to - jdk.management; + jdk.management, + jdk.internal.vm.compiler.management; uses javax.management.remote.JMXConnectorProvider; uses javax.management.remote.JMXConnectorServerProvider; diff --git a/src/jdk.internal.vm.ci/share/classes/module-info.java b/src/jdk.internal.vm.ci/share/classes/module-info.java index e6001b18f37..fca5828dd06 100644 --- a/src/jdk.internal.vm.ci/share/classes/module-info.java +++ b/src/jdk.internal.vm.ci/share/classes/module-info.java @@ -25,6 +25,9 @@ module jdk.internal.vm.ci { exports jdk.vm.ci.services to jdk.internal.vm.compiler; + exports jdk.vm.ci.runtime to + jdk.internal.vm.compiler, + jdk.internal.vm.compiler.management; uses jdk.vm.ci.services.JVMCIServiceLocator; uses jdk.vm.ci.hotspot.HotSpotJVMCIBackendFactory; diff --git a/src/jdk.internal.vm.compiler.management/share/classes/module-info.java b/src/jdk.internal.vm.compiler.management/share/classes/module-info.java new file mode 100644 index 00000000000..328648d4456 --- /dev/null +++ b/src/jdk.internal.vm.compiler.management/share/classes/module-info.java @@ -0,0 +1,41 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. Oracle designates this + * particular file as subject to the "Classpath" exception as provided + * by Oracle in the LICENSE file that accompanied this code. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/** + * Registers Graal Compiler specific management interfaces for the JVM. + * + * @moduleGraph + * @since 10 + */ +module jdk.internal.vm.compiler.management { + requires java.management; + requires jdk.management; + requires jdk.internal.vm.ci; + requires jdk.internal.vm.compiler; + + provides sun.management.spi.PlatformMBeanProvider with + org.graalvm.compiler.hotspot.jmx.GraalMBeans; +} + diff --git a/src/jdk.internal.vm.compiler.management/share/classes/org/graalvm/compiler/hotspot/jmx/GraalMBeans.java b/src/jdk.internal.vm.compiler.management/share/classes/org/graalvm/compiler/hotspot/jmx/GraalMBeans.java new file mode 100644 index 00000000000..0161f92a216 --- /dev/null +++ b/src/jdk.internal.vm.compiler.management/share/classes/org/graalvm/compiler/hotspot/jmx/GraalMBeans.java @@ -0,0 +1,91 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ +package org.graalvm.compiler.hotspot.jmx; + +import java.util.ArrayList; +import java.util.Collections; +import java.util.List; +import java.util.Map; +import java.util.Set; +import jdk.vm.ci.runtime.JVMCI; +import jdk.vm.ci.runtime.JVMCICompiler; +import jdk.vm.ci.runtime.JVMCIRuntime; +import org.graalvm.compiler.hotspot.HotSpotGraalCompiler; +import sun.management.spi.PlatformMBeanProvider; +import sun.management.spi.PlatformMBeanProvider.PlatformComponent; + +public final class GraalMBeans extends PlatformMBeanProvider { + @Override + public List> getPlatformComponentList() { + List> components = new ArrayList<>(); + try { + Object bean = findGraalRuntimeBean(); + if (bean != null) { + components.add(new HotSpotRuntimeMBeanComponent(bean)); + } + } catch (InternalError | LinkageError err) { + // go on and ignore + } + return components; + } + + public static Object findGraalRuntimeBean() { + JVMCIRuntime r = JVMCI.getRuntime(); + JVMCICompiler c = r.getCompiler(); + if (c instanceof HotSpotGraalCompiler) { + return ((HotSpotGraalCompiler) c).mbean(); + } + return null; + } + + private static final class HotSpotRuntimeMBeanComponent implements PlatformComponent { + + private final String name; + private final Object mbean; + + HotSpotRuntimeMBeanComponent(Object mbean) { + this.name = "org.graalvm.compiler.hotspot:type=Options"; + this.mbean = mbean; + } + + @Override + public Set> mbeanInterfaces() { + return Collections.emptySet(); + } + + @Override + public Set mbeanInterfaceNames() { + return Collections.emptySet(); + } + + @Override + public String getObjectNamePattern() { + return name; + } + + @Override + public Map nameToMBeanMap() { + return Collections.singletonMap(name, mbean); + } + } +} diff --git a/src/jdk.internal.vm.compiler/share/classes/module-info.java b/src/jdk.internal.vm.compiler/share/classes/module-info.java index 0cae4bc22d9..44c1259646d 100644 --- a/src/jdk.internal.vm.compiler/share/classes/module-info.java +++ b/src/jdk.internal.vm.compiler/share/classes/module-info.java @@ -50,7 +50,9 @@ module jdk.internal.vm.compiler { exports org.graalvm.compiler.core.target to jdk.aot; exports org.graalvm.compiler.debug to jdk.aot; exports org.graalvm.compiler.graph to jdk.aot; - exports org.graalvm.compiler.hotspot to jdk.aot; + exports org.graalvm.compiler.hotspot to + jdk.aot, + jdk.internal.vm.compiler.management; exports org.graalvm.compiler.hotspot.meta to jdk.aot; exports org.graalvm.compiler.hotspot.replacements to jdk.aot; exports org.graalvm.compiler.hotspot.stubs to jdk.aot; diff --git a/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalCompiler.java b/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalCompiler.java index 489bbd73f5f..c77d3eebf18 100644 --- a/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalCompiler.java +++ b/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalCompiler.java @@ -282,6 +282,13 @@ public class HotSpotGraalCompiler implements GraalJVMCICompiler { return suite; } + public Object mbean() { + if (graalRuntime instanceof HotSpotGraalRuntime) { + return ((HotSpotGraalRuntime)graalRuntime).mbean(); + } + return null; + } + /** * Converts {@code method} to a String with {@link JavaMethod#format(String)} and the format * string {@code "%H.%n(%p)"}. diff --git a/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalRuntime.java b/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalRuntime.java index 3e433b13378..c56d8105219 100644 --- a/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalRuntime.java +++ b/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/HotSpotGraalRuntime.java @@ -316,4 +316,8 @@ public final class HotSpotGraalRuntime implements HotSpotGraalRuntimeProvider { public Map getCompilationProblemsPerAction() { return compilationProblemsPerAction; } + + final Object mbean() { + return mBean; + } } From 9f006db9f83899dab7d757065ffb1633d22c3d9e Mon Sep 17 00:00:00 2001 From: Igor Ignatyev Date: Fri, 1 Sep 2017 15:28:54 -0700 Subject: [PATCH 21/80] 8187020: AOT tests should not fail if devkit dependency isn't resolved Reviewed-by: kvn --- .../jtreg/compiler/aot/AotCompiler.java | 38 ++++++++++++++++--- 1 file changed, 32 insertions(+), 6 deletions(-) diff --git a/test/hotspot/jtreg/compiler/aot/AotCompiler.java b/test/hotspot/jtreg/compiler/aot/AotCompiler.java index 9a3654b1355..5c230309013 100644 --- a/test/hotspot/jtreg/compiler/aot/AotCompiler.java +++ b/test/hotspot/jtreg/compiler/aot/AotCompiler.java @@ -145,13 +145,37 @@ public class AotCompiler { + " [-compile ]* [-extraopt ]*"); } + // runs ld -v (or ld -V on solaris) and check its exit code + private static boolean checkLd(Path bin) { + try { + return 0 == ProcessTools.executeCommand(bin.toString(), + Platform.isSolaris() ? "-V" : "-v") + .getExitValue(); + } catch (Throwable t) { + // any errors mean ld doesn't work + return false; + } + } + public static String resolveLinker() { Path linker = null; - // 1st, check if PATH has ld - for (String path : System.getenv("PATH").split(File.pathSeparator)) { - if (Files.exists(Paths.get(path).resolve("ld"))) { - // there is ld in PATH, jaotc is supposed to find it by its own - return null; + // if non windows, 1st, check if PATH has ld + if (!Platform.isWindows()) { + String bin = "ld"; + for (String path : System.getenv("PATH").split(File.pathSeparator)) { + Path ld = Paths.get(path).resolve("ld"); + if (Files.exists(ld)) { + // there is ld in PATH + if (checkLd(ld)) { + System.out.println("found working linker: " + ld); + // ld works, jaotc is supposed to find and use it + return null; + } else { + System.out.println("found broken linker: " + ld); + // ld exists in PATH, but doesn't work, have to use devkit + break; + } + } } } // there is no ld in PATH, will use ld from devkit @@ -275,7 +299,9 @@ public class AotCompiler { } } } catch (FileNotFoundException e) { - throw new Error("artifact resolution error: " + e, e); + System.err.println("artifact resolution error: " + e); + // let jaotc try to find linker + return null; } if (linker != null) { return linker.toAbsolutePath().toString(); From 12a11f2c65432bc88cab3e74173bef3d736b0cde Mon Sep 17 00:00:00 2001 From: Yasumasa Suenaga Date: Fri, 29 Sep 2017 20:57:48 +0900 Subject: [PATCH 22/80] 8175816: SA: HSDB: Compute Liveness results in java.lang.IndexOutOfBoundsException Reviewed-by: sspitsyn, jgeorge --- .../sun/jvm/hotspot/oops/ConstantPool.java | 9 +- .../sa/TestRevPtrsForInvokeDynamic.java | 105 ++++++++++++++++++ 2 files changed, 109 insertions(+), 5 deletions(-) create mode 100644 test/hotspot/jtreg/serviceability/sa/TestRevPtrsForInvokeDynamic.java diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/ConstantPool.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/ConstantPool.java index c7285ed316d..b81b01b3881 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/ConstantPool.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/ConstantPool.java @@ -269,13 +269,12 @@ public class ConstantPool extends Metadata implements ClassConstants { public static int decodeInvokedynamicIndex(int i) { Assert.that(isInvokedynamicIndex(i), ""); return ~i; } - // The invokedynamic points at the object index. The object map points at - // the cpCache index and the cpCache entry points at the original constant - // pool index. + // The invokedynamic points at a CP cache entry. This entry points back + // at the original CP entry (CONSTANT_InvokeDynamic) and also (via f2) at an entry + // in the resolved_references array (which provides the appendix argument). public int invokedynamicCPCacheIndex(int index) { Assert.that(isInvokedynamicIndex(index), "should be a invokedynamic index"); - int rawIndex = decodeInvokedynamicIndex(index); - return referenceMap().at(rawIndex); + return decodeInvokedynamicIndex(index); } ConstantPoolCacheEntry invokedynamicCPCacheEntryAt(int index) { diff --git a/test/hotspot/jtreg/serviceability/sa/TestRevPtrsForInvokeDynamic.java b/test/hotspot/jtreg/serviceability/sa/TestRevPtrsForInvokeDynamic.java new file mode 100644 index 00000000000..4936e90cd31 --- /dev/null +++ b/test/hotspot/jtreg/serviceability/sa/TestRevPtrsForInvokeDynamic.java @@ -0,0 +1,105 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +import java.util.ArrayList; +import java.util.List; + +import sun.jvm.hotspot.HotSpotAgent; +import sun.jvm.hotspot.utilities.ReversePtrsAnalysis; + +import jdk.test.lib.apps.LingeredApp; +import jdk.test.lib.Asserts; +import jdk.test.lib.JDKToolFinder; +import jdk.test.lib.JDKToolLauncher; +import jdk.test.lib.Platform; +import jdk.test.lib.process.OutputAnalyzer; +import jdk.test.lib.process.ProcessTools; +import jdk.test.lib.Utils; + +/* + * @test + * @library /test/lib + * @requires os.family != "mac" + * @modules java.base/jdk.internal.misc + * jdk.hotspot.agent/sun.jvm.hotspot + * jdk.hotspot.agent/sun.jvm.hotspot.utilities + * @run main/othervm TestRevPtrsForInvokeDynamic + */ + +public class TestRevPtrsForInvokeDynamic { + + private static LingeredAppWithInvokeDynamic theApp = null; + + private static void computeReversePointers(String pid) throws Exception { + HotSpotAgent agent = new HotSpotAgent(); + + try { + agent.attach(Integer.parseInt(pid)); + ReversePtrsAnalysis analysis = new ReversePtrsAnalysis(); + analysis.run(); + } finally { + agent.detach(); + } + } + + private static void createAnotherToAttach(long lingeredAppPid) + throws Exception { + String[] toolArgs = { + "--add-modules=jdk.hotspot.agent", + "--add-exports=jdk.hotspot.agent/sun.jvm.hotspot=ALL-UNNAMED", + "--add-exports=jdk.hotspot.agent/sun.jvm.hotspot.utilities=ALL-UNNAMED", + "TestRevPtrsForInvokeDynamic", + Long.toString(lingeredAppPid) + }; + + // Start a new process to attach to the lingered app + ProcessBuilder processBuilder = ProcessTools.createJavaProcessBuilder(toolArgs); + OutputAnalyzer SAOutput = ProcessTools.executeProcess(processBuilder); + SAOutput.shouldHaveExitValue(0); + System.out.println(SAOutput.getOutput()); + } + + public static void main (String... args) throws Exception { + if (!Platform.shouldSAAttach()) { + System.out.println( + "SA attach not expected to work - test skipped."); + return; + } + + if (args == null || args.length == 0) { + try { + List vmArgs = new ArrayList(); + vmArgs.add("-XX:+UsePerfData"); + vmArgs.addAll(Utils.getVmOptions()); + + theApp = new LingeredAppWithInvokeDynamic(); + LingeredApp.startApp(vmArgs, theApp); + createAnotherToAttach(theApp.getPid()); + } finally { + LingeredApp.stopApp(theApp); + } + } else { + computeReversePointers(args[0]); + } + } +} From b787f1b55b30059da46b74733be0841325ad7c5f Mon Sep 17 00:00:00 2001 From: Dmitrij Pochepko Date: Mon, 2 Oct 2017 17:20:14 +0300 Subject: [PATCH 23/80] 8186915: AARCH64: Intrinsify squareToLen and mulAdd Reviewed-by: aph --- .../cpu/aarch64/macroAssembler_aarch64.cpp | 38 +++++++++++ .../cpu/aarch64/macroAssembler_aarch64.hpp | 1 + .../cpu/aarch64/stubGenerator_aarch64.cpp | 65 +++++++++++++++++++ .../cpu/aarch64/vm_version_aarch64.cpp | 8 +++ 4 files changed, 112 insertions(+) diff --git a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp index 78637f21dc1..c83f894c13e 100644 --- a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp +++ b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp @@ -2840,6 +2840,44 @@ void MacroAssembler::multiply_to_len(Register x, Register xlen, Register y, Regi bind(L_done); } +// Code for BigInteger::mulAdd instrinsic +// out = r0 +// in = r1 +// offset = r2 (already out.length-offset) +// len = r3 +// k = r4 +// +// pseudo code from java implementation: +// carry = 0; +// offset = out.length-offset - 1; +// for (int j=len-1; j >= 0; j--) { +// product = (in[j] & LONG_MASK) * kLong + (out[offset] & LONG_MASK) + carry; +// out[offset--] = (int)product; +// carry = product >>> 32; +// } +// return (int)carry; +void MacroAssembler::mul_add(Register out, Register in, Register offset, + Register len, Register k) { + Label LOOP, END; + // pre-loop + cmp(len, zr); // cmp, not cbz/cbnz: to use condition twice => less branches + csel(out, zr, out, Assembler::EQ); + br(Assembler::EQ, END); + add(in, in, len, LSL, 2); // in[j+1] address + add(offset, out, offset, LSL, 2); // out[offset + 1] address + mov(out, zr); // used to keep carry now + BIND(LOOP); + ldrw(rscratch1, Address(pre(in, -4))); + madd(rscratch1, rscratch1, k, out); + ldrw(rscratch2, Address(pre(offset, -4))); + add(rscratch1, rscratch1, rscratch2); + strw(rscratch1, Address(offset)); + lsr(out, rscratch1, 32); + subs(len, len, 1); + br(Assembler::NE, LOOP); + BIND(END); +} + /** * Emits code to update CRC-32 with a byte value according to constants in table * diff --git a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.hpp b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.hpp index a3a3c74c626..d0ca968bd44 100644 --- a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.hpp +++ b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.hpp @@ -1265,6 +1265,7 @@ public: void multiply_to_len(Register x, Register xlen, Register y, Register ylen, Register z, Register zlen, Register tmp1, Register tmp2, Register tmp3, Register tmp4, Register tmp5, Register tmp6, Register tmp7); + void mul_add(Register out, Register in, Register offs, Register len, Register k); // ISB may be needed because of a safepoint void maybe_isb() { isb(); } diff --git a/src/hotspot/cpu/aarch64/stubGenerator_aarch64.cpp b/src/hotspot/cpu/aarch64/stubGenerator_aarch64.cpp index e6e79a468d2..d9c2cdc4a52 100644 --- a/src/hotspot/cpu/aarch64/stubGenerator_aarch64.cpp +++ b/src/hotspot/cpu/aarch64/stubGenerator_aarch64.cpp @@ -3607,6 +3607,63 @@ class StubGenerator: public StubCodeGenerator { return start; } + address generate_squareToLen() { + // squareToLen algorithm for sizes 1..127 described in java code works + // faster than multiply_to_len on some CPUs and slower on others, but + // multiply_to_len shows a bit better overall results + __ align(CodeEntryAlignment); + StubCodeMark mark(this, "StubRoutines", "squareToLen"); + address start = __ pc(); + + const Register x = r0; + const Register xlen = r1; + const Register z = r2; + const Register zlen = r3; + const Register y = r4; // == x + const Register ylen = r5; // == xlen + + const Register tmp1 = r10; + const Register tmp2 = r11; + const Register tmp3 = r12; + const Register tmp4 = r13; + const Register tmp5 = r14; + const Register tmp6 = r15; + const Register tmp7 = r16; + + RegSet spilled_regs = RegSet::of(y, ylen); + BLOCK_COMMENT("Entry:"); + __ enter(); + __ push(spilled_regs, sp); + __ mov(y, x); + __ mov(ylen, xlen); + __ multiply_to_len(x, xlen, y, ylen, z, zlen, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7); + __ pop(spilled_regs, sp); + __ leave(); + __ ret(lr); + return start; + } + + address generate_mulAdd() { + __ align(CodeEntryAlignment); + StubCodeMark mark(this, "StubRoutines", "mulAdd"); + + address start = __ pc(); + + const Register out = r0; + const Register in = r1; + const Register offset = r2; + const Register len = r3; + const Register k = r4; + + BLOCK_COMMENT("Entry:"); + __ enter(); + __ mul_add(out, in, offset, len, k); + __ leave(); + __ ret(lr); + + return start; + } + void ghash_multiply(FloatRegister result_lo, FloatRegister result_hi, FloatRegister a, FloatRegister b, FloatRegister a1_xor_a0, FloatRegister tmp1, FloatRegister tmp2, FloatRegister tmp3, FloatRegister tmp4) { @@ -4913,6 +4970,14 @@ class StubGenerator: public StubCodeGenerator { StubRoutines::_multiplyToLen = generate_multiplyToLen(); } + if (UseSquareToLenIntrinsic) { + StubRoutines::_squareToLen = generate_squareToLen(); + } + + if (UseMulAddIntrinsic) { + StubRoutines::_mulAdd = generate_mulAdd(); + } + if (UseMontgomeryMultiplyIntrinsic) { StubCodeMark mark(this, "StubRoutines", "montgomeryMultiply"); MontgomeryMultiplyGenerator g(_masm, /*squaring*/false); diff --git a/src/hotspot/cpu/aarch64/vm_version_aarch64.cpp b/src/hotspot/cpu/aarch64/vm_version_aarch64.cpp index 722ebbba322..8480e4e8e71 100644 --- a/src/hotspot/cpu/aarch64/vm_version_aarch64.cpp +++ b/src/hotspot/cpu/aarch64/vm_version_aarch64.cpp @@ -340,6 +340,14 @@ void VM_Version::get_processor_features() { UseMultiplyToLenIntrinsic = true; } + if (FLAG_IS_DEFAULT(UseSquareToLenIntrinsic)) { + UseSquareToLenIntrinsic = true; + } + + if (FLAG_IS_DEFAULT(UseMulAddIntrinsic)) { + UseMulAddIntrinsic = true; + } + if (FLAG_IS_DEFAULT(UseBarriersForVolatile)) { UseBarriersForVolatile = (_features & CPU_DMB_ATOMICS) != 0; } From 853f26ed15adb2e2bf8435e1d9e390eadbacee6f Mon Sep 17 00:00:00 2001 From: Ekaterina Pavlova Date: Mon, 2 Oct 2017 14:31:34 -0700 Subject: [PATCH 24/80] 8185134: [Graal] Introduce vm.graal predicate and tag tests which are not applicable for Graal Reviewed-by: kvn, dnsimon --- test/hotspot/jtreg/TEST.ROOT | 3 +- .../arraycopy/TestArrayCopyNoInitDeopt.java | 2 +- .../jtreg/compiler/c2/Test8004741.java | 1 + .../jcmd/PrintDirectivesTest.java | 2 +- .../logcompilation/LogTest.java | 2 + .../TestAESIntrinsicsOnSupportedConfig.java | 2 +- .../intrinsics/IntrinsicDisabledTest.java | 2 + .../klass/CastNullCheckDroppingsTest.java | 2 +- .../UseCountedLoopSafepointsTest.java | 2 +- test/jtreg-ext/requires/VMProps.java | 37 +++++++++++++++++++ 10 files changed, 49 insertions(+), 6 deletions(-) diff --git a/test/hotspot/jtreg/TEST.ROOT b/test/hotspot/jtreg/TEST.ROOT index 1fcc8610f36..ea7ebb451ee 100644 --- a/test/hotspot/jtreg/TEST.ROOT +++ b/test/hotspot/jtreg/TEST.ROOT @@ -52,7 +52,8 @@ requires.properties= \ vm.rtm.cpu \ vm.rtm.os \ vm.aot \ - vm.cds + vm.cds \ + vm.graal.enabled # Minimum jtreg version requiredVersion=4.2 b08 diff --git a/test/hotspot/jtreg/compiler/arraycopy/TestArrayCopyNoInitDeopt.java b/test/hotspot/jtreg/compiler/arraycopy/TestArrayCopyNoInitDeopt.java index 023bd266f31..34ff2e13393 100644 --- a/test/hotspot/jtreg/compiler/arraycopy/TestArrayCopyNoInitDeopt.java +++ b/test/hotspot/jtreg/compiler/arraycopy/TestArrayCopyNoInitDeopt.java @@ -25,7 +25,7 @@ * @test * @bug 8072016 * @summary Infinite deoptimization/recompilation cycles in case of arraycopy with tightly coupled allocation - * @requires vm.flavor == "server" & !vm.emulatedClient + * @requires vm.flavor == "server" & !vm.emulatedClient & !vm.graal.enabled * @library /test/lib / * @modules java.base/jdk.internal.misc * java.management diff --git a/test/hotspot/jtreg/compiler/c2/Test8004741.java b/test/hotspot/jtreg/compiler/c2/Test8004741.java index f52a68e0090..69d2ad9f0bd 100644 --- a/test/hotspot/jtreg/compiler/c2/Test8004741.java +++ b/test/hotspot/jtreg/compiler/c2/Test8004741.java @@ -26,6 +26,7 @@ * @bug 8004741 * @summary Missing compiled exception handle table entry for multidimensional array allocation * + * @requires !vm.graal.enabled * @run main/othervm -Xmx64m -Xbatch -XX:+IgnoreUnrecognizedVMOptions -XX:+UnlockDiagnosticVMOptions * -XX:-TieredCompilation -XX:+StressCompiledExceptionHandlers * -XX:+SafepointALot -XX:GuaranteedSafepointInterval=100 diff --git a/test/hotspot/jtreg/compiler/compilercontrol/jcmd/PrintDirectivesTest.java b/test/hotspot/jtreg/compiler/compilercontrol/jcmd/PrintDirectivesTest.java index 335e89c6668..2f8f4abc9f4 100644 --- a/test/hotspot/jtreg/compiler/compilercontrol/jcmd/PrintDirectivesTest.java +++ b/test/hotspot/jtreg/compiler/compilercontrol/jcmd/PrintDirectivesTest.java @@ -27,7 +27,7 @@ * @summary Tests jcmd to be able to add a directive to compile only specified methods * @modules java.base/jdk.internal.misc * @library /test/lib / - * @requires vm.flavor != "minimal" + * @requires vm.flavor != "minimal" & !vm.graal.enabled * * @build sun.hotspot.WhiteBox * @run driver ClassFileInstaller sun.hotspot.WhiteBox diff --git a/test/hotspot/jtreg/compiler/compilercontrol/logcompilation/LogTest.java b/test/hotspot/jtreg/compiler/compilercontrol/logcompilation/LogTest.java index b681029061a..97650e9fbf6 100644 --- a/test/hotspot/jtreg/compiler/compilercontrol/logcompilation/LogTest.java +++ b/test/hotspot/jtreg/compiler/compilercontrol/logcompilation/LogTest.java @@ -25,6 +25,8 @@ * @test * @bug 8137167 * @summary Tests LogCompilation executed standalone without log commands or directives + * + * @requires !vm.graal.enabled * @modules java.base/jdk.internal.misc * @library /test/lib / * diff --git a/test/hotspot/jtreg/compiler/cpuflags/TestAESIntrinsicsOnSupportedConfig.java b/test/hotspot/jtreg/compiler/cpuflags/TestAESIntrinsicsOnSupportedConfig.java index b4f62daa762..ac17e567b09 100644 --- a/test/hotspot/jtreg/compiler/cpuflags/TestAESIntrinsicsOnSupportedConfig.java +++ b/test/hotspot/jtreg/compiler/cpuflags/TestAESIntrinsicsOnSupportedConfig.java @@ -26,7 +26,7 @@ * @library /test/lib / * @modules java.base/jdk.internal.misc * java.management - * @requires vm.cpu.features ~= ".*aes.*" + * @requires vm.cpu.features ~= ".*aes.*" & !vm.graal.enabled * @build sun.hotspot.WhiteBox * @run driver ClassFileInstaller sun.hotspot.WhiteBox * sun.hotspot.WhiteBox$WhiteBoxPermission diff --git a/test/hotspot/jtreg/compiler/intrinsics/IntrinsicDisabledTest.java b/test/hotspot/jtreg/compiler/intrinsics/IntrinsicDisabledTest.java index aed0acab0ab..14edaf4e495 100644 --- a/test/hotspot/jtreg/compiler/intrinsics/IntrinsicDisabledTest.java +++ b/test/hotspot/jtreg/compiler/intrinsics/IntrinsicDisabledTest.java @@ -24,6 +24,8 @@ /* * @test * @bug 8138651 + * + * @requires !vm.graal.enabled * @modules java.base/jdk.internal.misc * @library /test/lib / * diff --git a/test/hotspot/jtreg/compiler/intrinsics/klass/CastNullCheckDroppingsTest.java b/test/hotspot/jtreg/compiler/intrinsics/klass/CastNullCheckDroppingsTest.java index 3285b904bf7..c31a87a46a2 100644 --- a/test/hotspot/jtreg/compiler/intrinsics/klass/CastNullCheckDroppingsTest.java +++ b/test/hotspot/jtreg/compiler/intrinsics/klass/CastNullCheckDroppingsTest.java @@ -25,7 +25,7 @@ * @test NullCheckDroppingsTest * @bug 8054492 * @summary Casting can result in redundant null checks in generated code - * @requires vm.flavor == "server" & !vm.emulatedClient + * @requires vm.flavor == "server" & !vm.emulatedClient & !vm.graal.enabled * @library /test/lib * @modules java.base/jdk.internal.misc * java.management diff --git a/test/hotspot/jtreg/compiler/loopopts/UseCountedLoopSafepointsTest.java b/test/hotspot/jtreg/compiler/loopopts/UseCountedLoopSafepointsTest.java index 111475fcbfd..f23673ad651 100644 --- a/test/hotspot/jtreg/compiler/loopopts/UseCountedLoopSafepointsTest.java +++ b/test/hotspot/jtreg/compiler/loopopts/UseCountedLoopSafepointsTest.java @@ -28,7 +28,7 @@ * @summary Test that C2 flag UseCountedLoopSafepoints ensures a safepoint is kept in a CountedLoop * @library /test/lib / * @requires vm.compMode != "Xint" & vm.flavor == "server" & (vm.opt.TieredStopAtLevel == null | vm.opt.TieredStopAtLevel == 4) & vm.debug == true - * @requires !vm.emulatedClient + * @requires !vm.emulatedClient & !vm.graal.enabled * @modules java.base/jdk.internal.misc * @build sun.hotspot.WhiteBox * @run driver ClassFileInstaller sun.hotspot.WhiteBox diff --git a/test/jtreg-ext/requires/VMProps.java b/test/jtreg-ext/requires/VMProps.java index 3623db4c5e5..c507a8c74c3 100644 --- a/test/jtreg-ext/requires/VMProps.java +++ b/test/jtreg-ext/requires/VMProps.java @@ -73,6 +73,8 @@ public class VMProps implements Callable> { map.put("vm.aot", vmAOT()); // vm.cds is true if the VM is compiled with cds support. map.put("vm.cds", vmCDS()); + // vm.graal.enabled is true if Graal is used as JIT + map.put("vm.graal.enabled", isGraalEnabled()); vmGC(map); // vm.gc.X = true/false VMProps.dump(map); @@ -292,6 +294,41 @@ public class VMProps implements Callable> { } } + /** + * Check if Graal is used as JIT compiler. + * + * @return true if Graal is used as JIT compiler. + */ + protected String isGraalEnabled() { + // Graal is enabled if following conditions are true: + // - we are not in Interpreter mode + // - UseJVMCICompiler flag is true + // - jvmci.Compiler variable is equal to 'graal' + // - TieredCompilation is not used or TieredStopAtLevel is greater than 3 + + Boolean useCompiler = WB.getBooleanVMFlag("UseCompiler"); + if (useCompiler == null || !useCompiler) + return "false"; + + Boolean useJvmciComp = WB.getBooleanVMFlag("UseJVMCICompiler"); + if (useJvmciComp == null || !useJvmciComp) + return "false"; + + // This check might be redundant but let's keep it for now. + String jvmciCompiler = System.getProperty("jvmci.Compiler"); + if (jvmciCompiler == null || !jvmciCompiler.equals("graal")) { + return "false"; + } + + Boolean tieredCompilation = WB.getBooleanVMFlag("TieredCompilation"); + Long compLevel = WB.getIntxVMFlag("TieredStopAtLevel"); + // if TieredCompilation is enabled and compilation level is <= 3 then no Graal is used + if (tieredCompilation != null && tieredCompilation && compLevel != null && compLevel <= 3) + return "false"; + + return "true"; + } + /** * Dumps the map to the file if the file name is given as the property. * This functionality could be helpful to know context in the real From fd93a046840bd5ff51bdbc4586319440b0041f1c Mon Sep 17 00:00:00 2001 From: David Holmes Date: Mon, 2 Oct 2017 18:56:30 -0400 Subject: [PATCH 25/80] 8185062: Set AssumeMP to true and deprecate the flag Reviewed-by: shade, dcubed, kvn --- src/hotspot/share/runtime/arguments.cpp | 11 +---------- src/hotspot/share/runtime/globals.hpp | 4 ++-- src/hotspot/share/runtime/os.hpp | 2 +- .../runtime/CommandLine/VMDeprecatedOptions.java | 1 + 4 files changed, 5 insertions(+), 13 deletions(-) diff --git a/src/hotspot/share/runtime/arguments.cpp b/src/hotspot/share/runtime/arguments.cpp index 0213dbc3b1c..a7ca6ce09bd 100644 --- a/src/hotspot/share/runtime/arguments.cpp +++ b/src/hotspot/share/runtime/arguments.cpp @@ -377,6 +377,7 @@ static SpecialFlag const special_jvm_flags[] = { // --- Non-alias flags - sorted by obsolete_in then expired_in: { "MaxGCMinorPauseMillis", JDK_Version::jdk(8), JDK_Version::undefined(), JDK_Version::undefined() }, { "UseConcMarkSweepGC", JDK_Version::jdk(9), JDK_Version::undefined(), JDK_Version::undefined() }, + { "AssumeMP", JDK_Version::jdk(10),JDK_Version::undefined(), JDK_Version::undefined() }, { "MonitorInUseLists", JDK_Version::jdk(10),JDK_Version::undefined(), JDK_Version::undefined() }, { "MaxRAMFraction", JDK_Version::jdk(10), JDK_Version::undefined(), JDK_Version::undefined() }, { "MinRAMFraction", JDK_Version::jdk(10), JDK_Version::undefined(), JDK_Version::undefined() }, @@ -4476,16 +4477,6 @@ jint Arguments::apply_ergo() { set_shared_spaces_flags(); -#if defined(SPARC) - // BIS instructions require 'membar' instruction regardless of the number - // of CPUs because in virtualized/container environments which might use only 1 - // CPU, BIS instructions may produce incorrect results. - - if (FLAG_IS_DEFAULT(AssumeMP)) { - FLAG_SET_DEFAULT(AssumeMP, true); - } -#endif - // Check the GC selections again. if (!check_gc_consistency()) { return JNI_EINVAL; diff --git a/src/hotspot/share/runtime/globals.hpp b/src/hotspot/share/runtime/globals.hpp index d5cd34f9434..755a7da1abb 100644 --- a/src/hotspot/share/runtime/globals.hpp +++ b/src/hotspot/share/runtime/globals.hpp @@ -592,8 +592,8 @@ public: range(8, 256) \ constraint(ObjectAlignmentInBytesConstraintFunc,AtParse) \ \ - product(bool, AssumeMP, false, \ - "Instruct the VM to assume multiple processors are available") \ + product(bool, AssumeMP, true, \ + "(Deprecated) Instruct the VM to assume multiple processors are available")\ \ /* UseMembar is theoretically a temp flag used for memory barrier */ \ /* removal testing. It was supposed to be removed before FCS but has */ \ diff --git a/src/hotspot/share/runtime/os.hpp b/src/hotspot/share/runtime/os.hpp index d5fbca9192d..b29c0c3d03a 100644 --- a/src/hotspot/share/runtime/os.hpp +++ b/src/hotspot/share/runtime/os.hpp @@ -213,7 +213,7 @@ class os: AllStatic { // the bootstrap routine for the stub generator needs to check // the processor count directly and leave the bootstrap routine // in place until called after initialization has ocurred. - return (_processor_count != 1) || AssumeMP; + return AssumeMP || (_processor_count != 1); } static julong available_memory(); static julong physical_memory(); diff --git a/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java b/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java index 4e1a6bd9434..d53218760ac 100644 --- a/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java +++ b/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java @@ -46,6 +46,7 @@ public class VMDeprecatedOptions { {"MaxRAMFraction", "8"}, {"MinRAMFraction", "2"}, {"InitialRAMFraction", "64"}, + {"AssumeMP", "false"}, // deprecated alias flags (see also aliased_jvm_flags): {"DefaultMaxRAMFraction", "4"}, From a2d1045eefe8b76e349d94b237f37d55baea3f19 Mon Sep 17 00:00:00 2001 From: Ioi Lam Date: Mon, 2 Oct 2017 16:00:42 -0700 Subject: [PATCH 26/80] 8187979: Clean up info printing at CDS dump time Reviewed-by: jiangli, ccheung --- src/hotspot/share/memory/allocation.hpp | 1 - src/hotspot/share/memory/metaspaceShared.cpp | 6 +++--- .../runtime/SharedArchiveFile/SpaceUtilizationCheck.java | 2 +- .../jtreg/runtime/modules/PatchModule/PatchModuleCDS.java | 6 +++--- 4 files changed, 7 insertions(+), 8 deletions(-) diff --git a/src/hotspot/share/memory/allocation.hpp b/src/hotspot/share/memory/allocation.hpp index aedaf90155b..01e44c5d7f1 100644 --- a/src/hotspot/share/memory/allocation.hpp +++ b/src/hotspot/share/memory/allocation.hpp @@ -233,7 +233,6 @@ class MetaspaceObj { void print_address_on(outputStream* st) const; // nonvirtual address printing #define METASPACE_OBJ_TYPES_DO(f) \ - f(Unknown) \ f(Class) \ f(Symbol) \ f(TypeArrayU1) \ diff --git a/src/hotspot/share/memory/metaspaceShared.cpp b/src/hotspot/share/memory/metaspaceShared.cpp index eb80850b151..1b7df68e3bb 100644 --- a/src/hotspot/share/memory/metaspaceShared.cpp +++ b/src/hotspot/share/memory/metaspaceShared.cpp @@ -165,7 +165,7 @@ public: } void print(size_t total_bytes) const { - tty->print_cr("%s space: " SIZE_FORMAT_W(9) " [ %4.1f%% of total] out of " SIZE_FORMAT_W(9) " bytes [%5.1f%% used] at " INTPTR_FORMAT, + tty->print_cr("%-3s space: " SIZE_FORMAT_W(9) " [ %4.1f%% of total] out of " SIZE_FORMAT_W(9) " bytes [%5.1f%% used] at " INTPTR_FORMAT, _name, used(), perc(used(), total_bytes), reserved(), perc(used(), reserved()), p2i(_base)); } void print_out_of_space_msg(const char* failing_region, size_t needed_bytes) { @@ -1405,7 +1405,7 @@ void VM_PopulateDumpSharedSpace::print_region_stats() { print_heap_region_stats(_string_regions, "st", total_reserved); print_heap_region_stats(_open_archive_heap_regions, "oa", total_reserved); - tty->print_cr("total : " SIZE_FORMAT_W(9) " [100.0%% of total] out of " SIZE_FORMAT_W(9) " bytes [%5.1f%% used]", + tty->print_cr("total : " SIZE_FORMAT_W(9) " [100.0%% of total] out of " SIZE_FORMAT_W(9) " bytes [%5.1f%% used]", total_bytes, total_reserved, total_u_perc); } @@ -1416,7 +1416,7 @@ void VM_PopulateDumpSharedSpace::print_heap_region_stats(GrowableArrayat(i).start(); size_t size = heap_mem->at(i).byte_size(); char* top = start + size; - tty->print_cr("%s%d space: " SIZE_FORMAT_W(9) " [ %4.1f%% of total] out of " SIZE_FORMAT_W(9) " bytes [100%% used] at " INTPTR_FORMAT, + tty->print_cr("%s%d space: " SIZE_FORMAT_W(9) " [ %4.1f%% of total] out of " SIZE_FORMAT_W(9) " bytes [100.0%% used] at " INTPTR_FORMAT, name, i, size, size/double(total_size)*100.0, size, p2i(start)); } diff --git a/test/hotspot/jtreg/runtime/SharedArchiveFile/SpaceUtilizationCheck.java b/test/hotspot/jtreg/runtime/SharedArchiveFile/SpaceUtilizationCheck.java index f2e0f6964ca..f9cfe9f3ae4 100644 --- a/test/hotspot/jtreg/runtime/SharedArchiveFile/SpaceUtilizationCheck.java +++ b/test/hotspot/jtreg/runtime/SharedArchiveFile/SpaceUtilizationCheck.java @@ -64,7 +64,7 @@ public class SpaceUtilizationCheck { static void test(String... extra_options) throws Exception { OutputAnalyzer output = CDSTestUtils.createArchive(extra_options); CDSTestUtils.checkDump(output); - Pattern pattern = Pattern.compile("^(..) space: *([0-9]+).* out of *([0-9]+) bytes .* at 0x([0-9a0-f]+)"); + Pattern pattern = Pattern.compile("^(..) *space: *([0-9]+).* out of *([0-9]+) bytes .* at 0x([0-9a0-f]+)"); WhiteBox wb = WhiteBox.getWhiteBox(); long reserve_alignment = wb.metaspaceReserveAlignment(); System.out.println("Metaspace::reserve_alignment() = " + reserve_alignment); diff --git a/test/hotspot/jtreg/runtime/modules/PatchModule/PatchModuleCDS.java b/test/hotspot/jtreg/runtime/modules/PatchModule/PatchModuleCDS.java index 8321eb6ddb2..6b5d3c7e37c 100644 --- a/test/hotspot/jtreg/runtime/modules/PatchModule/PatchModuleCDS.java +++ b/test/hotspot/jtreg/runtime/modules/PatchModule/PatchModuleCDS.java @@ -50,7 +50,7 @@ public class PatchModuleCDS { "-Xlog:class+path=info", "-version"); new OutputAnalyzer(pb.start()) - .shouldContain("ro space:"); // Make sure archive got created. + .shouldContain("ro space:"); // Make sure archive got created. // Case 2: Test that directory in --patch-module is supported for CDS dumping // Create a class file in the module java.base. @@ -73,7 +73,7 @@ public class PatchModuleCDS { "-Xlog:class+path=info", "-version"); new OutputAnalyzer(pb.start()) - .shouldContain("ro space:"); // Make sure archive got created. + .shouldContain("ro space:"); // Make sure archive got created. // Case 3a: Test CDS dumping with jar file in --patch-module BasicJarBuilder.build("javanaming", "javax/naming/spi/NamingManager"); @@ -87,7 +87,7 @@ public class PatchModuleCDS { "-Xlog:class+path=info", "PatchModuleMain", "javax.naming.spi.NamingManager"); new OutputAnalyzer(pb.start()) - .shouldContain("ro space:"); // Make sure archive got created. + .shouldContain("ro space:"); // Make sure archive got created. // Case 3b: Test CDS run with jar file in --patch-module pb = ProcessTools.createJavaProcessBuilder( From 1590eaa3b818554916d1d6e2637b9ed87d8ff955 Mon Sep 17 00:00:00 2001 From: David Holmes Date: Mon, 2 Oct 2017 21:58:22 -0400 Subject: [PATCH 27/80] 8188246: Add test/hotspot/jtreg/gc/logging/TestPrintReferences.java to ProblemList.txt Reviewed-by: dcubed --- test/hotspot/jtreg/ProblemList.txt | 1 + 1 file changed, 1 insertion(+) diff --git a/test/hotspot/jtreg/ProblemList.txt b/test/hotspot/jtreg/ProblemList.txt index 1b118f407b2..fa0588e5094 100644 --- a/test/hotspot/jtreg/ProblemList.txt +++ b/test/hotspot/jtreg/ProblemList.txt @@ -64,6 +64,7 @@ gc/g1/logging/TestG1LoggingFailure.java 8169634 generic-all gc/g1/humongousObjects/TestHeapCounters.java 8178918 generic-all gc/stress/gclocker/TestGCLockerWithG1.java 8179226 generic-all gc/survivorAlignment/TestPromotionFromSurvivorToTenuredAfterMinorGC.java 8177765 generic-all +gc/logging/TestPrintReferences.java 8188245 generic-all ############################################################################# From aa72ba3a647593912d2288983e35062b35e213de Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Erik=20=C3=96sterlund?= Date: Tue, 26 Sep 2017 21:37:01 +0200 Subject: [PATCH 28/80] 8187977: Generalize Atomic::xchg to use templates Reviewed-by: kbarrett, coleenp --- src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp | 27 ++-- src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp | 20 +-- .../os_cpu/bsd_zero/atomic_bsd_zero.hpp | 38 ++--- .../linux_aarch64/atomic_linux_aarch64.hpp | 22 +-- .../os_cpu/linux_arm/atomic_linux_arm.hpp | 28 ++-- .../os_cpu/linux_ppc/atomic_linux_ppc.hpp | 25 ++-- .../os_cpu/linux_s390/atomic_linux_s390.hpp | 28 ++-- .../os_cpu/linux_sparc/atomic_linux_sparc.hpp | 21 +-- .../os_cpu/linux_x86/atomic_linux_x86.hpp | 20 +-- .../os_cpu/linux_zero/atomic_linux_zero.hpp | 38 ++--- .../solaris_sparc/atomic_solaris_sparc.hpp | 40 ++--- .../os_cpu/solaris_sparc/solaris_sparc.il | 41 ----- .../os_cpu/solaris_x86/atomic_solaris_x86.hpp | 32 ++-- .../os_cpu/windows_x86/atomic_windows_x86.hpp | 34 ++--- src/hotspot/share/compiler/compileBroker.hpp | 2 +- src/hotspot/share/runtime/atomic.hpp | 140 +++++++++++++++++- 16 files changed, 320 insertions(+), 236 deletions(-) diff --git a/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp b/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp index 455a301456f..5ef5ce7f1bf 100644 --- a/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp +++ b/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp @@ -148,13 +148,15 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return result; } - -inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { - +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); // Note that xchg_ptr doesn't necessarily do an acquire // (see synchronizer.cpp). - unsigned int old_value; + T old_value; const uint64_t zero = 0; __asm__ __volatile__ ( @@ -182,15 +184,18 @@ inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { "memory" ); - return (jint) old_value; + return old_value; } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); // Note that xchg_ptr doesn't necessarily do an acquire // (see synchronizer.cpp). - long old_value; + T old_value; const uint64_t zero = 0; __asm__ __volatile__ ( @@ -218,11 +223,7 @@ inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* des "memory" ); - return (intptr_t) old_value; -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); + return old_value; } inline void cmpxchg_pre_membar(cmpxchg_memory_order order) { diff --git a/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp b/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp index fc825ce9a1c..4720e67e405 100644 --- a/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp +++ b/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp @@ -61,7 +61,11 @@ inline D Atomic::PlatformAdd<4>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); __asm__ volatile ( "xchgl (%2),%0" : "=r" (exchange_value) : "0" (exchange_value), "r" (dest) @@ -69,10 +73,6 @@ inline jint Atomic::xchg (jint exchange_value, volatile jint* des return exchange_value; } -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); -} - template<> template inline T Atomic::PlatformCmpxchg<1>::operator()(T exchange_value, @@ -118,7 +118,11 @@ inline D Atomic::PlatformAdd<8>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); __asm__ __volatile__ ("xchgq (%2),%0" : "=r" (exchange_value) : "0" (exchange_value), "r" (dest) @@ -144,10 +148,6 @@ inline jlong Atomic::load(const volatile jlong* src) { return *src; } #else // !AMD64 -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - return (intptr_t)xchg((jint)exchange_value, (volatile jint*)dest); -} - extern "C" { // defined in bsd_x86.s jlong _Atomic_cmpxchg_long(jlong, volatile jlong*, jlong, bool); diff --git a/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp b/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp index 235427ea40f..7b76258649d 100644 --- a/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp +++ b/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp @@ -87,7 +87,7 @@ static inline int m68k_add_and_fetch(int add_value, volatile int *ptr) { /* Atomically write VALUE into `*PTR' and returns the previous contents of `*PTR'. */ -static inline int m68k_lock_test_and_set(volatile int *ptr, int newval) { +static inline int m68k_lock_test_and_set(int newval, volatile int *ptr) { for (;;) { // Loop until success. int prev = *ptr; @@ -148,7 +148,7 @@ static inline int arm_add_and_fetch(int add_value, volatile int *ptr) { /* Atomically write VALUE into `*PTR' and returns the previous contents of `*PTR'. */ -static inline int arm_lock_test_and_set(volatile int *ptr, int newval) { +static inline int arm_lock_test_and_set(int newval, volatile int *ptr) { for (;;) { // Loop until a __kernel_cmpxchg succeeds. int prev = *ptr; @@ -207,18 +207,22 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return __sync_add_and_fetch(dest, add_value); } -inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); #ifdef ARM - return arm_lock_test_and_set(dest, exchange_value); + return xchg_using_helper(arm_lock_test_and_set, exchange_value, dest); #else #ifdef M68K - return m68k_lock_test_and_set(dest, exchange_value); + return xchg_using_helper(m68k_lock_test_and_set, exchange_value, dest); #else // __sync_lock_test_and_set is a bizarrely named atomic exchange // operation. Note that some platforms only support this with the // limitation that the only valid value to store is the immediate // constant 1. There is a test for this in JNI_CreateJavaVM(). - jint result = __sync_lock_test_and_set (dest, exchange_value); + T result = __sync_lock_test_and_set (dest, exchange_value); // All atomic operations are expected to be full memory barriers // (see atomic.hpp). However, __sync_lock_test_and_set is not // a full memory barrier, but an acquire barrier. Hence, this added @@ -229,24 +233,14 @@ inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { #endif // ARM } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, - volatile intptr_t* dest) { -#ifdef ARM - return arm_lock_test_and_set(dest, exchange_value); -#else -#ifdef M68K - return m68k_lock_test_and_set(dest, exchange_value); -#else - intptr_t result = __sync_lock_test_and_set (dest, exchange_value); +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + T result = __sync_lock_test_and_set (dest, exchange_value); __sync_synchronize(); return result; -#endif // M68K -#endif // ARM -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void *) xchg_ptr((intptr_t) exchange_value, - (volatile intptr_t*) dest); } // No direct support for cmpxchg of bytes; emulate using int. diff --git a/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp b/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp index 72a2f3b6555..88ba2654cc4 100644 --- a/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp +++ b/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp @@ -57,19 +57,16 @@ struct Atomic::PlatformAdd } }; -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) -{ - jint res = __sync_lock_test_and_set (dest, exchange_value); +template +template +inline T Atomic::PlatformXchg::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(byte_size == sizeof(T)); + T res = __sync_lock_test_and_set(dest, exchange_value); FULL_MEM_BARRIER; return res; } -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) -{ - return (void *) xchg_ptr((intptr_t) exchange_value, - (volatile intptr_t*) dest); -} - template template inline T Atomic::PlatformCmpxchg::operator()(T exchange_value, @@ -90,13 +87,6 @@ inline T Atomic::PlatformCmpxchg::operator()(T exchange_value, inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) -{ - intptr_t res = __sync_lock_test_and_set (dest, exchange_value); - FULL_MEM_BARRIER; - return res; -} - inline jlong Atomic::load(const volatile jlong* src) { return *src; } #endif // OS_CPU_LINUX_AARCH64_VM_ATOMIC_LINUX_AARCH64_HPP diff --git a/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp b/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp index 76c7b69076a..930d79289c0 100644 --- a/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp +++ b/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp @@ -141,11 +141,15 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co : "memory"); return val; } -#endif // AARCH64 +#endif -inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); #ifdef AARCH64 - jint old_val; + T old_val; int tmp; __asm__ volatile( "1:\n\t" @@ -157,13 +161,17 @@ inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { : "memory"); return old_val; #else - return (*os::atomic_xchg_func)(exchange_value, dest); + return xchg_using_helper(os::atomic_xchg_func, exchange_value, dest); #endif } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { #ifdef AARCH64 - intptr_t old_val; +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + T old_val; int tmp; __asm__ volatile( "1:\n\t" @@ -174,14 +182,8 @@ inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* des : [new_val] "r" (exchange_value), [dest] "r" (dest) : "memory"); return old_val; -#else - return (intptr_t)xchg((jint)exchange_value, (volatile jint*)dest); -#endif -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); } +#endif // AARCH64 // The memory_order parameter is ignored - we always provide the strongest/most-conservative ordering diff --git a/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp b/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp index 82bf9c2d3c4..0056e306644 100644 --- a/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp +++ b/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp @@ -146,12 +146,14 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return result; } -inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { - +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { // Note that xchg_ptr doesn't necessarily do an acquire // (see synchronizer.cpp). - unsigned int old_value; + T old_value; const uint64_t zero = 0; __asm__ __volatile__ ( @@ -179,15 +181,18 @@ inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { "memory" ); - return (jint) old_value; + return old_value; } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); // Note that xchg_ptr doesn't necessarily do an acquire // (see synchronizer.cpp). - long old_value; + T old_value; const uint64_t zero = 0; __asm__ __volatile__ ( @@ -215,11 +220,7 @@ inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* des "memory" ); - return (intptr_t) old_value; -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); + return old_value; } inline void cmpxchg_pre_membar(cmpxchg_memory_order order) { diff --git a/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp b/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp index ef9391db80c..1f5db81b853 100644 --- a/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp +++ b/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp @@ -208,8 +208,12 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I inc, D volatile* dest) const { // // The return value is the (unchanged) value from memory as it was when the // replacement succeeded. -inline jint Atomic::xchg (jint xchg_val, volatile jint* dest) { - unsigned int old; +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); + T old; __asm__ __volatile__ ( " LLGF %[old],%[mem] \n\t" // get old value @@ -219,16 +223,20 @@ inline jint Atomic::xchg (jint xchg_val, volatile jint* dest) { : [old] "=&d" (old) // write-only, prev value irrelevant , [mem] "+Q" (*dest) // read/write, memory to be updated atomically //---< inputs >--- - : [upd] "d" (xchg_val) // read-only, value to be written to memory + : [upd] "d" (exchange_value) // read-only, value to be written to memory //---< clobbered >--- : "cc", "memory" ); - return (jint)old; + return old; } -inline intptr_t Atomic::xchg_ptr(intptr_t xchg_val, volatile intptr_t* dest) { - unsigned long old; +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + T old; __asm__ __volatile__ ( " LG %[old],%[mem] \n\t" // get old value @@ -238,16 +246,12 @@ inline intptr_t Atomic::xchg_ptr(intptr_t xchg_val, volatile intptr_t* dest) { : [old] "=&d" (old) // write-only, init from memory , [mem] "+Q" (*dest) // read/write, memory to be updated atomically //---< inputs >--- - : [upd] "d" (xchg_val) // read-only, value to be written to memory + : [upd] "d" (exchange_value) // read-only, value to be written to memory //---< clobbered >--- : "cc", "memory" ); - return (intptr_t)old; -} - -inline void *Atomic::xchg_ptr(void *exchange_value, volatile void *dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); + return old; } //---------------- diff --git a/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp b/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp index 1b40854558a..c671af04417 100644 --- a/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp +++ b/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp @@ -95,9 +95,12 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return rv; } - -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { - intptr_t rv = exchange_value; +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); + T rv = exchange_value; __asm__ volatile( " swap [%2],%1\n\t" : "=r" (rv) @@ -106,8 +109,12 @@ inline jint Atomic::xchg (jint exchange_value, volatile jint* des return rv; } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - intptr_t rv = exchange_value; +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + T rv = exchange_value; __asm__ volatile( "1:\n\t" " mov %1, %%o3\n\t" @@ -123,10 +130,6 @@ inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* des return rv; } -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); -} - // No direct support for cmpxchg of bytes; emulate using int. template<> struct Atomic::PlatformCmpxchg<1> : Atomic::CmpxchgByteUsingInt {}; diff --git a/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp b/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp index 51ed87f3dd8..cbe5c3ede8a 100644 --- a/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp +++ b/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp @@ -61,7 +61,11 @@ inline D Atomic::PlatformAdd<4>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); __asm__ volatile ( "xchgl (%2),%0" : "=r" (exchange_value) : "0" (exchange_value), "r" (dest) @@ -69,10 +73,6 @@ inline jint Atomic::xchg (jint exchange_value, volatile jint* des return exchange_value; } -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); -} - template<> template inline T Atomic::PlatformCmpxchg<1>::operator()(T exchange_value, @@ -118,7 +118,11 @@ inline D Atomic::PlatformAdd<8>::fetch_and_add(I add_value, D volatile* dest) co return old_value; } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); __asm__ __volatile__ ("xchgq (%2),%0" : "=r" (exchange_value) : "0" (exchange_value), "r" (dest) @@ -144,10 +148,6 @@ inline jlong Atomic::load(const volatile jlong* src) { return *src; } #else // !AMD64 -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - return (intptr_t)xchg((jint)exchange_value, (volatile jint*)dest); -} - extern "C" { // defined in linux_x86.s jlong _Atomic_cmpxchg_long(jlong, volatile jlong*, jlong); diff --git a/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp b/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp index 97c6ed1b2b7..68d9575acae 100644 --- a/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp +++ b/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp @@ -87,7 +87,7 @@ static inline int m68k_add_and_fetch(int add_value, volatile int *ptr) { /* Atomically write VALUE into `*PTR' and returns the previous contents of `*PTR'. */ -static inline int m68k_lock_test_and_set(volatile int *ptr, int newval) { +static inline int m68k_lock_test_and_set(int newval, volatile int *ptr) { for (;;) { // Loop until success. int prev = *ptr; @@ -148,7 +148,7 @@ static inline int arm_add_and_fetch(int add_value, volatile int *ptr) { /* Atomically write VALUE into `*PTR' and returns the previous contents of `*PTR'. */ -static inline int arm_lock_test_and_set(volatile int *ptr, int newval) { +static inline int arm_lock_test_and_set(int newval, volatile int *ptr) { for (;;) { // Loop until a __kernel_cmpxchg succeeds. int prev = *ptr; @@ -201,18 +201,22 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return __sync_add_and_fetch(dest, add_value); } -inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); #ifdef ARM - return arm_lock_test_and_set(dest, exchange_value); + return xchg_using_helper(arm_lock_test_and_set, exchange_value, dest); #else #ifdef M68K - return m68k_lock_test_and_set(dest, exchange_value); + return xchg_using_helper(m68k_lock_test_and_set, exchange_value, dest); #else // __sync_lock_test_and_set is a bizarrely named atomic exchange // operation. Note that some platforms only support this with the // limitation that the only valid value to store is the immediate // constant 1. There is a test for this in JNI_CreateJavaVM(). - jint result = __sync_lock_test_and_set (dest, exchange_value); + T result = __sync_lock_test_and_set (dest, exchange_value); // All atomic operations are expected to be full memory barriers // (see atomic.hpp). However, __sync_lock_test_and_set is not // a full memory barrier, but an acquire barrier. Hence, this added @@ -223,24 +227,14 @@ inline jint Atomic::xchg(jint exchange_value, volatile jint* dest) { #endif // ARM } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, - volatile intptr_t* dest) { -#ifdef ARM - return arm_lock_test_and_set(dest, exchange_value); -#else -#ifdef M68K - return m68k_lock_test_and_set(dest, exchange_value); -#else - intptr_t result = __sync_lock_test_and_set (dest, exchange_value); +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + T result = __sync_lock_test_and_set (dest, exchange_value); __sync_synchronize(); return result; -#endif // M68K -#endif // ARM -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void *) xchg_ptr((intptr_t) exchange_value, - (volatile intptr_t*) dest); } // No direct support for cmpxchg of bytes; emulate using int. diff --git a/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp b/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp index 5a1a470ae58..b76aed3da85 100644 --- a/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp +++ b/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp @@ -43,16 +43,6 @@ inline void Atomic::store(jlong store_value, jlong* dest) { *dest = store_value; inline void Atomic::store(jlong store_value, volatile jlong* dest) { *dest = store_value; } inline jlong Atomic::load(const volatile jlong* src) { return *src; } - -// This is the interface to the atomic instructions in solaris_sparc.il. -// It's very messy because we need to support v8 and these instructions -// are illegal there. When sparc v8 is dropped, we can drop out lots of -// this code. Also compiler2 does not support v8 so the conditional code -// omits the instruction set check. - -extern "C" jint _Atomic_swap32(jint exchange_value, volatile jint* dest); -extern "C" intptr_t _Atomic_swap64(intptr_t exchange_value, volatile intptr_t* dest); - // Implement ADD using a CAS loop. template struct Atomic::PlatformAdd VALUE_OBJ_CLASS_SPEC { @@ -69,16 +59,30 @@ struct Atomic::PlatformAdd VALUE_OBJ_CLASS_SPEC { } }; -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { - return _Atomic_swap32(exchange_value, dest); +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); + __asm__ volatile ( "swap [%2],%0" + : "=r" (exchange_value) + : "0" (exchange_value), "r" (dest) + : "memory"); + return exchange_value; } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - return _Atomic_swap64(exchange_value, dest); -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg_ptr((intptr_t)exchange_value, (volatile intptr_t*)dest); +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + T old_value = *dest; + while (true) { + T result = cmpxchg(exchange_value, dest, old_value); + if (result == old_value) break; + old_value = result; + } + return old_value; } // No direct support for cmpxchg of bytes; emulate using int. diff --git a/src/hotspot/os_cpu/solaris_sparc/solaris_sparc.il b/src/hotspot/os_cpu/solaris_sparc/solaris_sparc.il index 39ac68a7ec8..1f25542e5d5 100644 --- a/src/hotspot/os_cpu/solaris_sparc/solaris_sparc.il +++ b/src/hotspot/os_cpu/solaris_sparc/solaris_sparc.il @@ -32,47 +32,6 @@ .end - // Support for jint Atomic::xchg(jint exchange_value, volatile jint* dest). - // - // Arguments: - // exchange_value: O0 - // dest: O1 - // - // Results: - // O0: the value previously stored in dest - - .inline _Atomic_swap32, 2 - .volatile - swap [%o1],%o0 - .nonvolatile - .end - - - // Support for intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t * dest). - // - // 64-bit - // - // Arguments: - // exchange_value: O0 - // dest: O1 - // - // Results: - // O0: the value previously stored in dest - - .inline _Atomic_swap64, 2 - .volatile - 1: - mov %o0, %o3 - ldx [%o1], %o2 - casx [%o1], %o2, %o3 - cmp %o2, %o3 - bne %xcc, 1b - nop - mov %o2, %o0 - .nonvolatile - .end - - // Support for jlong Atomic::load and Atomic::store on v9. // // void _Atomic_move_long_v9(volatile jlong* src, volatile jlong* dst) diff --git a/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp b/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp index 310592eadb9..fdf6f47cdf0 100644 --- a/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp +++ b/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp @@ -84,8 +84,26 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co reinterpret_cast(dest))); } -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { - return _Atomic_xchg(exchange_value, dest); +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); + return PrimitiveConversions::cast( + _Atomic_xchg(PrimitiveConversions::cast(exchange_value), + reinterpret_cast(dest))); +} + +extern "C" jlong _Atomic_xchg_long(jlong exchange_value, volatile jlong* dest); + +template<> +template +inline T Atomic::PlatformXchg<8>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + return PrimitiveConversions::cast( + _Atomic_xchg_long(PrimitiveConversions::cast(exchange_value), + reinterpret_cast(dest))); } // Not using cmpxchg_using_helper here, because some configurations of @@ -135,16 +153,6 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -extern "C" jlong _Atomic_xchg_long(jlong exchange_value, volatile jlong* dest); - -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - return (intptr_t)_Atomic_xchg_long((jlong)exchange_value, (volatile jlong*)dest); -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)_Atomic_xchg_long((jlong)exchange_value, (volatile jlong*)dest); -} - inline jlong Atomic::load(const volatile jlong* src) { return *src; } #endif // OS_CPU_SOLARIS_X86_VM_ATOMIC_SOLARIS_X86_HPP diff --git a/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp b/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp index e1ba4f45235..15635f2d6ed 100644 --- a/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp +++ b/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp @@ -81,17 +81,19 @@ inline D Atomic::PlatformAdd<8>::add_and_fetch(I add_value, D volatile* dest) co return add_using_helper(os::atomic_add_ptr_func, add_value, dest); } -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { - return (jint)(*os::atomic_xchg_func)(exchange_value, dest); -} +#define DEFINE_STUB_XCHG(ByteSize, StubType, StubName) \ + template<> \ + template \ + inline T Atomic::PlatformXchg::operator()(T exchange_value, \ + T volatile* dest) const { \ + STATIC_ASSERT(ByteSize == sizeof(T)); \ + return xchg_using_helper(StubName, exchange_value, dest); \ + } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - return (intptr_t)(os::atomic_xchg_ptr_func)(exchange_value, dest); -} +DEFINE_STUB_XCHG(4, jint, os::atomic_xchg_func) +DEFINE_STUB_XCHG(8, jlong, os::atomic_xchg_ptr_func) -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void *)(os::atomic_xchg_ptr_func)((intptr_t)exchange_value, (volatile intptr_t*)dest); -} +#undef DEFINE_STUB_XCHG #define DEFINE_STUB_CMPXCHG(ByteSize, StubType, StubName) \ template<> \ @@ -128,7 +130,11 @@ inline D Atomic::PlatformAdd<4>::add_and_fetch(I add_value, D volatile* dest) co } } -inline jint Atomic::xchg (jint exchange_value, volatile jint* dest) { +template<> +template +inline T Atomic::PlatformXchg<4>::operator()(T exchange_value, + T volatile* dest) const { + STATIC_ASSERT(4 == sizeof(T)); // alternative for InterlockedExchange __asm { mov eax, exchange_value; @@ -137,14 +143,6 @@ inline jint Atomic::xchg (jint exchange_value, volatile jint* des } } -inline intptr_t Atomic::xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { - return (intptr_t)xchg((jint)exchange_value, (volatile jint*)dest); -} - -inline void* Atomic::xchg_ptr(void* exchange_value, volatile void* dest) { - return (void*)xchg((jint)exchange_value, (volatile jint*)dest); -} - template<> template inline T Atomic::PlatformCmpxchg<1>::operator()(T exchange_value, diff --git a/src/hotspot/share/compiler/compileBroker.hpp b/src/hotspot/share/compiler/compileBroker.hpp index 571ee7020e0..ced793a0c4f 100644 --- a/src/hotspot/share/compiler/compileBroker.hpp +++ b/src/hotspot/share/compiler/compileBroker.hpp @@ -332,7 +332,7 @@ public: static void disable_compilation_forever() { UseCompiler = false; AlwaysCompileLoopMethods = false; - Atomic::xchg(shutdown_compilation, &_should_compile_new_jobs); + Atomic::xchg(jint(shutdown_compilation), &_should_compile_new_jobs); } static bool is_compilation_disabled_forever() { diff --git a/src/hotspot/share/runtime/atomic.hpp b/src/hotspot/share/runtime/atomic.hpp index a34d7f389f8..e6f94f6f169 100644 --- a/src/hotspot/share/runtime/atomic.hpp +++ b/src/hotspot/share/runtime/atomic.hpp @@ -116,10 +116,19 @@ class Atomic : AllStatic { // Performs atomic exchange of *dest with exchange_value. Returns old // prior value of *dest. xchg*() provide: // exchange-value-with-dest - inline static jint xchg (jint exchange_value, volatile jint* dest); - inline static unsigned int xchg (unsigned int exchange_value, volatile unsigned int* dest); - inline static intptr_t xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest); - inline static void* xchg_ptr(void* exchange_value, volatile void* dest); + // The type T must be either a pointer type convertible to or equal + // to D, an integral/enum type equal to D, or a type equal to D that + // is primitive convertible using PrimitiveConversions. + template + inline static D xchg(T exchange_value, volatile D* dest); + + inline static intptr_t xchg_ptr(intptr_t exchange_value, volatile intptr_t* dest) { + return xchg(exchange_value, dest); + } + + inline static void* xchg_ptr(void* exchange_value, volatile void* dest) { + return xchg(exchange_value, reinterpret_cast(dest)); + } // Performs atomic compare of *dest and compare_value, and exchanges // *dest with exchange_value if the comparison succeeded. Returns prior @@ -280,6 +289,45 @@ private: public: // Temporary, can't be private: C++03 11.4/2. Fixed by C++11. struct CmpxchgByteUsingInt; private: + + // Dispatch handler for xchg. Provides type-based validity + // checking and limited conversions around calls to the + // platform-specific implementation layer provided by + // PlatformXchg. + template + struct XchgImpl; + + // Platform-specific implementation of xchg. Support for sizes + // of 4, and sizeof(intptr_t) are required. The class is a function + // object that must be default constructable, with these requirements: + // + // - dest is of type T*. + // - exchange_value is of type T. + // - platform_xchg is an object of type PlatformXchg. + // + // Then + // platform_xchg(exchange_value, dest) + // must be a valid expression, returning a result convertible to T. + // + // A default definition is provided, which declares a function template + // T operator()(T, T volatile*, T, cmpxchg_memory_order) const + // + // For each required size, a platform must either provide an + // appropriate definition of that function, or must entirely + // specialize the class template for that size. + template struct PlatformXchg; + + // Support for platforms that implement some variants of xchg + // using a (typically out of line) non-template helper function. + // The generic arguments passed to PlatformXchg need to be + // translated to the appropriate type for the helper function, the + // helper invoked on the translated arguments, and the result + // translated back. Type is the parameter / return type of the + // helper function. + template + static T xchg_using_helper(Fn fn, + T exchange_value, + T volatile* dest); }; template @@ -353,6 +401,18 @@ struct Atomic::CmpxchgByteUsingInt VALUE_OBJ_CLASS_SPEC { cmpxchg_memory_order order) const; }; +// Define the class before including platform file, which may specialize +// the operator definition. No generic definition of specializations +// of the operator template are provided, nor are there any generic +// specializations of the class. The platform file is responsible for +// providing those. +template +struct Atomic::PlatformXchg VALUE_OBJ_CLASS_SPEC { + template + T operator()(T exchange_value, + T volatile* dest) const; +}; + // platform specific in-line definitions - must come before shared definitions #include OS_CPU_HEADER(atomic) @@ -594,9 +654,75 @@ inline T Atomic::CmpxchgByteUsingInt::operator()(T exchange_value, return PrimitiveConversions::cast(cur_as_bytes[offset]); } -inline unsigned Atomic::xchg(unsigned int exchange_value, volatile unsigned int* dest) { - assert(sizeof(unsigned int) == sizeof(jint), "more work to do"); - return (unsigned int)Atomic::xchg((jint)exchange_value, (volatile jint*)dest); +// Handle xchg for integral and enum types. +// +// All the involved types must be identical. +template +struct Atomic::XchgImpl< + T, T, + typename EnableIf::value || IsRegisteredEnum::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + T operator()(T exchange_value, T volatile* dest) const { + // Forward to the platform handler for the size of T. + return PlatformXchg()(exchange_value, dest); + } +}; + +// Handle xchg for pointer types. +// +// The exchange_value must be implicitly convertible to the +// destination's type; it must be type-correct to store the +// exchange_value in the destination. +template +struct Atomic::XchgImpl< + T*, D*, + typename EnableIf::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + D* operator()(T* exchange_value, D* volatile* dest) const { + // Allow derived to base conversion, and adding cv-qualifiers. + D* new_value = exchange_value; + return PlatformXchg()(new_value, dest); + } +}; + +// Handle xchg for types that have a translator. +// +// All the involved types must be identical. +// +// This translates the original call into a call on the decayed +// arguments, and returns the recovered result of that translated +// call. +template +struct Atomic::XchgImpl< + T, T, + typename EnableIf::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + T operator()(T exchange_value, T volatile* dest) const { + typedef PrimitiveConversions::Translate Translator; + typedef typename Translator::Decayed Decayed; + STATIC_ASSERT(sizeof(T) == sizeof(Decayed)); + return Translator::recover( + xchg(Translator::decay(exchange_value), + reinterpret_cast(dest))); + } +}; + +template +inline T Atomic::xchg_using_helper(Fn fn, + T exchange_value, + T volatile* dest) { + STATIC_ASSERT(sizeof(Type) == sizeof(T)); + return PrimitiveConversions::cast( + fn(PrimitiveConversions::cast(exchange_value), + reinterpret_cast(dest))); +} + +template +inline D Atomic::xchg(T exchange_value, volatile D* dest) { + return XchgImpl()(exchange_value, dest); } #endif // SHARE_VM_RUNTIME_ATOMIC_HPP From 80f8ee98e49baaa91af9148f322fb7c7b163987e Mon Sep 17 00:00:00 2001 From: Erik Helin Date: Fri, 15 Sep 2017 10:43:03 +0200 Subject: [PATCH 29/80] 8187570: Comparison between pointer and char in MethodMatcher::canonicalize Reviewed-by: ysuenaga, eosterlund --- src/hotspot/share/compiler/methodMatcher.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/hotspot/share/compiler/methodMatcher.cpp b/src/hotspot/share/compiler/methodMatcher.cpp index 8113d859cff..cc84fb53e8b 100644 --- a/src/hotspot/share/compiler/methodMatcher.cpp +++ b/src/hotspot/share/compiler/methodMatcher.cpp @@ -96,7 +96,7 @@ bool MethodMatcher::canonicalize(char * line, const char *& error_msg) { bool have_colon = (colon != NULL); if (have_colon) { // Don't allow multiple '::' - if (colon + 2 != '\0') { + if (colon[2] != '\0') { if (strstr(colon+2, "::")) { error_msg = "Method pattern only allows one '::' allowed"; return false; From 73a801bc4368a9e7b219d7a66e93bc0f17b278b5 Mon Sep 17 00:00:00 2001 From: Coleen Phillimore Date: Tue, 3 Oct 2017 16:42:04 -0400 Subject: [PATCH 30/80] 8186777: Make Klass::_java_mirror an OopHandle Add indirection for fetching mirror so that GC doesn't have to follow CLD::_klasses Co-authored-by: Rickard Backman Reviewed-by: hseigel, thartmann, eosterlund, stefank --- .../cpu/aarch64/macroAssembler_aarch64.cpp | 1 + .../cpu/aarch64/templateTable_aarch64.cpp | 1 + src/hotspot/cpu/arm/macroAssembler_arm.cpp | 1 + src/hotspot/cpu/arm/templateTable_arm.cpp | 1 + src/hotspot/cpu/ppc/macroAssembler_ppc.cpp | 1 + src/hotspot/cpu/ppc/templateTable_ppc_64.cpp | 1 + src/hotspot/cpu/s390/macroAssembler_s390.cpp | 1 + src/hotspot/cpu/s390/templateTable_s390.cpp | 1 + .../cpu/sparc/macroAssembler_sparc.cpp | 1 + src/hotspot/cpu/sparc/templateTable_sparc.cpp | 1 + src/hotspot/cpu/x86/macroAssembler_x86.cpp | 1 + src/hotspot/cpu/x86/templateTable_x86.cpp | 1 + src/hotspot/share/c1/c1_LIRGenerator.cpp | 4 +- .../share/classfile/classLoaderData.cpp | 38 ++++--- .../share/classfile/classLoaderData.hpp | 28 ++++- src/hotspot/share/classfile/javaClasses.cpp | 2 +- src/hotspot/share/gc/cms/cmsOopClosures.hpp | 7 +- .../share/gc/cms/cmsOopClosures.inline.hpp | 4 +- .../gc/cms/concurrentMarkSweepGeneration.cpp | 105 +++++++++--------- .../gc/cms/concurrentMarkSweepGeneration.hpp | 2 +- src/hotspot/share/gc/cms/parNewGeneration.cpp | 9 +- src/hotspot/share/gc/cms/parOopClosures.hpp | 4 +- .../share/gc/cms/parOopClosures.inline.hpp | 6 +- src/hotspot/share/gc/g1/g1CollectedHeap.hpp | 1 - src/hotspot/share/gc/g1/g1HeapVerifier.cpp | 15 ++- src/hotspot/share/gc/g1/g1OopClosures.cpp | 22 ++-- src/hotspot/share/gc/g1/g1OopClosures.hpp | 18 +-- .../share/gc/g1/g1OopClosures.inline.hpp | 10 +- src/hotspot/share/gc/g1/g1SharedClosures.hpp | 21 ++-- src/hotspot/share/gc/parallel/pcTasks.cpp | 3 +- .../share/gc/parallel/psCompactionManager.hpp | 13 +-- .../parallel/psCompactionManager.inline.hpp | 9 +- .../share/gc/parallel/psParallelCompact.cpp | 8 +- .../share/gc/parallel/psScavenge.inline.hpp | 54 +++++---- src/hotspot/share/gc/parallel/psTasks.cpp | 4 +- .../share/gc/serial/defNewGeneration.cpp | 45 +++----- src/hotspot/share/gc/shared/cardTableRS.cpp | 25 +++-- src/hotspot/share/gc/shared/cardTableRS.hpp | 12 +- .../share/gc/shared/genOopClosures.hpp | 38 ++++--- .../share/gc/shared/genOopClosures.inline.hpp | 18 +-- src/hotspot/share/jvmci/jvmciCompilerToVM.cpp | 1 + src/hotspot/share/jvmci/vmStructs_jvmci.cpp | 5 +- src/hotspot/share/memory/iterator.cpp | 13 +-- src/hotspot/share/memory/iterator.hpp | 44 +------- src/hotspot/share/memory/iterator.inline.hpp | 6 +- src/hotspot/share/oops/instanceKlass.cpp | 3 + src/hotspot/share/oops/klass.cpp | 61 ++-------- src/hotspot/share/oops/klass.hpp | 40 ++----- src/hotspot/share/opto/library_call.cpp | 3 +- src/hotspot/share/opto/memnode.cpp | 49 +++++--- src/hotspot/share/opto/subnode.cpp | 8 +- src/hotspot/share/prims/jvmtiTagMap.cpp | 3 +- src/hotspot/share/prims/jvmtiThreadState.hpp | 8 +- src/hotspot/share/runtime/vmStructs.cpp | 2 +- .../classes/sun/jvm/hotspot/oops/Klass.java | 16 ++- .../HotSpotMemoryAccessProviderImpl.java | 33 +++--- .../jdk/vm/ci/hotspot/HotSpotVMConfig.java | 4 +- .../hotspot/GraalHotSpotVMConfig.java | 6 +- .../jdk/vm/ci/code/test/DataPatchTest.java | 10 +- .../vm/ci/code/test/TestHotSpotVMConfig.java | 4 +- .../test/MemoryAccessProviderData.java | 4 +- 61 files changed, 383 insertions(+), 477 deletions(-) diff --git a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp index 78637f21dc1..be04c5fdc2d 100644 --- a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp +++ b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp @@ -3291,6 +3291,7 @@ void MacroAssembler::load_mirror(Register dst, Register method) { ldr(dst, Address(dst, ConstMethod::constants_offset())); ldr(dst, Address(dst, ConstantPool::pool_holder_offset_in_bytes())); ldr(dst, Address(dst, mirror_offset)); + resolve_oop_handle(dst); } void MacroAssembler::cmp_klass(Register oop, Register trial_klass, Register tmp) { diff --git a/src/hotspot/cpu/aarch64/templateTable_aarch64.cpp b/src/hotspot/cpu/aarch64/templateTable_aarch64.cpp index ae182677be5..2ba42035e7b 100644 --- a/src/hotspot/cpu/aarch64/templateTable_aarch64.cpp +++ b/src/hotspot/cpu/aarch64/templateTable_aarch64.cpp @@ -2297,6 +2297,7 @@ void TemplateTable::load_field_cp_cache_entry(Register obj, ConstantPoolCacheEntry::f1_offset()))); const int mirror_offset = in_bytes(Klass::java_mirror_offset()); __ ldr(obj, Address(obj, mirror_offset)); + __ resolve_oop_handle(obj); } } diff --git a/src/hotspot/cpu/arm/macroAssembler_arm.cpp b/src/hotspot/cpu/arm/macroAssembler_arm.cpp index 53eb53f2c7f..ea4d7782983 100644 --- a/src/hotspot/cpu/arm/macroAssembler_arm.cpp +++ b/src/hotspot/cpu/arm/macroAssembler_arm.cpp @@ -2899,6 +2899,7 @@ void MacroAssembler::load_mirror(Register mirror, Register method, Register tmp) ldr(tmp, Address(tmp, ConstMethod::constants_offset())); ldr(tmp, Address(tmp, ConstantPool::pool_holder_offset_in_bytes())); ldr(mirror, Address(tmp, mirror_offset)); + resolve_oop_handle(mirror); } diff --git a/src/hotspot/cpu/arm/templateTable_arm.cpp b/src/hotspot/cpu/arm/templateTable_arm.cpp index 7fd60ce8d2d..9eb74775ab1 100644 --- a/src/hotspot/cpu/arm/templateTable_arm.cpp +++ b/src/hotspot/cpu/arm/templateTable_arm.cpp @@ -2963,6 +2963,7 @@ void TemplateTable::load_field_cp_cache_entry(Register Rcache, cp_base_offset + ConstantPoolCacheEntry::f1_offset())); const int mirror_offset = in_bytes(Klass::java_mirror_offset()); __ ldr(Robj, Address(Robj, mirror_offset)); + __ resolve_oop_handle(Robj); } } diff --git a/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp b/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp index 31dcfa7beba..bce57c7e137 100644 --- a/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp +++ b/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp @@ -3382,6 +3382,7 @@ void MacroAssembler::load_mirror_from_const_method(Register mirror, Register con ld(mirror, in_bytes(ConstMethod::constants_offset()), const_method); ld(mirror, ConstantPool::pool_holder_offset_in_bytes(), mirror); ld(mirror, in_bytes(Klass::java_mirror_offset()), mirror); + resolve_oop_handle(mirror); } // Clear Array diff --git a/src/hotspot/cpu/ppc/templateTable_ppc_64.cpp b/src/hotspot/cpu/ppc/templateTable_ppc_64.cpp index 43f6ad1c591..282ffeb218b 100644 --- a/src/hotspot/cpu/ppc/templateTable_ppc_64.cpp +++ b/src/hotspot/cpu/ppc/templateTable_ppc_64.cpp @@ -2224,6 +2224,7 @@ void TemplateTable::load_field_cp_cache_entry(Register Robj, if (is_static) { __ ld(Robj, in_bytes(cp_base_offset) + in_bytes(ConstantPoolCacheEntry::f1_offset()), Rcache); __ ld(Robj, in_bytes(Klass::java_mirror_offset()), Robj); + __ resolve_oop_handle(Robj); // Acquire not needed here. Following access has an address dependency on this value. } } diff --git a/src/hotspot/cpu/s390/macroAssembler_s390.cpp b/src/hotspot/cpu/s390/macroAssembler_s390.cpp index b8d3e4de275..af2c02934ff 100644 --- a/src/hotspot/cpu/s390/macroAssembler_s390.cpp +++ b/src/hotspot/cpu/s390/macroAssembler_s390.cpp @@ -4671,6 +4671,7 @@ void MacroAssembler::load_mirror(Register mirror, Register method) { mem2reg_opt(mirror, Address(mirror, ConstMethod::constants_offset())); mem2reg_opt(mirror, Address(mirror, ConstantPool::pool_holder_offset_in_bytes())); mem2reg_opt(mirror, Address(mirror, Klass::java_mirror_offset())); + resolve_oop_handle(mirror); } //--------------------------------------------------------------- diff --git a/src/hotspot/cpu/s390/templateTable_s390.cpp b/src/hotspot/cpu/s390/templateTable_s390.cpp index becbb0e48b5..50477e6e556 100644 --- a/src/hotspot/cpu/s390/templateTable_s390.cpp +++ b/src/hotspot/cpu/s390/templateTable_s390.cpp @@ -2382,6 +2382,7 @@ void TemplateTable::load_field_cp_cache_entry(Register obj, if (is_static) { __ mem2reg_opt(obj, Address(cache, index, cp_base_offset + ConstantPoolCacheEntry::f1_offset())); __ mem2reg_opt(obj, Address(obj, Klass::java_mirror_offset())); + __ resolve_oop_handle(obj); } } diff --git a/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp b/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp index 52d7d8c2fb3..30112382545 100644 --- a/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp +++ b/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp @@ -3844,6 +3844,7 @@ void MacroAssembler::load_mirror(Register mirror, Register method) { ld_ptr(mirror, in_bytes(ConstMethod::constants_offset()), mirror); ld_ptr(mirror, ConstantPool::pool_holder_offset_in_bytes(), mirror); ld_ptr(mirror, mirror_offset, mirror); + resolve_oop_handle(mirror); } void MacroAssembler::load_klass(Register src_oop, Register klass) { diff --git a/src/hotspot/cpu/sparc/templateTable_sparc.cpp b/src/hotspot/cpu/sparc/templateTable_sparc.cpp index f8d861a1df0..8683c35e635 100644 --- a/src/hotspot/cpu/sparc/templateTable_sparc.cpp +++ b/src/hotspot/cpu/sparc/templateTable_sparc.cpp @@ -2049,6 +2049,7 @@ void TemplateTable::load_field_cp_cache_entry(Register Robj, __ ld_ptr(Rcache, cp_base_offset + ConstantPoolCacheEntry::f1_offset(), Robj); const int mirror_offset = in_bytes(Klass::java_mirror_offset()); __ ld_ptr( Robj, mirror_offset, Robj); + __ resolve_oop_handle(Robj); } } diff --git a/src/hotspot/cpu/x86/macroAssembler_x86.cpp b/src/hotspot/cpu/x86/macroAssembler_x86.cpp index a8a908344e1..105c29fb972 100644 --- a/src/hotspot/cpu/x86/macroAssembler_x86.cpp +++ b/src/hotspot/cpu/x86/macroAssembler_x86.cpp @@ -6617,6 +6617,7 @@ void MacroAssembler::load_mirror(Register mirror, Register method) { movptr(mirror, Address(mirror, ConstMethod::constants_offset())); movptr(mirror, Address(mirror, ConstantPool::pool_holder_offset_in_bytes())); movptr(mirror, Address(mirror, mirror_offset)); + resolve_oop_handle(mirror); } void MacroAssembler::load_klass(Register dst, Register src) { diff --git a/src/hotspot/cpu/x86/templateTable_x86.cpp b/src/hotspot/cpu/x86/templateTable_x86.cpp index 60335333076..281a56c0f18 100644 --- a/src/hotspot/cpu/x86/templateTable_x86.cpp +++ b/src/hotspot/cpu/x86/templateTable_x86.cpp @@ -2665,6 +2665,7 @@ void TemplateTable::load_field_cp_cache_entry(Register obj, ConstantPoolCacheEntry::f1_offset()))); const int mirror_offset = in_bytes(Klass::java_mirror_offset()); __ movptr(obj, Address(obj, mirror_offset)); + __ resolve_oop_handle(obj); } } diff --git a/src/hotspot/share/c1/c1_LIRGenerator.cpp b/src/hotspot/share/c1/c1_LIRGenerator.cpp index 37bd62a6929..ed64f686a92 100644 --- a/src/hotspot/share/c1/c1_LIRGenerator.cpp +++ b/src/hotspot/share/c1/c1_LIRGenerator.cpp @@ -1304,7 +1304,9 @@ void LIRGenerator::do_getClass(Intrinsic* x) { // FIXME T_ADDRESS should actually be T_METADATA but it can't because the // meaning of these two is mixed up (see JDK-8026837). __ move(new LIR_Address(rcvr.result(), oopDesc::klass_offset_in_bytes(), T_ADDRESS), temp, info); - __ move_wide(new LIR_Address(temp, in_bytes(Klass::java_mirror_offset()), T_OBJECT), result); + __ move_wide(new LIR_Address(temp, in_bytes(Klass::java_mirror_offset()), T_ADDRESS), result); + // mirror = ((OopHandle)mirror)->resolve(); + __ move_wide(new LIR_Address(result, T_OBJECT), result); } // java.lang.Class::isPrimitive() diff --git a/src/hotspot/share/classfile/classLoaderData.cpp b/src/hotspot/share/classfile/classLoaderData.cpp index 8aaa0ee5044..927ce0663f5 100644 --- a/src/hotspot/share/classfile/classLoaderData.cpp +++ b/src/hotspot/share/classfile/classLoaderData.cpp @@ -98,7 +98,8 @@ ClassLoaderData::ClassLoaderData(Handle h_class_loader, bool is_anonymous, Depen _keep_alive((is_anonymous || h_class_loader.is_null()) ? 1 : 0), _metaspace(NULL), _unloading(false), _klasses(NULL), _modules(NULL), _packages(NULL), - _claimed(0), _jmethod_ids(NULL), _handles(), _deallocate_list(NULL), + _claimed(0), _modified_oops(true), _accumulated_modified_oops(false), + _jmethod_ids(NULL), _handles(), _deallocate_list(NULL), _next(NULL), _dependencies(dependencies), _metaspace_lock(new Mutex(Monitor::leaf+1, "Metaspace allocation lock", true, Monitor::_safepoint_check_never)) { @@ -207,7 +208,7 @@ bool ClassLoaderData::ChunkedHandleList::contains(oop* p) { oops_do(&cl); return cl.found(); } -#endif +#endif // ASSERT bool ClassLoaderData::claim() { if (_claimed == 1) { @@ -236,19 +237,19 @@ void ClassLoaderData::dec_keep_alive() { } } -void ClassLoaderData::oops_do(OopClosure* f, KlassClosure* klass_closure, bool must_claim) { +void ClassLoaderData::oops_do(OopClosure* f, bool must_claim, bool clear_mod_oops) { if (must_claim && !claim()) { return; } + // Only clear modified_oops after the ClassLoaderData is claimed. + if (clear_mod_oops) { + clear_modified_oops(); + } + f->do_oop(&_class_loader); _dependencies.oops_do(f); - _handles.oops_do(f); - - if (klass_closure != NULL) { - classes_do(klass_closure); - } } void ClassLoaderData::Dependencies::oops_do(OopClosure* f) { @@ -368,6 +369,9 @@ void ClassLoaderData::record_dependency(const Klass* k, TRAPS) { // Must handle over GC point. Handle dependency(THREAD, to); from_cld->_dependencies.add(dependency, CHECK); + + // Added a potentially young gen oop to the ClassLoaderData + record_modified_oops(); } @@ -764,6 +768,7 @@ Metaspace* ClassLoaderData::metaspace_non_null() { OopHandle ClassLoaderData::add_handle(Handle h) { MutexLockerEx ml(metaspace_lock(), Mutex::_no_safepoint_check_flag); + record_modified_oops(); return OopHandle(_handles.add(h())); } @@ -875,8 +880,7 @@ void ClassLoaderData::dump(outputStream * const out) { if (Verbose) { Klass* k = _klasses; while (k != NULL) { - out->print_cr("klass " PTR_FORMAT ", %s, CT: %d, MUT: %d", k, k->name()->as_C_string(), - k->has_modified_oops(), k->has_accumulated_modified_oops()); + out->print_cr("klass " PTR_FORMAT ", %s", p2i(k), k->name()->as_C_string()); assert(k != k->next_link(), "no loops!"); k = k->next_link(); } @@ -1003,25 +1007,25 @@ void ClassLoaderDataGraph::print_creation(outputStream* out, Handle loader, Clas } -void ClassLoaderDataGraph::oops_do(OopClosure* f, KlassClosure* klass_closure, bool must_claim) { +void ClassLoaderDataGraph::oops_do(OopClosure* f, bool must_claim) { for (ClassLoaderData* cld = _head; cld != NULL; cld = cld->next()) { - cld->oops_do(f, klass_closure, must_claim); + cld->oops_do(f, must_claim); } } -void ClassLoaderDataGraph::keep_alive_oops_do(OopClosure* f, KlassClosure* klass_closure, bool must_claim) { +void ClassLoaderDataGraph::keep_alive_oops_do(OopClosure* f, bool must_claim) { for (ClassLoaderData* cld = _head; cld != NULL; cld = cld->next()) { if (cld->keep_alive()) { - cld->oops_do(f, klass_closure, must_claim); + cld->oops_do(f, must_claim); } } } -void ClassLoaderDataGraph::always_strong_oops_do(OopClosure* f, KlassClosure* klass_closure, bool must_claim) { +void ClassLoaderDataGraph::always_strong_oops_do(OopClosure* f, bool must_claim) { if (ClassUnloading) { - keep_alive_oops_do(f, klass_closure, must_claim); + keep_alive_oops_do(f, must_claim); } else { - oops_do(f, klass_closure, must_claim); + oops_do(f, must_claim); } } diff --git a/src/hotspot/share/classfile/classLoaderData.hpp b/src/hotspot/share/classfile/classLoaderData.hpp index 524c985dea2..4b6d680a9e3 100644 --- a/src/hotspot/share/classfile/classLoaderData.hpp +++ b/src/hotspot/share/classfile/classLoaderData.hpp @@ -87,9 +87,9 @@ class ClassLoaderDataGraph : public AllStatic { static void purge(); static void clear_claimed_marks(); // oops do - static void oops_do(OopClosure* f, KlassClosure* klass_closure, bool must_claim); - static void keep_alive_oops_do(OopClosure* blk, KlassClosure* klass_closure, bool must_claim); - static void always_strong_oops_do(OopClosure* blk, KlassClosure* klass_closure, bool must_claim); + static void oops_do(OopClosure* f, bool must_claim); + static void keep_alive_oops_do(OopClosure* blk, bool must_claim); + static void always_strong_oops_do(OopClosure* blk, bool must_claim); // cld do static void cld_do(CLDClosure* cl); static void cld_unloading_do(CLDClosure* cl); @@ -230,10 +230,16 @@ class ClassLoaderData : public CHeapObj { Mutex* _metaspace_lock; // Locks the metaspace for allocations and setup. bool _unloading; // true if this class loader goes away bool _is_anonymous; // if this CLD is for an anonymous class + + // Remembered sets support for the oops in the class loader data. + bool _modified_oops; // Card Table Equivalent (YC/CMS support) + bool _accumulated_modified_oops; // Mod Union Equivalent (CMS support) + s2 _keep_alive; // if this CLD is kept alive without a keep_alive_object(). // Used for anonymous classes and the boot class // loader. _keep_alive does not need to be volatile or // atomic since there is one unique CLD per anonymous class. + volatile int _claimed; // true if claimed, for example during GC traces. // To avoid applying oop closure more than once. // Has to be an int because we cas it. @@ -276,6 +282,19 @@ class ClassLoaderData : public CHeapObj { bool claimed() const { return _claimed == 1; } bool claim(); + // The CLD are not placed in the Heap, so the Card Table or + // the Mod Union Table can't be used to mark when CLD have modified oops. + // The CT and MUT bits saves this information for the whole class loader data. + void clear_modified_oops() { _modified_oops = false; } + public: + void record_modified_oops() { _modified_oops = true; } + bool has_modified_oops() { return _modified_oops; } + + void accumulate_modified_oops() { if (has_modified_oops()) _accumulated_modified_oops = true; } + void clear_accumulated_modified_oops() { _accumulated_modified_oops = false; } + bool has_accumulated_modified_oops() { return _accumulated_modified_oops; } + private: + void unload(); bool keep_alive() const { return _keep_alive > 0; } void classes_do(void f(Klass*)); @@ -346,8 +365,7 @@ class ClassLoaderData : public CHeapObj { inline unsigned int identity_hash() const { return (unsigned int)(((intptr_t)this) >> 3); } - // Used when tracing from klasses. - void oops_do(OopClosure* f, KlassClosure* klass_closure, bool must_claim); + void oops_do(OopClosure* f, bool must_claim, bool clear_modified_oops = false); void classes_do(KlassClosure* klass_closure); Klass* klasses() { return _klasses; } diff --git a/src/hotspot/share/classfile/javaClasses.cpp b/src/hotspot/share/classfile/javaClasses.cpp index 26720f2b258..3499d3e9d01 100644 --- a/src/hotspot/share/classfile/javaClasses.cpp +++ b/src/hotspot/share/classfile/javaClasses.cpp @@ -889,7 +889,7 @@ void java_lang_Class::create_mirror(Klass* k, Handle class_loader, // Setup indirection from klass->mirror // after any exceptions can happen during allocations. - k->set_java_mirror(mirror()); + k->set_java_mirror(mirror); // Set the module field in the java_lang_Class instance. This must be done // after the mirror is set. diff --git a/src/hotspot/share/gc/cms/cmsOopClosures.hpp b/src/hotspot/share/gc/cms/cmsOopClosures.hpp index 11416afebc9..ab29b0136cd 100644 --- a/src/hotspot/share/gc/cms/cmsOopClosures.hpp +++ b/src/hotspot/share/gc/cms/cmsOopClosures.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2007, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2007, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -48,12 +48,7 @@ class ParMarkFromRootsClosure; // because some CMS OopClosures derive from OopsInGenClosure. It would be // good to get rid of them completely. class MetadataAwareOopsInGenClosure: public OopsInGenClosure { - KlassToOopClosure _klass_closure; public: - MetadataAwareOopsInGenClosure() { - _klass_closure.initialize(this); - } - virtual bool do_metadata() { return do_metadata_nv(); } inline bool do_metadata_nv() { return true; } diff --git a/src/hotspot/share/gc/cms/cmsOopClosures.inline.hpp b/src/hotspot/share/gc/cms/cmsOopClosures.inline.hpp index 36a6e841cfc..ad01a9d45d7 100644 --- a/src/hotspot/share/gc/cms/cmsOopClosures.inline.hpp +++ b/src/hotspot/share/gc/cms/cmsOopClosures.inline.hpp @@ -40,10 +40,8 @@ inline void MetadataAwareOopsInGenClosure::do_klass_nv(Klass* k) { inline void MetadataAwareOopsInGenClosure::do_klass(Klass* k) { do_klass_nv(k); } inline void MetadataAwareOopsInGenClosure::do_cld_nv(ClassLoaderData* cld) { - assert(_klass_closure._oop_closure == this, "Must be"); - bool claim = true; // Must claim the class loader data before processing. - cld->oops_do(_klass_closure._oop_closure, &_klass_closure, claim); + cld->oops_do(this, claim); } // Decode the oop and call do_oop on it. diff --git a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp index e9a2fe8123b..59161a2baa6 100644 --- a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp +++ b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp @@ -1553,9 +1553,10 @@ void CMSCollector::do_compaction_work(bool clear_all_soft_refs) { assert(_collectorState != Idling || _modUnionTable.isAllClear(), "_modUnionTable should be clear if the baton was not passed"); _modUnionTable.clear_all(); - assert(_collectorState != Idling || _ct->klass_rem_set()->mod_union_is_clear(), + assert(_collectorState != Idling || _ct->cld_rem_set()->mod_union_is_clear(), "mod union for klasses should be clear if the baton was passed"); - _ct->klass_rem_set()->clear_mod_union(); + _ct->cld_rem_set()->clear_mod_union(); + // We must adjust the allocation statistics being maintained // in the free list space. We do so by reading and clearing @@ -2025,7 +2026,7 @@ void CMSCollector::gc_prologue(bool full) { // that information. Tell the young collection to save the union of all // modified klasses. if (duringMarking) { - _ct->klass_rem_set()->set_accumulate_modified_oops(true); + _ct->cld_rem_set()->set_accumulate_modified_oops(true); } bool registerClosure = duringMarking; @@ -2101,7 +2102,7 @@ void CMSCollector::gc_epilogue(bool full) { assert(haveFreelistLocks(), "must have freelist locks"); assert_lock_strong(bitMapLock()); - _ct->klass_rem_set()->set_accumulate_modified_oops(false); + _ct->cld_rem_set()->set_accumulate_modified_oops(false); _cmsGen->gc_epilogue_work(full); @@ -2380,18 +2381,18 @@ void CMSCollector::verify_after_remark_work_1() { } } -class VerifyKlassOopsKlassClosure : public KlassClosure { - class VerifyKlassOopsClosure : public OopClosure { +class VerifyCLDOopsCLDClosure : public CLDClosure { + class VerifyCLDOopsClosure : public OopClosure { CMSBitMap* _bitmap; public: - VerifyKlassOopsClosure(CMSBitMap* bitmap) : _bitmap(bitmap) { } + VerifyCLDOopsClosure(CMSBitMap* bitmap) : _bitmap(bitmap) { } void do_oop(oop* p) { guarantee(*p == NULL || _bitmap->isMarked((HeapWord*) *p), "Should be marked"); } void do_oop(narrowOop* p) { ShouldNotReachHere(); } } _oop_closure; public: - VerifyKlassOopsKlassClosure(CMSBitMap* bitmap) : _oop_closure(bitmap) {} - void do_klass(Klass* k) { - k->oops_do(&_oop_closure); + VerifyCLDOopsCLDClosure(CMSBitMap* bitmap) : _oop_closure(bitmap) {} + void do_cld(ClassLoaderData* cld) { + cld->oops_do(&_oop_closure, false, false); } }; @@ -2437,8 +2438,8 @@ void CMSCollector::verify_after_remark_work_2() { assert(verification_mark_stack()->isEmpty(), "Should have been drained"); verify_work_stacks_empty(); - VerifyKlassOopsKlassClosure verify_klass_oops(verification_mark_bm()); - ClassLoaderDataGraph::classes_do(&verify_klass_oops); + VerifyCLDOopsCLDClosure verify_cld_oops(verification_mark_bm()); + ClassLoaderDataGraph::cld_do(&verify_cld_oops); // Marking completed -- now verify that each bit marked in // verification_mark_bm() is also marked in markBitMap(); flag all @@ -2911,7 +2912,7 @@ void CMSCollector::checkpointRootsInitialWork() { " or no bits are set in the gc_prologue before the start of the next " "subsequent marking phase."); - assert(_ct->klass_rem_set()->mod_union_is_clear(), "Must be"); + assert(_ct->cld_rem_set()->mod_union_is_clear(), "Must be"); // Save the end of the used_region of the constituent generations // to be used to limit the extent of sweep in each generation. @@ -3848,7 +3849,7 @@ size_t CMSCollector::preclean_work(bool clean_refs, bool clean_survivor) { } } - preclean_klasses(&mrias_cl, _cmsGen->freelistLock()); + preclean_cld(&mrias_cl, _cmsGen->freelistLock()); curNumCards = preclean_card_table(_cmsGen, &smoac_cl); cumNumCards += curNumCards; @@ -4067,21 +4068,21 @@ size_t CMSCollector::preclean_card_table(ConcurrentMarkSweepGeneration* old_gen, return cumNumDirtyCards; } -class PrecleanKlassClosure : public KlassClosure { - KlassToOopClosure _cm_klass_closure; +class PrecleanCLDClosure : public CLDClosure { + MetadataAwareOopsInGenClosure* _cm_closure; public: - PrecleanKlassClosure(OopClosure* oop_closure) : _cm_klass_closure(oop_closure) {} - void do_klass(Klass* k) { - if (k->has_accumulated_modified_oops()) { - k->clear_accumulated_modified_oops(); + PrecleanCLDClosure(MetadataAwareOopsInGenClosure* oop_closure) : _cm_closure(oop_closure) {} + void do_cld(ClassLoaderData* cld) { + if (cld->has_accumulated_modified_oops()) { + cld->clear_accumulated_modified_oops(); - _cm_klass_closure.do_klass(k); + _cm_closure->do_cld(cld); } } }; // The freelist lock is needed to prevent asserts, is it really needed? -void CMSCollector::preclean_klasses(MarkRefsIntoAndScanClosure* cl, Mutex* freelistLock) { +void CMSCollector::preclean_cld(MarkRefsIntoAndScanClosure* cl, Mutex* freelistLock) { cl->set_freelistLock(freelistLock); @@ -4089,8 +4090,8 @@ void CMSCollector::preclean_klasses(MarkRefsIntoAndScanClosure* cl, Mutex* freel // SSS: Add equivalent to ScanMarkedObjectsAgainCarefullyClosure::do_yield_check and should_abort_preclean? // SSS: We should probably check if precleaning should be aborted, at suitable intervals? - PrecleanKlassClosure preclean_klass_closure(cl); - ClassLoaderDataGraph::classes_do(&preclean_klass_closure); + PrecleanCLDClosure preclean_closure(cl); + ClassLoaderDataGraph::cld_do(&preclean_closure); verify_work_stacks_empty(); verify_overflow_empty(); @@ -4250,7 +4251,7 @@ void CMSCollector::checkpointRootsFinalWork() { // Call isAllClear() under bitMapLock assert(_modUnionTable.isAllClear(), "Should be clear by end of the final marking"); - assert(_ct->klass_rem_set()->mod_union_is_clear(), + assert(_ct->cld_rem_set()->mod_union_is_clear(), "Should be clear by end of the final marking"); } @@ -4332,26 +4333,26 @@ class CMSParRemarkTask: public CMSParMarkTask { void do_work_steal(int i, ParMarkRefsIntoAndScanClosure* cl, int* seed); }; -class RemarkKlassClosure : public KlassClosure { - KlassToOopClosure _cm_klass_closure; +class RemarkCLDClosure : public CLDClosure { + CLDToOopClosure _cm_closure; public: - RemarkKlassClosure(OopClosure* oop_closure) : _cm_klass_closure(oop_closure) {} - void do_klass(Klass* k) { - // Check if we have modified any oops in the Klass during the concurrent marking. - if (k->has_accumulated_modified_oops()) { - k->clear_accumulated_modified_oops(); + RemarkCLDClosure(OopClosure* oop_closure) : _cm_closure(oop_closure) {} + void do_cld(ClassLoaderData* cld) { + // Check if we have modified any oops in the CLD during the concurrent marking. + if (cld->has_accumulated_modified_oops()) { + cld->clear_accumulated_modified_oops(); // We could have transfered the current modified marks to the accumulated marks, // like we do with the Card Table to Mod Union Table. But it's not really necessary. - } else if (k->has_modified_oops()) { + } else if (cld->has_modified_oops()) { // Don't clear anything, this info is needed by the next young collection. } else { - // No modified oops in the Klass. + // No modified oops in the ClassLoaderData. return; } // The klass has modified fields, need to scan the klass. - _cm_klass_closure.do_klass(k); + _cm_closure.do_cld(cld); } }; @@ -4439,24 +4440,24 @@ void CMSParRemarkTask::work(uint worker_id) { log_trace(gc, task)("Finished unhandled CLD scanning work in %dth thread: %3.3f sec", worker_id, _timer.seconds()); } - // ---------- dirty klass scanning ---------- + // We might have added oops to ClassLoaderData::_handles during the + // concurrent marking phase. These oops do not always point to newly allocated objects + // that are guaranteed to be kept alive. Hence, + // we do have to revisit the _handles block during the remark phase. + + // ---------- dirty CLD scanning ---------- if (worker_id == 0) { // Single threaded at the moment. _timer.reset(); _timer.start(); // Scan all classes that was dirtied during the concurrent marking phase. - RemarkKlassClosure remark_klass_closure(&par_mrias_cl); - ClassLoaderDataGraph::classes_do(&remark_klass_closure); + RemarkCLDClosure remark_closure(&par_mrias_cl); + ClassLoaderDataGraph::cld_do(&remark_closure); _timer.stop(); - log_trace(gc, task)("Finished dirty klass scanning work in %dth thread: %3.3f sec", worker_id, _timer.seconds()); + log_trace(gc, task)("Finished dirty CLD scanning work in %dth thread: %3.3f sec", worker_id, _timer.seconds()); } - // We might have added oops to ClassLoaderData::_handles during the - // concurrent marking phase. These oops point to newly allocated objects - // that are guaranteed to be kept alive. Either by the direct allocation - // code, or when the young collector processes the roots. Hence, - // we don't have to revisit the _handles block during the remark phase. // ---------- rescan dirty cards ------------ _timer.reset(); @@ -4981,23 +4982,21 @@ void CMSCollector::do_remark_non_parallel() { verify_work_stacks_empty(); } + // We might have added oops to ClassLoaderData::_handles during the + // concurrent marking phase. These oops do not point to newly allocated objects + // that are guaranteed to be kept alive. Hence, + // we do have to revisit the _handles block during the remark phase. { - GCTraceTime(Trace, gc, phases) t("Dirty Klass Scan", _gc_timer_cm); + GCTraceTime(Trace, gc, phases) t("Dirty CLD Scan", _gc_timer_cm); verify_work_stacks_empty(); - RemarkKlassClosure remark_klass_closure(&mrias_cl); - ClassLoaderDataGraph::classes_do(&remark_klass_closure); + RemarkCLDClosure remark_closure(&mrias_cl); + ClassLoaderDataGraph::cld_do(&remark_closure); verify_work_stacks_empty(); } - // We might have added oops to ClassLoaderData::_handles during the - // concurrent marking phase. These oops point to newly allocated objects - // that are guaranteed to be kept alive. Either by the direct allocation - // code, or when the young collector processes the roots. Hence, - // we don't have to revisit the _handles block during the remark phase. - verify_work_stacks_empty(); // Restore evacuated mark words, if any, used for overflow list links restore_preserved_marks_if_any(); diff --git a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.hpp b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.hpp index 978310aaade..aebaae75705 100644 --- a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.hpp +++ b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.hpp @@ -777,7 +777,7 @@ class CMSCollector: public CHeapObj { // Does precleaning work, returning a quantity indicative of // the amount of "useful work" done. size_t preclean_work(bool clean_refs, bool clean_survivors); - void preclean_klasses(MarkRefsIntoAndScanClosure* cl, Mutex* freelistLock); + void preclean_cld(MarkRefsIntoAndScanClosure* cl, Mutex* freelistLock); void abortable_preclean(); // Preclean while looking for possible abort void initialize_sequential_subtasks_for_young_gen_rescan(int i); // Helper function for above; merge-sorts the per-thread plab samples diff --git a/src/hotspot/share/gc/cms/parNewGeneration.cpp b/src/hotspot/share/gc/cms/parNewGeneration.cpp index 873fad0b251..b8bdd04af0a 100644 --- a/src/hotspot/share/gc/cms/parNewGeneration.cpp +++ b/src/hotspot/share/gc/cms/parNewGeneration.cpp @@ -493,7 +493,7 @@ void ParScanThreadStateSet::flush() { ParScanClosure::ParScanClosure(ParNewGeneration* g, ParScanThreadState* par_scan_state) : - OopsInKlassOrGenClosure(g), _par_scan_state(par_scan_state), _g(g) { + OopsInClassLoaderDataOrGenClosure(g), _par_scan_state(par_scan_state), _g(g) { _boundary = _g->reserved().end(); } @@ -601,11 +601,8 @@ void ParNewGenTask::work(uint worker_id) { par_scan_state.set_young_old_boundary(_young_old_boundary); - KlassScanClosure klass_scan_closure(&par_scan_state.to_space_root_closure(), - gch->rem_set()->klass_rem_set()); - CLDToKlassAndOopClosure cld_scan_closure(&klass_scan_closure, - &par_scan_state.to_space_root_closure(), - false); + CLDScanClosure cld_scan_closure(&par_scan_state.to_space_root_closure(), + gch->rem_set()->cld_rem_set()->accumulate_modified_oops()); par_scan_state.start_strong_roots(); gch->young_process_roots(_strong_roots_scope, diff --git a/src/hotspot/share/gc/cms/parOopClosures.hpp b/src/hotspot/share/gc/cms/parOopClosures.hpp index daf95f65785..87b5d98d975 100644 --- a/src/hotspot/share/gc/cms/parOopClosures.hpp +++ b/src/hotspot/share/gc/cms/parOopClosures.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2007, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2007, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -37,7 +37,7 @@ typedef Padded ObjToScanQueue; typedef GenericTaskQueueSet ObjToScanQueueSet; class ParallelTaskTerminator; -class ParScanClosure: public OopsInKlassOrGenClosure { +class ParScanClosure: public OopsInClassLoaderDataOrGenClosure { protected: ParScanThreadState* _par_scan_state; ParNewGeneration* _g; diff --git a/src/hotspot/share/gc/cms/parOopClosures.inline.hpp b/src/hotspot/share/gc/cms/parOopClosures.inline.hpp index 12092b62be9..eb4dea537e4 100644 --- a/src/hotspot/share/gc/cms/parOopClosures.inline.hpp +++ b/src/hotspot/share/gc/cms/parOopClosures.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2007, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2007, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -126,8 +126,8 @@ inline void ParScanClosure::do_oop_work(T* p, (void)_par_scan_state->trim_queues(10 * ParallelGCThreads); } } - if (is_scanning_a_klass()) { - do_klass_barrier(); + if (is_scanning_a_cld()) { + do_cld_barrier(); } else if (gc_barrier) { // Now call parent closure par_do_barrier(p); diff --git a/src/hotspot/share/gc/g1/g1CollectedHeap.hpp b/src/hotspot/share/gc/g1/g1CollectedHeap.hpp index 5ed6ae89021..266fffa2d02 100644 --- a/src/hotspot/share/gc/g1/g1CollectedHeap.hpp +++ b/src/hotspot/share/gc/g1/g1CollectedHeap.hpp @@ -63,7 +63,6 @@ class HRRSCleanupTask; class GenerationSpec; class G1ParScanThreadState; class G1ParScanThreadStateSet; -class G1KlassScanClosure; class G1ParScanThreadState; class ObjectClosure; class SpaceClosure; diff --git a/src/hotspot/share/gc/g1/g1HeapVerifier.cpp b/src/hotspot/share/gc/g1/g1HeapVerifier.cpp index 8b2e0334333..9604b8b9481 100644 --- a/src/hotspot/share/gc/g1/g1HeapVerifier.cpp +++ b/src/hotspot/share/gc/g1/g1HeapVerifier.cpp @@ -161,18 +161,18 @@ class YoungRefCounterClosure : public OopClosure { void reset_count() { _count = 0; }; }; -class VerifyKlassClosure: public KlassClosure { +class VerifyCLDClosure: public CLDClosure { YoungRefCounterClosure _young_ref_counter_closure; OopClosure *_oop_closure; public: - VerifyKlassClosure(G1CollectedHeap* g1h, OopClosure* cl) : _young_ref_counter_closure(g1h), _oop_closure(cl) {} - void do_klass(Klass* k) { - k->oops_do(_oop_closure); + VerifyCLDClosure(G1CollectedHeap* g1h, OopClosure* cl) : _young_ref_counter_closure(g1h), _oop_closure(cl) {} + void do_cld(ClassLoaderData* cld) { + cld->oops_do(_oop_closure, false); _young_ref_counter_closure.reset_count(); - k->oops_do(&_young_ref_counter_closure); + cld->oops_do(&_young_ref_counter_closure, false); if (_young_ref_counter_closure.count() > 0) { - guarantee(k->has_modified_oops(), "Klass " PTR_FORMAT ", has young refs but is not dirty.", p2i(k)); + guarantee(cld->has_modified_oops(), "CLD " PTR_FORMAT ", has young %d refs but is not dirty.", p2i(cld), _young_ref_counter_closure.count()); } } }; @@ -390,8 +390,7 @@ void G1HeapVerifier::verify(VerifyOption vo) { log_debug(gc, verify)("Roots"); VerifyRootsClosure rootsCl(vo); - VerifyKlassClosure klassCl(_g1h, &rootsCl); - CLDToKlassAndOopClosure cldCl(&klassCl, &rootsCl, false); + VerifyCLDClosure cldCl(_g1h, &rootsCl); // We apply the relevant closures to all the oops in the // system dictionary, class loader data graph, the string table diff --git a/src/hotspot/share/gc/g1/g1OopClosures.cpp b/src/hotspot/share/gc/g1/g1OopClosures.cpp index 9b04478f2d7..94a7da8b722 100644 --- a/src/hotspot/share/gc/g1/g1OopClosures.cpp +++ b/src/hotspot/share/gc/g1/g1OopClosures.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2014, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2014, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -34,7 +34,7 @@ G1ParCopyHelper::G1ParCopyHelper(G1CollectedHeap* g1, G1ParScanThreadState* par _g1(g1), _par_scan_state(par_scan_state), _worker_id(par_scan_state->worker_id()), - _scanned_klass(NULL), + _scanned_cld(NULL), _cm(_g1->concurrent_mark()) { } @@ -42,20 +42,20 @@ G1ScanClosureBase::G1ScanClosureBase(G1CollectedHeap* g1, G1ParScanThreadState* _g1(g1), _par_scan_state(par_scan_state), _from(NULL) { } -void G1KlassScanClosure::do_klass(Klass* klass) { - // If the klass has not been dirtied we know that there's +void G1CLDScanClosure::do_cld(ClassLoaderData* cld) { + // If the class loader data has not been dirtied we know that there's // no references into the young gen and we can skip it. - if (!_process_only_dirty || klass->has_modified_oops()) { - // Clean the klass since we're going to scavenge all the metadata. - klass->clear_modified_oops(); + if (!_process_only_dirty || cld->has_modified_oops()) { - // Tell the closure that this klass is the Klass to scavenge + // Tell the closure that this class loader data is the CLD to scavenge // and is the one to dirty if oops are left pointing into the young gen. - _closure->set_scanned_klass(klass); + _closure->set_scanned_cld(cld); - klass->oops_do(_closure); + // Clean the cld since we're going to scavenge all the metadata. + // Clear modified oops only if this cld is claimed. + cld->oops_do(_closure, _must_claim, /*clear_modified_oops*/true); - _closure->set_scanned_klass(NULL); + _closure->set_scanned_cld(NULL); } _count++; } diff --git a/src/hotspot/share/gc/g1/g1OopClosures.hpp b/src/hotspot/share/gc/g1/g1OopClosures.hpp index 20a2bd5252b..4d961ac946e 100644 --- a/src/hotspot/share/gc/g1/g1OopClosures.hpp +++ b/src/hotspot/share/gc/g1/g1OopClosures.hpp @@ -107,7 +107,7 @@ protected: G1CollectedHeap* _g1; G1ParScanThreadState* _par_scan_state; uint _worker_id; // Cache value from par_scan_state. - Klass* _scanned_klass; + ClassLoaderData* _scanned_cld; G1ConcurrentMark* _cm; // Mark the object if it's not already marked. This is used to mark @@ -124,13 +124,13 @@ protected: ~G1ParCopyHelper() { } public: - void set_scanned_klass(Klass* k) { _scanned_klass = k; } - template inline void do_klass_barrier(T* p, oop new_obj); + void set_scanned_cld(ClassLoaderData* cld) { _scanned_cld = cld; } + inline void do_cld_barrier(oop new_obj); }; enum G1Barrier { G1BarrierNone, - G1BarrierKlass + G1BarrierCLD }; enum G1Mark { @@ -150,14 +150,16 @@ public: virtual void do_oop(narrowOop* p) { do_oop_work(p); } }; -class G1KlassScanClosure : public KlassClosure { +class G1CLDScanClosure : public CLDClosure { G1ParCopyHelper* _closure; bool _process_only_dirty; + bool _must_claim; int _count; public: - G1KlassScanClosure(G1ParCopyHelper* closure, bool process_only_dirty) - : _process_only_dirty(process_only_dirty), _closure(closure), _count(0) {} - void do_klass(Klass* klass); + G1CLDScanClosure(G1ParCopyHelper* closure, + bool process_only_dirty, bool must_claim) + : _process_only_dirty(process_only_dirty), _must_claim(must_claim), _closure(closure), _count(0) {} + void do_cld(ClassLoaderData* cld); }; // Closure for iterating over object fields during concurrent marking diff --git a/src/hotspot/share/gc/g1/g1OopClosures.inline.hpp b/src/hotspot/share/gc/g1/g1OopClosures.inline.hpp index 017b2df5c13..e3b6887880c 100644 --- a/src/hotspot/share/gc/g1/g1OopClosures.inline.hpp +++ b/src/hotspot/share/gc/g1/g1OopClosures.inline.hpp @@ -195,10 +195,9 @@ inline void G1ScanObjsDuringScanRSClosure::do_oop_nv(T* p) { } } -template -void G1ParCopyHelper::do_klass_barrier(T* p, oop new_obj) { +void G1ParCopyHelper::do_cld_barrier(oop new_obj) { if (_g1->heap_region_containing(new_obj)->is_young()) { - _scanned_klass->record_modified_oops(); + _scanned_cld->record_modified_oops(); } } @@ -249,8 +248,8 @@ void G1ParCopyClosure::do_oop_work(T* p) { mark_forwarded_object(obj, forwardee); } - if (barrier == G1BarrierKlass) { - do_klass_barrier(p, forwardee); + if (barrier == G1BarrierCLD) { + do_cld_barrier(forwardee); } } else { if (state.is_humongous()) { @@ -267,5 +266,4 @@ void G1ParCopyClosure::do_oop_work(T* p) { } } } - #endif // SHARE_VM_GC_G1_G1OOPCLOSURES_INLINE_HPP diff --git a/src/hotspot/share/gc/g1/g1SharedClosures.hpp b/src/hotspot/share/gc/g1/g1SharedClosures.hpp index 2c9352394ae..38c54f5b7d4 100644 --- a/src/hotspot/share/gc/g1/g1SharedClosures.hpp +++ b/src/hotspot/share/gc/g1/g1SharedClosures.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2015, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -34,18 +34,17 @@ class G1ParScanThreadState; template class G1SharedClosures VALUE_OBJ_CLASS_SPEC { public: - G1ParCopyClosure _oops; - G1ParCopyClosure _oop_in_klass; - G1KlassScanClosure _klass_in_cld_closure; - CLDToKlassAndOopClosure _clds; - G1CodeBlobClosure _codeblobs; - BufferingOopClosure _buffered_oops; + G1ParCopyClosure _oops; + G1ParCopyClosure _oops_in_cld; - G1SharedClosures(G1CollectedHeap* g1h, G1ParScanThreadState* pss, bool process_only_dirty_klasses, bool must_claim_cld) : + G1CLDScanClosure _clds; + G1CodeBlobClosure _codeblobs; + BufferingOopClosure _buffered_oops; + + G1SharedClosures(G1CollectedHeap* g1h, G1ParScanThreadState* pss, bool process_only_dirty, bool must_claim_cld) : _oops(g1h, pss), - _oop_in_klass(g1h, pss), - _klass_in_cld_closure(&_oop_in_klass, process_only_dirty_klasses), - _clds(&_klass_in_cld_closure, &_oops, must_claim_cld), + _oops_in_cld(g1h, pss), + _clds(&_oops_in_cld, process_only_dirty, must_claim_cld), _codeblobs(&_oops), _buffered_oops(&_oops) {} }; diff --git a/src/hotspot/share/gc/parallel/pcTasks.cpp b/src/hotspot/share/gc/parallel/pcTasks.cpp index 8cae47c23ef..f5db42d6d09 100644 --- a/src/hotspot/share/gc/parallel/pcTasks.cpp +++ b/src/hotspot/share/gc/parallel/pcTasks.cpp @@ -81,7 +81,6 @@ void MarkFromRootsTask::do_it(GCTaskManager* manager, uint which) { ParCompactionManager* cm = ParCompactionManager::gc_thread_compaction_manager(which); ParCompactionManager::MarkAndPushClosure mark_and_push_closure(cm); - ParCompactionManager::FollowKlassClosure follow_klass_closure(&mark_and_push_closure); switch (_root_type) { case universe: @@ -117,7 +116,7 @@ void MarkFromRootsTask::do_it(GCTaskManager* manager, uint which) { break; case class_loader_data: - ClassLoaderDataGraph::always_strong_oops_do(&mark_and_push_closure, &follow_klass_closure, true); + ClassLoaderDataGraph::always_strong_oops_do(&mark_and_push_closure, true); break; case code_cache: diff --git a/src/hotspot/share/gc/parallel/psCompactionManager.hpp b/src/hotspot/share/gc/parallel/psCompactionManager.hpp index 9eb8bceff57..4690b1d9e3e 100644 --- a/src/hotspot/share/gc/parallel/psCompactionManager.hpp +++ b/src/hotspot/share/gc/parallel/psCompactionManager.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2005, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2005, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -196,17 +196,6 @@ private: FollowStackClosure(ParCompactionManager* cm) : _compaction_manager(cm) { } virtual void do_void(); }; - - // The one and only place to start following the classes. - // Should only be applied to the ClassLoaderData klasses list. - class FollowKlassClosure : public KlassClosure { - private: - MarkAndPushClosure* _mark_and_push_closure; - public: - FollowKlassClosure(MarkAndPushClosure* mark_and_push_closure) : - _mark_and_push_closure(mark_and_push_closure) { } - void do_klass(Klass* klass); - }; }; inline ParCompactionManager* ParCompactionManager::manager_array(uint index) { diff --git a/src/hotspot/share/gc/parallel/psCompactionManager.inline.hpp b/src/hotspot/share/gc/parallel/psCompactionManager.inline.hpp index 7d844c08db7..1376fa65c8e 100644 --- a/src/hotspot/share/gc/parallel/psCompactionManager.inline.hpp +++ b/src/hotspot/share/gc/parallel/psCompactionManager.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2010, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2010, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -98,15 +98,10 @@ inline void ParCompactionManager::FollowStackClosure::do_void() { _compaction_manager->follow_marking_stacks(); } -inline void ParCompactionManager::FollowKlassClosure::do_klass(Klass* klass) { - klass->oops_do(_mark_and_push_closure); -} - inline void ParCompactionManager::follow_class_loader(ClassLoaderData* cld) { MarkAndPushClosure mark_and_push_closure(this); - FollowKlassClosure follow_klass_closure(&mark_and_push_closure); - cld->oops_do(&mark_and_push_closure, &follow_klass_closure, true); + cld->oops_do(&mark_and_push_closure, true); } inline void ParCompactionManager::follow_contents(oop obj) { diff --git a/src/hotspot/share/gc/parallel/psParallelCompact.cpp b/src/hotspot/share/gc/parallel/psParallelCompact.cpp index 8ed22f4ab2a..8e96a9ec869 100644 --- a/src/hotspot/share/gc/parallel/psParallelCompact.cpp +++ b/src/hotspot/share/gc/parallel/psParallelCompact.cpp @@ -838,11 +838,6 @@ PSParallelCompact::IsAliveClosure PSParallelCompact::_is_alive_closure; bool PSParallelCompact::IsAliveClosure::do_object_b(oop p) { return mark_bitmap()->is_marked(p); } -void PSParallelCompact::AdjustKlassClosure::do_klass(Klass* klass) { - PSParallelCompact::AdjustPointerClosure closure(_cm); - klass->oops_do(&closure); -} - void PSParallelCompact::post_initialize() { ParallelScavengeHeap* heap = ParallelScavengeHeap::heap(); MemRegion mr = heap->reserved_region(); @@ -2162,7 +2157,6 @@ void PSParallelCompact::adjust_roots(ParCompactionManager* cm) { ClassLoaderDataGraph::clear_claimed_marks(); PSParallelCompact::AdjustPointerClosure oop_closure(cm); - PSParallelCompact::AdjustKlassClosure klass_closure(cm); // General strong roots. Universe::oops_do(&oop_closure); @@ -2172,7 +2166,7 @@ void PSParallelCompact::adjust_roots(ParCompactionManager* cm) { Management::oops_do(&oop_closure); JvmtiExport::oops_do(&oop_closure); SystemDictionary::oops_do(&oop_closure); - ClassLoaderDataGraph::oops_do(&oop_closure, &klass_closure, true); + ClassLoaderDataGraph::oops_do(&oop_closure, true); // Now adjust pointers in remaining weak roots. (All of which should // have been cleared if they pointed to non-surviving objects.) diff --git a/src/hotspot/share/gc/parallel/psScavenge.inline.hpp b/src/hotspot/share/gc/parallel/psScavenge.inline.hpp index a944277d00f..70bb4ba4afc 100644 --- a/src/hotspot/share/gc/parallel/psScavenge.inline.hpp +++ b/src/hotspot/share/gc/parallel/psScavenge.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2002, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2002, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -85,15 +85,15 @@ class PSRootsClosure: public OopClosure { typedef PSRootsClosure PSScavengeRootsClosure; typedef PSRootsClosure PSPromoteRootsClosure; -// Scavenges a single oop in a Klass. -class PSScavengeFromKlassClosure: public OopClosure { +// Scavenges a single oop in a ClassLoaderData. +class PSScavengeFromCLDClosure: public OopClosure { private: PSPromotionManager* _pm; - // Used to redirty a scanned klass if it has oops + // Used to redirty a scanned cld if it has oops // pointing to the young generation after being scanned. - Klass* _scanned_klass; + ClassLoaderData* _scanned_cld; public: - PSScavengeFromKlassClosure(PSPromotionManager* pm) : _pm(pm), _scanned_klass(NULL) { } + PSScavengeFromCLDClosure(PSPromotionManager* pm) : _pm(pm), _scanned_cld(NULL) { } void do_oop(narrowOop* p) { ShouldNotReachHere(); } void do_oop(oop* p) { ParallelScavengeHeap* psh = ParallelScavengeHeap::heap(); @@ -111,48 +111,46 @@ class PSScavengeFromKlassClosure: public OopClosure { oopDesc::encode_store_heap_oop_not_null(p, new_obj); if (PSScavenge::is_obj_in_young(new_obj)) { - do_klass_barrier(); + do_cld_barrier(); } } } - void set_scanned_klass(Klass* klass) { - assert(_scanned_klass == NULL || klass == NULL, "Should always only handling one klass at a time"); - _scanned_klass = klass; + void set_scanned_cld(ClassLoaderData* cld) { + assert(_scanned_cld == NULL || cld == NULL, "Should always only handling one cld at a time"); + _scanned_cld = cld; } private: - void do_klass_barrier() { - assert(_scanned_klass != NULL, "Should not be called without having a scanned klass"); - _scanned_klass->record_modified_oops(); + void do_cld_barrier() { + assert(_scanned_cld != NULL, "Should not be called without having a scanned cld"); + _scanned_cld->record_modified_oops(); } - }; -// Scavenges the oop in a Klass. -class PSScavengeKlassClosure: public KlassClosure { +// Scavenges the oop in a ClassLoaderData. +class PSScavengeCLDClosure: public CLDClosure { private: - PSScavengeFromKlassClosure _oop_closure; + PSScavengeFromCLDClosure _oop_closure; protected: public: - PSScavengeKlassClosure(PSPromotionManager* pm) : _oop_closure(pm) { } - void do_klass(Klass* klass) { - // If the klass has not been dirtied we know that there's + PSScavengeCLDClosure(PSPromotionManager* pm) : _oop_closure(pm) { } + void do_cld(ClassLoaderData* cld) { + // If the cld has not been dirtied we know that there's // no references into the young gen and we can skip it. - if (klass->has_modified_oops()) { - // Clean the klass since we're going to scavenge all the metadata. - klass->clear_modified_oops(); - - // Setup the promotion manager to redirty this klass + if (cld->has_modified_oops()) { + // Setup the promotion manager to redirty this cld // if references are left in the young gen. - _oop_closure.set_scanned_klass(klass); + _oop_closure.set_scanned_cld(cld); - klass->oops_do(&_oop_closure); + // Clean the cld since we're going to scavenge all the metadata. + cld->oops_do(&_oop_closure, false, /*clear_modified_oops*/true); - _oop_closure.set_scanned_klass(NULL); + _oop_closure.set_scanned_cld(NULL); } } }; + #endif // SHARE_VM_GC_PARALLEL_PSSCAVENGE_INLINE_HPP diff --git a/src/hotspot/share/gc/parallel/psTasks.cpp b/src/hotspot/share/gc/parallel/psTasks.cpp index 35e63dc52c3..3effcc6d1f6 100644 --- a/src/hotspot/share/gc/parallel/psTasks.cpp +++ b/src/hotspot/share/gc/parallel/psTasks.cpp @@ -79,8 +79,8 @@ void ScavengeRootsTask::do_it(GCTaskManager* manager, uint which) { case class_loader_data: { - PSScavengeKlassClosure klass_closure(pm); - ClassLoaderDataGraph::oops_do(&roots_closure, &klass_closure, false); + PSScavengeCLDClosure cld_closure(pm); + ClassLoaderDataGraph::cld_do(&cld_closure); } break; diff --git a/src/hotspot/share/gc/serial/defNewGeneration.cpp b/src/hotspot/share/gc/serial/defNewGeneration.cpp index db6977aa362..e65d12a469c 100644 --- a/src/hotspot/share/gc/serial/defNewGeneration.cpp +++ b/src/hotspot/share/gc/serial/defNewGeneration.cpp @@ -121,7 +121,7 @@ void DefNewGeneration::FastEvacuateFollowersClosure::do_void() { } ScanClosure::ScanClosure(DefNewGeneration* g, bool gc_barrier) : - OopsInKlassOrGenClosure(g), _g(g), _gc_barrier(gc_barrier) + OopsInClassLoaderDataOrGenClosure(g), _g(g), _gc_barrier(gc_barrier) { _boundary = _g->reserved().end(); } @@ -130,7 +130,7 @@ void ScanClosure::do_oop(oop* p) { ScanClosure::do_oop_work(p); } void ScanClosure::do_oop(narrowOop* p) { ScanClosure::do_oop_work(p); } FastScanClosure::FastScanClosure(DefNewGeneration* g, bool gc_barrier) : - OopsInKlassOrGenClosure(g), _g(g), _gc_barrier(gc_barrier) + OopsInClassLoaderDataOrGenClosure(g), _g(g), _gc_barrier(gc_barrier) { _boundary = _g->reserved().end(); } @@ -138,30 +138,28 @@ FastScanClosure::FastScanClosure(DefNewGeneration* g, bool gc_barrier) : void FastScanClosure::do_oop(oop* p) { FastScanClosure::do_oop_work(p); } void FastScanClosure::do_oop(narrowOop* p) { FastScanClosure::do_oop_work(p); } -void KlassScanClosure::do_klass(Klass* klass) { +void CLDScanClosure::do_cld(ClassLoaderData* cld) { NOT_PRODUCT(ResourceMark rm); - log_develop_trace(gc, scavenge)("KlassScanClosure::do_klass " PTR_FORMAT ", %s, dirty: %s", - p2i(klass), - klass->external_name(), - klass->has_modified_oops() ? "true" : "false"); + log_develop_trace(gc, scavenge)("CLDScanClosure::do_cld " PTR_FORMAT ", %s, dirty: %s", + p2i(cld), + cld->loader_name(), + cld->has_modified_oops() ? "true" : "false"); - // If the klass has not been dirtied we know that there's + // If the cld has not been dirtied we know that there's // no references into the young gen and we can skip it. - if (klass->has_modified_oops()) { + if (cld->has_modified_oops()) { if (_accumulate_modified_oops) { - klass->accumulate_modified_oops(); + cld->accumulate_modified_oops(); } - // Clear this state since we're going to scavenge all the metadata. - klass->clear_modified_oops(); - - // Tell the closure which Klass is being scanned so that it can be dirtied + // Tell the closure which CLD is being scanned so that it can be dirtied // if oops are left pointing into the young gen. - _scavenge_closure->set_scanned_klass(klass); + _scavenge_closure->set_scanned_cld(cld); - klass->oops_do(_scavenge_closure); + // Clean the cld since we're going to scavenge all the metadata. + cld->oops_do(_scavenge_closure, false, /*clear_modified_oops*/true); - _scavenge_closure->set_scanned_klass(NULL); + _scavenge_closure->set_scanned_cld(NULL); } } @@ -177,12 +175,6 @@ void ScanWeakRefClosure::do_oop(narrowOop* p) { ScanWeakRefClosure::do_oop_work( void FilteringClosure::do_oop(oop* p) { FilteringClosure::do_oop_work(p); } void FilteringClosure::do_oop(narrowOop* p) { FilteringClosure::do_oop_work(p); } -KlassScanClosure::KlassScanClosure(OopsInKlassOrGenClosure* scavenge_closure, - KlassRemSet* klass_rem_set) - : _scavenge_closure(scavenge_closure), - _accumulate_modified_oops(klass_rem_set->accumulate_modified_oops()) {} - - DefNewGeneration::DefNewGeneration(ReservedSpace rs, size_t initial_size, const char* policy) @@ -629,11 +621,8 @@ void DefNewGeneration::collect(bool full, FastScanClosure fsc_with_no_gc_barrier(this, false); FastScanClosure fsc_with_gc_barrier(this, true); - KlassScanClosure klass_scan_closure(&fsc_with_no_gc_barrier, - gch->rem_set()->klass_rem_set()); - CLDToKlassAndOopClosure cld_scan_closure(&klass_scan_closure, - &fsc_with_no_gc_barrier, - false); + CLDScanClosure cld_scan_closure(&fsc_with_no_gc_barrier, + gch->rem_set()->cld_rem_set()->accumulate_modified_oops()); set_promo_failure_scan_stack_closure(&fsc_with_no_gc_barrier); FastEvacuateFollowersClosure evacuate_followers(gch, diff --git a/src/hotspot/share/gc/shared/cardTableRS.cpp b/src/hotspot/share/gc/shared/cardTableRS.cpp index 0c87676ce02..27d015110c4 100644 --- a/src/hotspot/share/gc/shared/cardTableRS.cpp +++ b/src/hotspot/share/gc/shared/cardTableRS.cpp @@ -34,16 +34,16 @@ #include "runtime/os.hpp" #include "utilities/macros.hpp" -class HasAccumulatedModifiedOopsClosure : public KlassClosure { +class HasAccumulatedModifiedOopsClosure : public CLDClosure { bool _found; public: HasAccumulatedModifiedOopsClosure() : _found(false) {} - void do_klass(Klass* klass) { + void do_cld(ClassLoaderData* cld) { if (_found) { return; } - if (klass->has_accumulated_modified_oops()) { + if (cld->has_accumulated_modified_oops()) { _found = true; } } @@ -52,28 +52,29 @@ class HasAccumulatedModifiedOopsClosure : public KlassClosure { } }; -bool KlassRemSet::mod_union_is_clear() { +bool CLDRemSet::mod_union_is_clear() { HasAccumulatedModifiedOopsClosure closure; - ClassLoaderDataGraph::classes_do(&closure); + ClassLoaderDataGraph::cld_do(&closure); return !closure.found(); } -class ClearKlassModUnionClosure : public KlassClosure { +class ClearCLDModUnionClosure : public CLDClosure { public: - void do_klass(Klass* klass) { - if (klass->has_accumulated_modified_oops()) { - klass->clear_accumulated_modified_oops(); + void do_cld(ClassLoaderData* cld) { + if (cld->has_accumulated_modified_oops()) { + cld->clear_accumulated_modified_oops(); } } }; -void KlassRemSet::clear_mod_union() { - ClearKlassModUnionClosure closure; - ClassLoaderDataGraph::classes_do(&closure); +void CLDRemSet::clear_mod_union() { + ClearCLDModUnionClosure closure; + ClassLoaderDataGraph::cld_do(&closure); } + CardTableRS::CardTableRS(MemRegion whole_heap) : _bs(NULL), _cur_youngergen_card_val(youngergenP1_card) diff --git a/src/hotspot/share/gc/shared/cardTableRS.hpp b/src/hotspot/share/gc/shared/cardTableRS.hpp index 5139580b61f..5713f04b5ce 100644 --- a/src/hotspot/share/gc/shared/cardTableRS.hpp +++ b/src/hotspot/share/gc/shared/cardTableRS.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2001, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2001, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -31,11 +31,11 @@ class Space; class OopsInGenClosure; -// Helper to remember modified oops in all klasses. -class KlassRemSet { +// Helper to remember modified oops in all clds. +class CLDRemSet { bool _accumulate_modified_oops; public: - KlassRemSet() : _accumulate_modified_oops(false) {} + CLDRemSet() : _accumulate_modified_oops(false) {} void set_accumulate_modified_oops(bool value) { _accumulate_modified_oops = value; } bool accumulate_modified_oops() { return _accumulate_modified_oops; } bool mod_union_is_clear(); @@ -64,7 +64,7 @@ class CardTableRS: public CHeapObj { return CardTableModRefBSForCTRS::card_is_dirty_wrt_gen_iter(cv); } - KlassRemSet _klass_rem_set; + CLDRemSet _cld_rem_set; BarrierSet* _bs; CardTableModRefBSForCTRS* _ct_bs; @@ -121,7 +121,7 @@ public: // Set the barrier set. void set_bs(BarrierSet* bs) { _bs = bs; } - KlassRemSet* klass_rem_set() { return &_klass_rem_set; } + CLDRemSet* cld_rem_set() { return &_cld_rem_set; } CardTableModRefBSForCTRS* ct_bs() { return _ct_bs; } diff --git a/src/hotspot/share/gc/shared/genOopClosures.hpp b/src/hotspot/share/gc/shared/genOopClosures.hpp index f1dd89344d8..076b2fdd031 100644 --- a/src/hotspot/share/gc/shared/genOopClosures.hpp +++ b/src/hotspot/share/gc/shared/genOopClosures.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2001, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2001, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -81,24 +81,25 @@ class OopsInGenClosure : public ExtendedOopClosure { }; -// Super class for scan closures. It contains code to dirty scanned Klasses. -class OopsInKlassOrGenClosure: public OopsInGenClosure { - Klass* _scanned_klass; +// Super class for scan closures. It contains code to dirty scanned class loader data. +class OopsInClassLoaderDataOrGenClosure: public OopsInGenClosure { + ClassLoaderData* _scanned_cld; public: - OopsInKlassOrGenClosure(Generation* g) : OopsInGenClosure(g), _scanned_klass(NULL) {} - void set_scanned_klass(Klass* k) { - assert(k == NULL || _scanned_klass == NULL, "Must be"); - _scanned_klass = k; + OopsInClassLoaderDataOrGenClosure(Generation* g) : OopsInGenClosure(g), _scanned_cld(NULL) {} + void set_scanned_cld(ClassLoaderData* cld) { + assert(cld == NULL || _scanned_cld == NULL, "Must be"); + _scanned_cld = cld; } - bool is_scanning_a_klass() { return _scanned_klass != NULL; } - void do_klass_barrier(); + bool is_scanning_a_cld() { return _scanned_cld != NULL; } + void do_cld_barrier(); }; + // Closure for scanning DefNewGeneration. // // This closure will perform barrier store calls for ALL // pointers in scanned oops. -class ScanClosure: public OopsInKlassOrGenClosure { +class ScanClosure: public OopsInClassLoaderDataOrGenClosure { protected: DefNewGeneration* _g; HeapWord* _boundary; @@ -117,7 +118,7 @@ class ScanClosure: public OopsInKlassOrGenClosure { // This closure only performs barrier store calls on // pointers into the DefNewGeneration. This is less // precise, but faster, than a ScanClosure -class FastScanClosure: public OopsInKlassOrGenClosure { +class FastScanClosure: public OopsInClassLoaderDataOrGenClosure { protected: DefNewGeneration* _g; HeapWord* _boundary; @@ -131,14 +132,15 @@ class FastScanClosure: public OopsInKlassOrGenClosure { inline void do_oop_nv(narrowOop* p); }; -class KlassScanClosure: public KlassClosure { - OopsInKlassOrGenClosure* _scavenge_closure; +class CLDScanClosure: public CLDClosure { + OopsInClassLoaderDataOrGenClosure* _scavenge_closure; // true if the the modified oops state should be saved. - bool _accumulate_modified_oops; + bool _accumulate_modified_oops; public: - KlassScanClosure(OopsInKlassOrGenClosure* scavenge_closure, - KlassRemSet* klass_rem_set_policy); - void do_klass(Klass* k); + CLDScanClosure(OopsInClassLoaderDataOrGenClosure* scavenge_closure, + bool accumulate_modified_oops) : + _scavenge_closure(scavenge_closure), _accumulate_modified_oops(accumulate_modified_oops) {} + void do_cld(ClassLoaderData* cld); }; class FilteringClosure: public ExtendedOopClosure { diff --git a/src/hotspot/share/gc/shared/genOopClosures.inline.hpp b/src/hotspot/share/gc/shared/genOopClosures.inline.hpp index 13883f2283a..856d573f8f6 100644 --- a/src/hotspot/share/gc/shared/genOopClosures.inline.hpp +++ b/src/hotspot/share/gc/shared/genOopClosures.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2001, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2001, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -68,9 +68,11 @@ template inline void OopsInGenClosure::par_do_barrier(T* p) { } } -inline void OopsInKlassOrGenClosure::do_klass_barrier() { - assert(_scanned_klass != NULL, "Must be"); - _scanned_klass->record_modified_oops(); +inline void OopsInClassLoaderDataOrGenClosure::do_cld_barrier() { + assert(_scanned_cld != NULL, "Must be"); + if (!_scanned_cld->has_modified_oops()) { + _scanned_cld->record_modified_oops(); + } } // NOTE! Any changes made here should also be made @@ -87,8 +89,8 @@ template inline void ScanClosure::do_oop_work(T* p) { oopDesc::encode_store_heap_oop_not_null(p, new_obj); } - if (is_scanning_a_klass()) { - do_klass_barrier(); + if (is_scanning_a_cld()) { + do_cld_barrier(); } else if (_gc_barrier) { // Now call parent closure do_barrier(p); @@ -111,8 +113,8 @@ template inline void FastScanClosure::do_oop_work(T* p) { oop new_obj = obj->is_forwarded() ? obj->forwardee() : _g->copy_to_survivor_space(obj); oopDesc::encode_store_heap_oop_not_null(p, new_obj); - if (is_scanning_a_klass()) { - do_klass_barrier(); + if (is_scanning_a_cld()) { + do_cld_barrier(); } else if (_gc_barrier) { // Now call parent closure do_barrier(p); diff --git a/src/hotspot/share/jvmci/jvmciCompilerToVM.cpp b/src/hotspot/share/jvmci/jvmciCompilerToVM.cpp index 0e5fc74ba32..a35a9a10d79 100644 --- a/src/hotspot/share/jvmci/jvmciCompilerToVM.cpp +++ b/src/hotspot/share/jvmci/jvmciCompilerToVM.cpp @@ -412,6 +412,7 @@ C2V_VMENTRY(jobjectArray, readConfiguration, (JNIEnv *env)) } else if (strcmp(vmField.typeString, "address") == 0 || strcmp(vmField.typeString, "intptr_t") == 0 || strcmp(vmField.typeString, "uintptr_t") == 0 || + strcmp(vmField.typeString, "OopHandle") == 0 || strcmp(vmField.typeString, "size_t") == 0 || // All foo* types are addresses. vmField.typeString[strlen(vmField.typeString) - 1] == '*') { diff --git a/src/hotspot/share/jvmci/vmStructs_jvmci.cpp b/src/hotspot/share/jvmci/vmStructs_jvmci.cpp index 2d14d680529..36fd53d0b94 100644 --- a/src/hotspot/share/jvmci/vmStructs_jvmci.cpp +++ b/src/hotspot/share/jvmci/vmStructs_jvmci.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2015, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -33,6 +33,7 @@ #include "jvmci/vmStructs_compiler_runtime.hpp" #include "jvmci/vmStructs_jvmci.hpp" #include "oops/oop.hpp" +#include "oops/oopHandle.hpp" #include "oops/objArrayKlass.hpp" #include "runtime/globals.hpp" #include "runtime/sharedRuntime.hpp" @@ -192,7 +193,7 @@ nonstatic_field(Klass, _name, Symbol*) \ nonstatic_field(Klass, _prototype_header, markOop) \ nonstatic_field(Klass, _next_sibling, Klass*) \ - nonstatic_field(Klass, _java_mirror, oop) \ + nonstatic_field(Klass, _java_mirror, OopHandle) \ nonstatic_field(Klass, _modifier_flags, jint) \ nonstatic_field(Klass, _access_flags, AccessFlags) \ \ diff --git a/src/hotspot/share/memory/iterator.cpp b/src/hotspot/share/memory/iterator.cpp index 83288217c62..21eaf79dea4 100644 --- a/src/hotspot/share/memory/iterator.cpp +++ b/src/hotspot/share/memory/iterator.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 1997, 2013, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -29,17 +29,8 @@ #include "utilities/debug.hpp" #include "utilities/globalDefinitions.hpp" -void KlassToOopClosure::do_klass(Klass* k) { - assert(_oop_closure != NULL, "Not initialized?"); - k->oops_do(_oop_closure); -} - void CLDToOopClosure::do_cld(ClassLoaderData* cld) { - cld->oops_do(_oop_closure, &_klass_closure, _must_claim_cld); -} - -void CLDToKlassAndOopClosure::do_cld(ClassLoaderData* cld) { - cld->oops_do(_oop_closure, _klass_closure, _must_claim_cld); + cld->oops_do(_oop_closure, _must_claim_cld); } void ObjectToOopClosure::do_object(oop obj) { diff --git a/src/hotspot/share/memory/iterator.hpp b/src/hotspot/share/memory/iterator.hpp index 11cdc513c84..d7713cedec0 100644 --- a/src/hotspot/share/memory/iterator.hpp +++ b/src/hotspot/share/memory/iterator.hpp @@ -138,67 +138,27 @@ class CLDClosure : public Closure { virtual void do_cld(ClassLoaderData* cld) = 0; }; -class KlassToOopClosure : public KlassClosure { - friend class MetadataAwareOopClosure; - friend class MetadataAwareOopsInGenClosure; - - OopClosure* _oop_closure; - - // Used when _oop_closure couldn't be set in an initialization list. - void initialize(OopClosure* oop_closure) { - assert(_oop_closure == NULL, "Should only be called once"); - _oop_closure = oop_closure; - } - - public: - KlassToOopClosure(OopClosure* oop_closure = NULL) : _oop_closure(oop_closure) {} - - virtual void do_klass(Klass* k); -}; class CLDToOopClosure : public CLDClosure { OopClosure* _oop_closure; - KlassToOopClosure _klass_closure; bool _must_claim_cld; public: CLDToOopClosure(OopClosure* oop_closure, bool must_claim_cld = true) : _oop_closure(oop_closure), - _klass_closure(oop_closure), _must_claim_cld(must_claim_cld) {} void do_cld(ClassLoaderData* cld); }; -class CLDToKlassAndOopClosure : public CLDClosure { - friend class G1CollectedHeap; - protected: - OopClosure* _oop_closure; - KlassClosure* _klass_closure; - bool _must_claim_cld; - public: - CLDToKlassAndOopClosure(KlassClosure* klass_closure, - OopClosure* oop_closure, - bool must_claim_cld) : - _oop_closure(oop_closure), - _klass_closure(klass_closure), - _must_claim_cld(must_claim_cld) {} - void do_cld(ClassLoaderData* cld); -}; - // The base class for all concurrent marking closures, // that participates in class unloading. // It's used to proxy through the metadata to the oops defined in them. class MetadataAwareOopClosure: public ExtendedOopClosure { - KlassToOopClosure _klass_closure; public: - MetadataAwareOopClosure() : ExtendedOopClosure() { - _klass_closure.initialize(this); - } - MetadataAwareOopClosure(ReferenceProcessor* rp) : ExtendedOopClosure(rp) { - _klass_closure.initialize(this); - } + MetadataAwareOopClosure() : ExtendedOopClosure() { } + MetadataAwareOopClosure(ReferenceProcessor* rp) : ExtendedOopClosure(rp) { } bool do_metadata_nv() { return true; } virtual bool do_metadata() { return do_metadata_nv(); } diff --git a/src/hotspot/share/memory/iterator.inline.hpp b/src/hotspot/share/memory/iterator.inline.hpp index cf2a1f679ec..7e1d973a26d 100644 --- a/src/hotspot/share/memory/iterator.inline.hpp +++ b/src/hotspot/share/memory/iterator.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2014, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2014, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -37,10 +37,8 @@ #include "utilities/debug.hpp" inline void MetadataAwareOopClosure::do_cld_nv(ClassLoaderData* cld) { - assert(_klass_closure._oop_closure == this, "Must be"); - bool claim = true; // Must claim the class loader data before processing. - cld->oops_do(_klass_closure._oop_closure, &_klass_closure, claim); + cld->oops_do(this, claim); } inline void MetadataAwareOopClosure::do_klass_nv(Klass* k) { diff --git a/src/hotspot/share/oops/instanceKlass.cpp b/src/hotspot/share/oops/instanceKlass.cpp index f8366d66b50..04a10565512 100644 --- a/src/hotspot/share/oops/instanceKlass.cpp +++ b/src/hotspot/share/oops/instanceKlass.cpp @@ -285,6 +285,9 @@ void InstanceKlass::deallocate_contents(ClassLoaderData* loader_data) { java_lang_Class::set_klass(java_mirror(), NULL); } + // Also remove mirror from handles + loader_data->remove_handle(_java_mirror); + // Need to take this class off the class loader data list. loader_data->remove_class(this); diff --git a/src/hotspot/share/oops/klass.cpp b/src/hotspot/share/oops/klass.cpp index 7d8670f6a06..82c57239c11 100644 --- a/src/hotspot/share/oops/klass.cpp +++ b/src/hotspot/share/oops/klass.cpp @@ -43,9 +43,16 @@ #include "trace/traceMacros.hpp" #include "utilities/macros.hpp" #include "utilities/stack.inline.hpp" -#if INCLUDE_ALL_GCS -#include "gc/g1/g1SATBCardTableModRefBS.hpp" -#endif // INCLUDE_ALL_GCS + +void Klass::set_java_mirror(Handle m) { + assert(!m.is_null(), "New mirror should never be null."); + assert(_java_mirror.resolve() == NULL, "should only be used to initialize mirror"); + _java_mirror = class_loader_data()->add_handle(m); +} + +oop Klass::java_mirror() const { + return _java_mirror.resolve(); +} bool Klass::is_cloneable() const { return _access_flags.is_cloneable_fast() || @@ -441,51 +448,6 @@ void Klass::clean_weak_klass_links(BoolObjectClosure* is_alive, bool clean_alive } } -void Klass::klass_update_barrier_set(oop v) { - record_modified_oops(); -} - -// This barrier is used by G1 to remember the old oop values, so -// that we don't forget any objects that were live at the snapshot at -// the beginning. This function is only used when we write oops into Klasses. -void Klass::klass_update_barrier_set_pre(oop* p, oop v) { -#if INCLUDE_ALL_GCS - if (UseG1GC) { - oop obj = *p; - if (obj != NULL) { - G1SATBCardTableModRefBS::enqueue(obj); - } - } -#endif -} - -void Klass::klass_oop_store(oop* p, oop v) { - assert(!Universe::heap()->is_in_reserved((void*)p), "Should store pointer into metadata"); - assert(v == NULL || Universe::heap()->is_in_reserved((void*)v), "Should store pointer to an object"); - - // do the store - if (always_do_update_barrier) { - klass_oop_store((volatile oop*)p, v); - } else { - klass_update_barrier_set_pre(p, v); - *p = v; - klass_update_barrier_set(v); - } -} - -void Klass::klass_oop_store(volatile oop* p, oop v) { - assert(!Universe::heap()->is_in_reserved((void*)p), "Should store pointer into metadata"); - assert(v == NULL || Universe::heap()->is_in_reserved((void*)v), "Should store pointer to an object"); - - klass_update_barrier_set_pre((oop*)p, v); // Cast away volatile. - OrderAccess::release_store_ptr(p, v); - klass_update_barrier_set(v); -} - -void Klass::oops_do(OopClosure* cl) { - cl->do_oop(&_java_mirror); -} - void Klass::metaspace_pointers_do(MetaspaceClosure* it) { if (log_is_enabled(Trace, cds)) { ResourceMark rm; @@ -532,7 +494,8 @@ void Klass::remove_java_mirror() { ResourceMark rm; log_trace(cds, unshareable)("remove java_mirror: %s", external_name()); } - set_java_mirror(NULL); + // Just null out the mirror. The class_loader_data() no longer exists. + _java_mirror = NULL; } void Klass::restore_unshareable_info(ClassLoaderData* loader_data, Handle protection_domain, TRAPS) { diff --git a/src/hotspot/share/oops/klass.hpp b/src/hotspot/share/oops/klass.hpp index 5eb4ae201e0..979aaee4fd5 100644 --- a/src/hotspot/share/oops/klass.hpp +++ b/src/hotspot/share/oops/klass.hpp @@ -30,6 +30,7 @@ #include "memory/memRegion.hpp" #include "oops/metadata.hpp" #include "oops/oop.hpp" +#include "oops/oopHandle.hpp" #include "trace/traceMacros.hpp" #include "utilities/accessFlags.hpp" #include "utilities/macros.hpp" @@ -119,7 +120,7 @@ class Klass : public Metadata { // Ordered list of all primary supertypes Klass* _primary_supers[_primary_super_limit]; // java/lang/Class instance mirroring this class - oop _java_mirror; + OopHandle _java_mirror; // Superclass Klass* _super; // First subclass (NULL if none); _subklass->next_sibling() is next one @@ -148,10 +149,6 @@ class Klass : public Metadata { // vtable length int _vtable_len; - // Remembered sets support for the oops in the klasses. - jbyte _modified_oops; // Card Table Equivalent (YC/CMS support) - jbyte _accumulated_modified_oops; // Mod Union Equivalent (CMS support) - private: // This is an index into FileMapHeader::_classpath_entry_table[], to // associate this class with the JAR file where it's loaded from during @@ -228,13 +225,15 @@ protected: } } - // store an oop into a field of a Klass - void klass_oop_store(oop* p, oop v); - void klass_oop_store(volatile oop* p, oop v); - // java mirror - oop java_mirror() const { return _java_mirror; } - void set_java_mirror(oop m) { klass_oop_store(&_java_mirror, m); } + oop java_mirror() const; + void set_java_mirror(Handle m); + + // Temporary mirror switch used by RedefineClasses + // Both mirrors are on the ClassLoaderData::_handles list already so no + // barriers are needed. + void set_java_mirror_handle(OopHandle mirror) { _java_mirror = mirror; } + OopHandle java_mirror_handle() const { return _java_mirror; } // modifier flags jint modifier_flags() const { return _modifier_flags; } @@ -260,17 +259,6 @@ protected: ClassLoaderData* class_loader_data() const { return _class_loader_data; } void set_class_loader_data(ClassLoaderData* loader_data) { _class_loader_data = loader_data; } - // The Klasses are not placed in the Heap, so the Card Table or - // the Mod Union Table can't be used to mark when klasses have modified oops. - // The CT and MUT bits saves this information for the individual Klasses. - void record_modified_oops() { _modified_oops = 1; } - void clear_modified_oops() { _modified_oops = 0; } - bool has_modified_oops() { return _modified_oops == 1; } - - void accumulate_modified_oops() { if (has_modified_oops()) _accumulated_modified_oops = 1; } - void clear_accumulated_modified_oops() { _accumulated_modified_oops = 0; } - bool has_accumulated_modified_oops() { return _accumulated_modified_oops == 1; } - int shared_classpath_index() const { return _shared_class_path_index; }; @@ -598,9 +586,6 @@ protected: TRACE_DEFINE_TRACE_ID_METHODS; - // garbage collection support - void oops_do(OopClosure* cl); - virtual void metaspace_pointers_do(MetaspaceClosure* iter); virtual MetaspaceObj::Type type() const { return ClassType; } @@ -687,11 +672,6 @@ protected: static Klass* decode_klass_not_null(narrowKlass v); static Klass* decode_klass(narrowKlass v); - - private: - // barriers used by klass_oop_store - void klass_update_barrier_set(oop v); - void klass_update_barrier_set_pre(oop* p, oop v); }; // Helper to convert the oop iterate macro suffixes into bool values that can be used by template functions. diff --git a/src/hotspot/share/opto/library_call.cpp b/src/hotspot/share/opto/library_call.cpp index f0fce1d7e48..5de3c62b3aa 100644 --- a/src/hotspot/share/opto/library_call.cpp +++ b/src/hotspot/share/opto/library_call.cpp @@ -3453,7 +3453,8 @@ bool LibraryCallKit::inline_native_isInterrupted() { // Given a klass oop, load its java mirror (a java.lang.Class oop). Node* LibraryCallKit::load_mirror_from_klass(Node* klass) { Node* p = basic_plus_adr(klass, in_bytes(Klass::java_mirror_offset())); - return make_load(NULL, p, TypeInstPtr::MIRROR, T_OBJECT, MemNode::unordered); + Node* load = make_load(NULL, p, TypeRawPtr::NOTNULL, T_ADDRESS, MemNode::unordered); + return make_load(NULL, load, TypeInstPtr::MIRROR, T_OBJECT, MemNode::unordered); } //-----------------------load_klass_from_mirror_common------------------------- diff --git a/src/hotspot/share/opto/memnode.cpp b/src/hotspot/share/opto/memnode.cpp index 7b6e972c677..77a9d68f88b 100644 --- a/src/hotspot/share/opto/memnode.cpp +++ b/src/hotspot/share/opto/memnode.cpp @@ -1771,6 +1771,23 @@ const Type* LoadNode::Value(PhaseGVN* phase) const { Opcode() == Op_LoadKlass, "Field accesses must be precise" ); // For klass/static loads, we expect the _type to be precise + } else if (tp->base() == Type::RawPtr && adr->is_Load() && off == 0) { + /* With mirrors being an indirect in the Klass* + * the VM is now using two loads. LoadKlass(LoadP(LoadP(Klass, mirror_offset), zero_offset)) + * The LoadP from the Klass has a RawPtr type (see LibraryCallKit::load_mirror_from_klass). + * + * So check the type and klass of the node before the LoadP. + */ + Node* adr2 = adr->in(MemNode::Address); + const TypeKlassPtr* tkls = phase->type(adr2)->isa_klassptr(); + if (tkls != NULL && !StressReflectiveCode) { + ciKlass* klass = tkls->klass(); + if (klass->is_loaded() && tkls->klass_is_exact() && tkls->offset() == in_bytes(Klass::java_mirror_offset())) { + assert(adr->Opcode() == Op_LoadP, "must load an oop from _java_mirror"); + assert(Opcode() == Op_LoadP, "must load an oop from _java_mirror"); + return TypeInstPtr::make(klass->java_mirror()); + } + } } const TypeKlassPtr *tkls = tp->isa_klassptr(); @@ -1798,12 +1815,6 @@ const Type* LoadNode::Value(PhaseGVN* phase) const { } const Type* aift = load_array_final_field(tkls, klass); if (aift != NULL) return aift; - if (tkls->offset() == in_bytes(Klass::java_mirror_offset())) { - // The field is Klass::_java_mirror. Return its (constant) value. - // (Folds up the 2nd indirection in anObjConstant.getClass().) - assert(Opcode() == Op_LoadP, "must load an oop from _java_mirror"); - return TypeInstPtr::make(klass->java_mirror()); - } } // We can still check if we are loading from the primary_supers array at a @@ -2203,22 +2214,24 @@ Node* LoadNode::klass_identity_common(PhaseGVN* phase) { // This improves reflective code, often making the Class // mirror go completely dead. (Current exception: Class // mirrors may appear in debug info, but we could clean them out by - // introducing a new debug info operator for Klass*.java_mirror). + // introducing a new debug info operator for Klass.java_mirror). + if (toop->isa_instptr() && toop->klass() == phase->C->env()->Class_klass() && offset == java_lang_Class::klass_offset_in_bytes()) { - // We are loading a special hidden field from a Class mirror, - // the field which points to its Klass or ArrayKlass metaobject. if (base->is_Load()) { - Node* adr2 = base->in(MemNode::Address); - const TypeKlassPtr* tkls = phase->type(adr2)->isa_klassptr(); - if (tkls != NULL && !tkls->empty() - && (tkls->klass()->is_instance_klass() || + Node* base2 = base->in(MemNode::Address); + if (base2->is_Load()) { /* direct load of a load which is the oophandle */ + Node* adr2 = base2->in(MemNode::Address); + const TypeKlassPtr* tkls = phase->type(adr2)->isa_klassptr(); + if (tkls != NULL && !tkls->empty() + && (tkls->klass()->is_instance_klass() || tkls->klass()->is_array_klass()) - && adr2->is_AddP() - ) { - int mirror_field = in_bytes(Klass::java_mirror_offset()); - if (tkls->offset() == mirror_field) { - return adr2->in(AddPNode::Base); + && adr2->is_AddP() + ) { + int mirror_field = in_bytes(Klass::java_mirror_offset()); + if (tkls->offset() == mirror_field) { + return adr2->in(AddPNode::Base); + } } } } diff --git a/src/hotspot/share/opto/subnode.cpp b/src/hotspot/share/opto/subnode.cpp index aa0c335f2b4..cc1d881f10d 100644 --- a/src/hotspot/share/opto/subnode.cpp +++ b/src/hotspot/share/opto/subnode.cpp @@ -877,8 +877,8 @@ const Type *CmpPNode::sub( const Type *t1, const Type *t2 ) const { } static inline Node* isa_java_mirror_load(PhaseGVN* phase, Node* n) { - // Return the klass node for - // LoadP(AddP(foo:Klass, #java_mirror)) + // Return the klass node for (indirect load from OopHandle) + // LoadP(LoadP(AddP(foo:Klass, #java_mirror))) // or NULL if not matching. if (n->Opcode() != Op_LoadP) return NULL; @@ -886,6 +886,10 @@ static inline Node* isa_java_mirror_load(PhaseGVN* phase, Node* n) { if (!tp || tp->klass() != phase->C->env()->Class_klass()) return NULL; Node* adr = n->in(MemNode::Address); + // First load from OopHandle + if (adr->Opcode() != Op_LoadP || !phase->type(adr)->isa_rawptr()) return NULL; + adr = adr->in(MemNode::Address); + intptr_t off = 0; Node* k = AddPNode::Ideal_base_and_offset(adr, phase, off); if (k == NULL) return NULL; diff --git a/src/hotspot/share/prims/jvmtiTagMap.cpp b/src/hotspot/share/prims/jvmtiTagMap.cpp index 7aaa1341dd6..25807a2a626 100644 --- a/src/hotspot/share/prims/jvmtiTagMap.cpp +++ b/src/hotspot/share/prims/jvmtiTagMap.cpp @@ -3026,8 +3026,7 @@ inline bool VM_HeapWalkOperation::collect_simple_roots() { // Preloaded classes and loader from the system dictionary blk.set_kind(JVMTI_HEAP_REFERENCE_SYSTEM_CLASS); SystemDictionary::always_strong_oops_do(&blk); - KlassToOopClosure klass_blk(&blk); - ClassLoaderDataGraph::always_strong_oops_do(&blk, &klass_blk, false); + ClassLoaderDataGraph::always_strong_oops_do(&blk, false); if (blk.stopped()) { return false; } diff --git a/src/hotspot/share/prims/jvmtiThreadState.hpp b/src/hotspot/share/prims/jvmtiThreadState.hpp index 3a7ddb66fc3..9dfb9b85309 100644 --- a/src/hotspot/share/prims/jvmtiThreadState.hpp +++ b/src/hotspot/share/prims/jvmtiThreadState.hpp @@ -411,21 +411,21 @@ class RedefineVerifyMark : public StackObj { private: JvmtiThreadState* _state; Klass* _scratch_class; - Handle _scratch_mirror; + OopHandle _scratch_mirror; public: RedefineVerifyMark(Klass* the_class, Klass* scratch_class, JvmtiThreadState *state) : _state(state), _scratch_class(scratch_class) { _state->set_class_versions_map(the_class, scratch_class); - _scratch_mirror = Handle(Thread::current(), _scratch_class->java_mirror()); - _scratch_class->set_java_mirror(the_class->java_mirror()); + _scratch_mirror = _scratch_class->java_mirror_handle(); + _scratch_class->set_java_mirror_handle(the_class->java_mirror_handle()); } ~RedefineVerifyMark() { // Restore the scratch class's mirror, so when scratch_class is removed // the correct mirror pointing to it can be cleared. - _scratch_class->set_java_mirror(_scratch_mirror()); + _scratch_class->set_java_mirror_handle(_scratch_mirror); _state->clear_class_versions_map(); } }; diff --git a/src/hotspot/share/runtime/vmStructs.cpp b/src/hotspot/share/runtime/vmStructs.cpp index d9dd0d15b50..49fcd97a876 100644 --- a/src/hotspot/share/runtime/vmStructs.cpp +++ b/src/hotspot/share/runtime/vmStructs.cpp @@ -277,7 +277,7 @@ typedef RehashableHashtable RehashableSymbolHashtable; nonstatic_field(Klass, _secondary_super_cache, Klass*) \ nonstatic_field(Klass, _secondary_supers, Array*) \ nonstatic_field(Klass, _primary_supers[0], Klass*) \ - nonstatic_field(Klass, _java_mirror, oop) \ + nonstatic_field(Klass, _java_mirror, OopHandle) \ nonstatic_field(Klass, _modifier_flags, jint) \ nonstatic_field(Klass, _super, Klass*) \ nonstatic_field(Klass, _subklass, Klass*) \ diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/Klass.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/Klass.java index bc9431ca126..e2aa52ffd9c 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/Klass.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/oops/Klass.java @@ -51,7 +51,7 @@ public class Klass extends Metadata implements ClassConstants { private static synchronized void initialize(TypeDataBase db) throws WrongTypeException { Type type = db.lookupType("Klass"); - javaMirror = new OopField(type.getOopField("_java_mirror"), 0); + javaMirror = type.getAddressField("_java_mirror"); superField = new MetadataField(type.getAddressField("_super"), 0); layoutHelper = new IntField(type.getJIntField("_layout_helper"), 0); name = type.getAddressField("_name"); @@ -88,7 +88,7 @@ public class Klass extends Metadata implements ClassConstants { public boolean isKlass() { return true; } // Fields - private static OopField javaMirror; + private static AddressField javaMirror; private static MetadataField superField; private static IntField layoutHelper; private static AddressField name; @@ -109,7 +109,15 @@ public class Klass extends Metadata implements ClassConstants { } // Accessors for declared fields - public Instance getJavaMirror() { return (Instance) javaMirror.getValue(this); } + public Instance getJavaMirror() { + Address handle = javaMirror.getValue(getAddress()); + if (handle != null) { + // Load through the handle + OopHandle refs = handle.getOopHandleAt(0); + return (Instance)VM.getVM().getObjectHeap().newOop(refs); + } + return null; + } public Klass getSuper() { return (Klass) superField.getValue(this); } public Klass getJavaSuper() { return null; } public int getLayoutHelper() { return (int) layoutHelper.getValue(this); } @@ -185,7 +193,7 @@ public class Klass extends Metadata implements ClassConstants { } public void iterateFields(MetadataVisitor visitor) { - visitor.doOop(javaMirror, true); + // visitor.doOop(javaMirror, true); visitor.doMetadata(superField, true); visitor.doInt(layoutHelper, true); // visitor.doOop(name, true); diff --git a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotMemoryAccessProviderImpl.java b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotMemoryAccessProviderImpl.java index e3ad9c834c2..feae2a72267 100644 --- a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotMemoryAccessProviderImpl.java +++ b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotMemoryAccessProviderImpl.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2011, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2011, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -138,21 +138,6 @@ class HotSpotMemoryAccessProviderImpl implements HotSpotMemoryAccessProvider { return true; } - private boolean isValidObjectFieldDisplacement(Constant base, long displacement) { - if (base instanceof HotSpotMetaspaceConstant) { - MetaspaceWrapperObject metaspaceObject = HotSpotMetaspaceConstantImpl.getMetaspaceObject(base); - if (metaspaceObject instanceof HotSpotResolvedObjectTypeImpl) { - if (displacement == runtime.getConfig().classMirrorOffset) { - // Klass::_java_mirror is valid for all Klass* values - return true; - } - } else { - throw new IllegalArgumentException(String.valueOf(metaspaceObject)); - } - } - return false; - } - private static long asRawPointer(Constant base) { if (base instanceof HotSpotMetaspaceConstantImpl) { MetaspaceWrapperObject meta = HotSpotMetaspaceConstantImpl.getMetaspaceObject(base); @@ -202,7 +187,7 @@ class HotSpotMemoryAccessProviderImpl implements HotSpotMemoryAccessProvider { if (base instanceof HotSpotMetaspaceConstant) { MetaspaceWrapperObject metaspaceObject = HotSpotMetaspaceConstantImpl.getMetaspaceObject(base); if (metaspaceObject instanceof HotSpotResolvedObjectTypeImpl) { - if (displacement == runtime.getConfig().classMirrorOffset) { + if (displacement == runtime.getConfig().classMirrorHandleOffset) { assert expected == ((HotSpotResolvedObjectTypeImpl) metaspaceObject).mirror(); } } @@ -294,10 +279,18 @@ class HotSpotMemoryAccessProviderImpl implements HotSpotMemoryAccessProvider { Object o = readRawObject(base, displacement, runtime.getConfig().useCompressedOops); return HotSpotObjectConstantImpl.forObject(o); } - if (!isValidObjectFieldDisplacement(base, displacement)) { - return null; + if (base instanceof HotSpotMetaspaceConstant) { + MetaspaceWrapperObject metaspaceObject = HotSpotMetaspaceConstantImpl.getMetaspaceObject(base); + if (metaspaceObject instanceof HotSpotResolvedObjectTypeImpl) { + if (displacement == runtime.getConfig().classMirrorHandleOffset) { + // Klass::_java_mirror is valid for all Klass* values + return HotSpotObjectConstantImpl.forObject(((HotSpotResolvedObjectTypeImpl) metaspaceObject).mirror()); + } + } else { + throw new IllegalArgumentException(String.valueOf(metaspaceObject)); + } } - return HotSpotObjectConstantImpl.forObject(readRawObject(base, displacement, false)); + return null; } @Override diff --git a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotVMConfig.java b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotVMConfig.java index 25f6153f54e..7f3a52e9bb5 100644 --- a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotVMConfig.java +++ b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot/src/jdk/vm/ci/hotspot/HotSpotVMConfig.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2011, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2011, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -77,7 +77,7 @@ class HotSpotVMConfig extends HotSpotVMConfigAccess { /** * The offset of the _java_mirror field (of type {@link Class}) in a Klass. */ - final int classMirrorOffset = getFieldOffset("Klass::_java_mirror", Integer.class, "oop"); + final int classMirrorHandleOffset = getFieldOffset("Klass::_java_mirror", Integer.class, "OopHandle"); final int klassAccessFlagsOffset = getFieldOffset("Klass::_access_flags", Integer.class, "AccessFlags"); final int klassLayoutHelperOffset = getFieldOffset("Klass::_layout_helper", Integer.class, "jint"); diff --git a/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/GraalHotSpotVMConfig.java b/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/GraalHotSpotVMConfig.java index f39ecd0dd7c..f314bbd584f 100644 --- a/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/GraalHotSpotVMConfig.java +++ b/src/jdk.internal.vm.compiler/share/classes/org.graalvm.compiler.hotspot/src/org/graalvm/compiler/hotspot/GraalHotSpotVMConfig.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2011, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2011, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -280,14 +280,14 @@ public class GraalHotSpotVMConfig extends HotSpotVMConfigAccess { } if (offset == -1) { try { - offset = getFieldOffset(name, Integer.class, "jobject"); + offset = getFieldOffset(name, Integer.class, "OopHandle"); isHandle = true; } catch (JVMCIError e) { } } if (offset == -1) { - throw new JVMCIError("cannot get offset of field " + name + " with type oop or jobject"); + throw new JVMCIError("cannot get offset of field " + name + " with type oop or OopHandle"); } classMirrorOffset = offset; classMirrorIsHandle = isHandle; diff --git a/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/DataPatchTest.java b/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/DataPatchTest.java index 135bb9284d1..8afc7d7b98e 100644 --- a/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/DataPatchTest.java +++ b/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/DataPatchTest.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2015, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -110,7 +110,7 @@ public class DataPatchTest extends CodeInstallationTest { test(asm -> { ResolvedJavaType type = metaAccess.lookupJavaType(getConstClass()); Register klass = asm.emitLoadPointer((HotSpotConstant) constantReflection.asObjectHub(type)); - Register ret = asm.emitLoadPointer(klass, config.classMirrorOffset); + Register ret = asm.emitLoadPointer(asm.emitLoadPointer(klass, config.classMirrorHandleOffset), 0); asm.emitPointerRet(ret); }); } @@ -123,7 +123,7 @@ public class DataPatchTest extends CodeInstallationTest { HotSpotConstant hub = (HotSpotConstant) constantReflection.asObjectHub(type); Register narrowKlass = asm.emitLoadPointer((HotSpotConstant) hub.compress()); Register klass = asm.emitUncompressPointer(narrowKlass, config.narrowKlassBase, config.narrowKlassShift); - Register ret = asm.emitLoadPointer(klass, config.classMirrorOffset); + Register ret = asm.emitLoadPointer(asm.emitLoadPointer(klass, config.classMirrorHandleOffset), 0); asm.emitPointerRet(ret); }); } @@ -135,7 +135,7 @@ public class DataPatchTest extends CodeInstallationTest { HotSpotConstant hub = (HotSpotConstant) constantReflection.asObjectHub(type); DataSectionReference ref = asm.emitDataItem(hub); Register klass = asm.emitLoadPointer(ref); - Register ret = asm.emitLoadPointer(klass, config.classMirrorOffset); + Register ret = asm.emitLoadPointer(asm.emitLoadPointer(klass, config.classMirrorHandleOffset), 0); asm.emitPointerRet(ret); }); } @@ -150,7 +150,7 @@ public class DataPatchTest extends CodeInstallationTest { DataSectionReference ref = asm.emitDataItem(narrowHub); Register narrowKlass = asm.emitLoadNarrowPointer(ref); Register klass = asm.emitUncompressPointer(narrowKlass, config.narrowKlassBase, config.narrowKlassShift); - Register ret = asm.emitLoadPointer(klass, config.classMirrorOffset); + Register ret = asm.emitLoadPointer(asm.emitLoadPointer(klass, config.classMirrorHandleOffset), 0); asm.emitPointerRet(ret); }); } diff --git a/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/TestHotSpotVMConfig.java b/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/TestHotSpotVMConfig.java index cc80c0bcdbe..71182b1a7bf 100644 --- a/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/TestHotSpotVMConfig.java +++ b/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.code.test/src/jdk/vm/ci/code/test/TestHotSpotVMConfig.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -40,7 +40,7 @@ public class TestHotSpotVMConfig extends HotSpotVMConfigAccess { public final long narrowKlassBase = getFieldValue("CompilerToVM::Data::Universe_narrow_klass_base", Long.class, "address"); public final int narrowKlassShift = getFieldValue("CompilerToVM::Data::Universe_narrow_klass_shift", Integer.class, "int"); - public final int classMirrorOffset = getFieldOffset("Klass::_java_mirror", Integer.class, "oop"); + public final int classMirrorHandleOffset = getFieldOffset("Klass::_java_mirror", Integer.class, "OopHandle"); public final int MARKID_DEOPT_HANDLER_ENTRY = getConstant("CodeInstaller::DEOPT_HANDLER_ENTRY", Integer.class); public final long handleDeoptStub = getFieldValue("CompilerToVM::Data::SharedRuntime_deopt_blob_unpack", Long.class, "address"); diff --git a/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.hotspot.test/src/jdk/vm/ci/hotspot/test/MemoryAccessProviderData.java b/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.hotspot.test/src/jdk/vm/ci/hotspot/test/MemoryAccessProviderData.java index 1122bd7eb5d..54f5d41ff38 100644 --- a/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.hotspot.test/src/jdk/vm/ci/hotspot/test/MemoryAccessProviderData.java +++ b/test/hotspot/jtreg/compiler/jvmci/jdk.vm.ci.hotspot.test/src/jdk/vm/ci/hotspot/test/MemoryAccessProviderData.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -64,7 +64,7 @@ public class MemoryAccessProviderData { @DataProvider(name = "positiveObject") public static Object[][] getPositiveObjectJavaKind() { HotSpotJVMCIRuntimeProvider runtime = (HotSpotJVMCIRuntimeProvider) JVMCI.getRuntime(); - int offset = new HotSpotVMConfigAccess(runtime.getConfigStore()).getFieldOffset("Klass::_java_mirror", Integer.class, "oop"); + int offset = new HotSpotVMConfigAccess(runtime.getConfigStore()).getFieldOffset("Klass::_java_mirror", Integer.class, "OopHandle"); Constant wrappedKlassPointer = ((HotSpotResolvedObjectType) runtime.fromClass(TestClass.class)).klass(); return new Object[][]{new Object[]{JavaKind.Object, wrappedKlassPointer, (long) offset, TEST_CLASS_CONSTANT, 0}}; } From e6765bf9bfd9eeb956d294af80ad558dbf055571 Mon Sep 17 00:00:00 2001 From: Rohit Arul Raj Date: Tue, 3 Oct 2017 15:32:27 -0700 Subject: [PATCH 31/80] 8187219: Newer AMD 17h (EPYC) Processor family defaults Reviewed-by: dholmes, kvn --- src/hotspot/cpu/x86/vm_version_x86.cpp | 42 +++++++++++++++++++++++--- src/hotspot/cpu/x86/vm_version_x86.hpp | 40 ++++++++++++++++++------ 2 files changed, 67 insertions(+), 15 deletions(-) diff --git a/src/hotspot/cpu/x86/vm_version_x86.cpp b/src/hotspot/cpu/x86/vm_version_x86.cpp index 99e402f8dee..6e3acc22315 100644 --- a/src/hotspot/cpu/x86/vm_version_x86.cpp +++ b/src/hotspot/cpu/x86/vm_version_x86.cpp @@ -46,7 +46,7 @@ address VM_Version::_cpuinfo_segv_addr = 0; address VM_Version::_cpuinfo_cont_addr = 0; static BufferBlob* stub_blob; -static const int stub_size = 1000; +static const int stub_size = 1100; extern "C" { typedef void (*get_cpu_info_stub_t)(void*); @@ -70,7 +70,7 @@ class VM_Version_StubGenerator: public StubCodeGenerator { bool use_evex = FLAG_IS_DEFAULT(UseAVX) || (UseAVX > 2); Label detect_486, cpu486, detect_586, std_cpuid1, std_cpuid4; - Label sef_cpuid, ext_cpuid, ext_cpuid1, ext_cpuid5, ext_cpuid7, done, wrapup; + Label sef_cpuid, ext_cpuid, ext_cpuid1, ext_cpuid5, ext_cpuid7, ext_cpuid8, done, wrapup; Label legacy_setup, save_restore_except, legacy_save_restore, start_simd_check; StubCodeMark mark(this, "VM_Version", "get_cpu_info_stub"); @@ -267,14 +267,30 @@ class VM_Version_StubGenerator: public StubCodeGenerator { __ cmpl(rax, 0x80000000); // Is cpuid(0x80000001) supported? __ jcc(Assembler::belowEqual, done); __ cmpl(rax, 0x80000004); // Is cpuid(0x80000005) supported? - __ jccb(Assembler::belowEqual, ext_cpuid1); + __ jcc(Assembler::belowEqual, ext_cpuid1); __ cmpl(rax, 0x80000006); // Is cpuid(0x80000007) supported? __ jccb(Assembler::belowEqual, ext_cpuid5); __ cmpl(rax, 0x80000007); // Is cpuid(0x80000008) supported? __ jccb(Assembler::belowEqual, ext_cpuid7); + __ cmpl(rax, 0x80000008); // Is cpuid(0x80000009 and above) supported? + __ jccb(Assembler::belowEqual, ext_cpuid8); + __ cmpl(rax, 0x8000001E); // Is cpuid(0x8000001E) supported? + __ jccb(Assembler::below, ext_cpuid8); + // + // Extended cpuid(0x8000001E) + // + __ movl(rax, 0x8000001E); + __ cpuid(); + __ lea(rsi, Address(rbp, in_bytes(VM_Version::ext_cpuid1E_offset()))); + __ movl(Address(rsi, 0), rax); + __ movl(Address(rsi, 4), rbx); + __ movl(Address(rsi, 8), rcx); + __ movl(Address(rsi,12), rdx); + // // Extended cpuid(0x80000008) // + __ bind(ext_cpuid8); __ movl(rax, 0x80000008); __ cpuid(); __ lea(rsi, Address(rbp, in_bytes(VM_Version::ext_cpuid8_offset()))); @@ -1109,11 +1125,27 @@ void VM_Version::get_processor_features() { } #ifdef COMPILER2 - if (MaxVectorSize > 16) { - // Limit vectors size to 16 bytes on current AMD cpus. + if (cpu_family() < 0x17 && MaxVectorSize > 16) { + // Limit vectors size to 16 bytes on AMD cpus < 17h. FLAG_SET_DEFAULT(MaxVectorSize, 16); } #endif // COMPILER2 + + // Some defaults for AMD family 17h + if ( cpu_family() == 0x17 ) { + // On family 17h processors use XMM and UnalignedLoadStores for Array Copy + if (supports_sse2() && FLAG_IS_DEFAULT(UseXMMForArrayCopy)) { + FLAG_SET_DEFAULT(UseXMMForArrayCopy, true); + } + if (supports_sse2() && FLAG_IS_DEFAULT(UseUnalignedLoadStores)) { + FLAG_SET_DEFAULT(UseUnalignedLoadStores, true); + } +#ifdef COMPILER2 + if (supports_sse4_2() && FLAG_IS_DEFAULT(UseFPUForSpilling)) { + FLAG_SET_DEFAULT(UseFPUForSpilling, true); + } +#endif + } } if( is_intel() ) { // Intel cpus specific settings diff --git a/src/hotspot/cpu/x86/vm_version_x86.hpp b/src/hotspot/cpu/x86/vm_version_x86.hpp index 23c2c7c195c..0a3b53a5271 100644 --- a/src/hotspot/cpu/x86/vm_version_x86.hpp +++ b/src/hotspot/cpu/x86/vm_version_x86.hpp @@ -228,6 +228,15 @@ class VM_Version : public Abstract_VM_Version { } bits; }; + union ExtCpuid1EEbx { + uint32_t value; + struct { + uint32_t : 8, + threads_per_core : 8, + : 16; + } bits; + }; + union XemXcr0Eax { uint32_t value; struct { @@ -398,6 +407,12 @@ protected: ExtCpuid8Ecx ext_cpuid8_ecx; uint32_t ext_cpuid8_edx; // reserved + // cpuid function 0x8000001E // AMD 17h + uint32_t ext_cpuid1E_eax; + ExtCpuid1EEbx ext_cpuid1E_ebx; // threads per core (AMD17h) + uint32_t ext_cpuid1E_ecx; + uint32_t ext_cpuid1E_edx; // unused currently + // extended control register XCR0 (the XFEATURE_ENABLED_MASK register) XemXcr0Eax xem_xcr0_eax; uint32_t xem_xcr0_edx; // reserved @@ -505,6 +520,14 @@ protected: result |= CPU_CLMUL; if (_cpuid_info.sef_cpuid7_ebx.bits.rtm != 0) result |= CPU_RTM; + if(_cpuid_info.sef_cpuid7_ebx.bits.adx != 0) + result |= CPU_ADX; + if(_cpuid_info.sef_cpuid7_ebx.bits.bmi2 != 0) + result |= CPU_BMI2; + if (_cpuid_info.sef_cpuid7_ebx.bits.sha != 0) + result |= CPU_SHA; + if (_cpuid_info.std_cpuid1_ecx.bits.fma != 0) + result |= CPU_FMA; // AMD features. if (is_amd()) { @@ -518,16 +541,8 @@ protected: } // Intel features. if(is_intel()) { - if(_cpuid_info.sef_cpuid7_ebx.bits.adx != 0) - result |= CPU_ADX; - if(_cpuid_info.sef_cpuid7_ebx.bits.bmi2 != 0) - result |= CPU_BMI2; - if (_cpuid_info.sef_cpuid7_ebx.bits.sha != 0) - result |= CPU_SHA; if(_cpuid_info.ext_cpuid1_ecx.bits.lzcnt_intel != 0) result |= CPU_LZCNT; - if (_cpuid_info.std_cpuid1_ecx.bits.fma != 0) - result |= CPU_FMA; // for Intel, ecx.bits.misalignsse bit (bit 8) indicates support for prefetchw if (_cpuid_info.ext_cpuid1_ecx.bits.misalignsse != 0) { result |= CPU_3DNOW_PREFETCH; @@ -590,6 +605,7 @@ public: static ByteSize ext_cpuid5_offset() { return byte_offset_of(CpuidInfo, ext_cpuid5_eax); } static ByteSize ext_cpuid7_offset() { return byte_offset_of(CpuidInfo, ext_cpuid7_eax); } static ByteSize ext_cpuid8_offset() { return byte_offset_of(CpuidInfo, ext_cpuid8_eax); } + static ByteSize ext_cpuid1E_offset() { return byte_offset_of(CpuidInfo, ext_cpuid1E_eax); } static ByteSize tpl_cpuidB0_offset() { return byte_offset_of(CpuidInfo, tpl_cpuidB0_eax); } static ByteSize tpl_cpuidB1_offset() { return byte_offset_of(CpuidInfo, tpl_cpuidB1_eax); } static ByteSize tpl_cpuidB2_offset() { return byte_offset_of(CpuidInfo, tpl_cpuidB2_eax); } @@ -673,8 +689,12 @@ public: if (is_intel() && supports_processor_topology()) { result = _cpuid_info.tpl_cpuidB0_ebx.bits.logical_cpus; } else if (_cpuid_info.std_cpuid1_edx.bits.ht != 0) { - result = _cpuid_info.std_cpuid1_ebx.bits.threads_per_cpu / - cores_per_cpu(); + if (cpu_family() >= 0x17) { + result = _cpuid_info.ext_cpuid1E_ebx.bits.threads_per_core + 1; + } else { + result = _cpuid_info.std_cpuid1_ebx.bits.threads_per_cpu / + cores_per_cpu(); + } } return (result == 0 ? 1 : result); } From 7b17b2d2a3e1a9bb615700f4dca501b41698b419 Mon Sep 17 00:00:00 2001 From: Michihiro Horie Date: Tue, 3 Oct 2017 17:37:15 -0700 Subject: [PATCH 32/80] 8188139: PPC64: Superword Level Parallelization with VSX Reviewed-by: kvn, gromero --- src/hotspot/cpu/ppc/assembler_ppc.hpp | 9 + src/hotspot/cpu/ppc/assembler_ppc.inline.hpp | 17 +- src/hotspot/cpu/ppc/ppc.ad | 699 +++++++++++++++++- .../cpu/ppc/register_definitions_ppc.cpp | 2 + src/hotspot/cpu/ppc/register_ppc.hpp | 2 +- src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp | 8 +- src/hotspot/cpu/ppc/vm_version_ppc.cpp | 5 +- src/hotspot/share/adlc/output_c.cpp | 4 + src/hotspot/share/opto/machnode.hpp | 12 + src/hotspot/share/opto/type.cpp | 8 +- 10 files changed, 750 insertions(+), 16 deletions(-) diff --git a/src/hotspot/cpu/ppc/assembler_ppc.hpp b/src/hotspot/cpu/ppc/assembler_ppc.hpp index 62c395d2a50..0b56f9bbe58 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.hpp @@ -517,6 +517,9 @@ class Assembler : public AbstractAssembler { XXPERMDI_OPCODE= (60u << OPCODE_SHIFT | 10u << 3), XXMRGHW_OPCODE = (60u << OPCODE_SHIFT | 18u << 3), XXMRGLW_OPCODE = (60u << OPCODE_SHIFT | 50u << 3), + XXSPLTW_OPCODE = (60u << OPCODE_SHIFT | 164u << 2), + XXLXOR_OPCODE = (60u << OPCODE_SHIFT | 154u << 3), + XXLEQV_OPCODE = (60u << OPCODE_SHIFT | 186u << 3), // Vector Permute and Formatting VPKPX_OPCODE = (4u << OPCODE_SHIFT | 782u ), @@ -1125,6 +1128,7 @@ class Assembler : public AbstractAssembler { static int vsplti_sim(int x) { return opp_u_field(x, 15, 11); } // for vsplti* instructions static int vsldoi_shb(int x) { return opp_u_field(x, 25, 22); } // for vsldoi instruction static int vcmp_rc( int x) { return opp_u_field(x, 21, 21); } // for vcmp* instructions + static int xxsplt_uim(int x) { return opp_u_field(x, 15, 14); } // for xxsplt* instructions //static int xo1( int x) { return opp_u_field(x, 29, 21); }// is contained in our opcodes //static int xo2( int x) { return opp_u_field(x, 30, 21); }// is contained in our opcodes @@ -2155,6 +2159,11 @@ class Assembler : public AbstractAssembler { inline void xxpermdi( VectorSRegister d, VectorSRegister a, VectorSRegister b, int dm); inline void xxmrghw( VectorSRegister d, VectorSRegister a, VectorSRegister b); inline void xxmrglw( VectorSRegister d, VectorSRegister a, VectorSRegister b); + inline void mtvsrd( VectorSRegister d, Register a); + inline void mtvsrwz( VectorSRegister d, Register a); + inline void xxspltw( VectorSRegister d, VectorSRegister b, int ui2); + inline void xxlxor( VectorSRegister d, VectorSRegister a, VectorSRegister b); + inline void xxleqv( VectorSRegister d, VectorSRegister a, VectorSRegister b); // VSX Extended Mnemonics inline void xxspltd( VectorSRegister d, VectorSRegister a, int x); diff --git a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp index f409c4d0276..1f1cfb4f2c6 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp @@ -759,15 +759,20 @@ inline void Assembler::lvsl( VectorRegister d, Register s1, Register s2) { emit inline void Assembler::lvsr( VectorRegister d, Register s1, Register s2) { emit_int32( LVSR_OPCODE | vrt(d) | ra0mem(s1) | rb(s2)); } // Vector-Scalar (VSX) instructions. -inline void Assembler::lxvd2x( VectorSRegister d, Register s1) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra(0) | rb(s1)); } -inline void Assembler::lxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra0mem(s1) | rb(s2)); } -inline void Assembler::stxvd2x( VectorSRegister d, Register s1) { emit_int32( STXVD2X_OPCODE | vsrt(d) | ra(0) | rb(s1)); } -inline void Assembler::stxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( STXVD2X_OPCODE | vsrt(d) | ra0mem(s1) | rb(s2)); } -inline void Assembler::mtvrd( VectorRegister d, Register a) { emit_int32( MTVSRD_OPCODE | vsrt(d->to_vsr()) | ra(a)); } +inline void Assembler::lxvd2x( VectorSRegister d, Register s1) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra(0) | rb(s1) | 1u); } +inline void Assembler::lxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra0mem(s1) | rb(s2) | 1u); } +inline void Assembler::stxvd2x( VectorSRegister d, Register s1) { emit_int32( STXVD2X_OPCODE | vsrs(d) | ra(0) | rb(s1) | 1u); } +inline void Assembler::stxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( STXVD2X_OPCODE | vsrs(d) | ra0mem(s1) | rb(s2) | 1u); } +inline void Assembler::mtvsrd( VectorSRegister d, Register a) { emit_int32( MTVSRD_OPCODE | vsrt(d) | ra(a) | 1u); } +inline void Assembler::mtvsrwz( VectorSRegister d, Register a) { emit_int32( MTVSRWZ_OPCODE | vsrt(d) | ra(a) | 1u); } +inline void Assembler::xxspltw( VectorSRegister d, VectorSRegister b, int ui2) { emit_int32( XXSPLTW_OPCODE | vsrt(d) | vsrb(b) | xxsplt_uim(uimm(ui2,2)) | 1u << 1 | 1u); } +inline void Assembler::xxlxor( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXLXOR_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | 1u << 2 | 1u << 1 | 1u); } +inline void Assembler::xxleqv( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXLEQV_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | 1u << 2 | 1u << 1 | 1u); } +inline void Assembler::mtvrd( VectorRegister d, Register a) { emit_int32( MTVSRD_OPCODE | vsrt(d->to_vsr()) | ra(a)); } inline void Assembler::mfvrd( Register a, VectorRegister d) { emit_int32( MFVSRD_OPCODE | vsrt(d->to_vsr()) | ra(a)); } inline void Assembler::mtvrwz( VectorRegister d, Register a) { emit_int32( MTVSRWZ_OPCODE | vsrt(d->to_vsr()) | ra(a)); } inline void Assembler::mfvrwz( Register a, VectorRegister d) { emit_int32( MFVSRWZ_OPCODE | vsrt(d->to_vsr()) | ra(a)); } -inline void Assembler::xxpermdi(VectorSRegister d, VectorSRegister a, VectorSRegister b, int dm) { emit_int32( XXPERMDI_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | vsdm(dm)); } +inline void Assembler::xxpermdi(VectorSRegister d, VectorSRegister a, VectorSRegister b, int dm) { emit_int32( XXPERMDI_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | 0u << 10 | vsdm(dm) | 1u << 2 | 1u << 1 | 1u); } inline void Assembler::xxmrghw( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXMRGHW_OPCODE | vsrt(d) | vsra(a) | vsrb(b)); } inline void Assembler::xxmrglw( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXMRGHW_OPCODE | vsrt(d) | vsra(a) | vsrb(b)); } diff --git a/src/hotspot/cpu/ppc/ppc.ad b/src/hotspot/cpu/ppc/ppc.ad index de0d6088460..68e7060f910 100644 --- a/src/hotspot/cpu/ppc/ppc.ad +++ b/src/hotspot/cpu/ppc/ppc.ad @@ -254,6 +254,73 @@ register %{ reg_def SR_SPEFSCR(SOC, SOC, Op_RegP, 4, SR_SPEFSCR->as_VMReg()); // v reg_def SR_PPR( SOC, SOC, Op_RegP, 5, SR_PPR->as_VMReg()); // v +// ---------------------------- +// Vector-Scalar Registers +// ---------------------------- + reg_def VSR0 ( SOC, SOC, Op_VecX, 0, NULL); + reg_def VSR1 ( SOC, SOC, Op_VecX, 1, NULL); + reg_def VSR2 ( SOC, SOC, Op_VecX, 2, NULL); + reg_def VSR3 ( SOC, SOC, Op_VecX, 3, NULL); + reg_def VSR4 ( SOC, SOC, Op_VecX, 4, NULL); + reg_def VSR5 ( SOC, SOC, Op_VecX, 5, NULL); + reg_def VSR6 ( SOC, SOC, Op_VecX, 6, NULL); + reg_def VSR7 ( SOC, SOC, Op_VecX, 7, NULL); + reg_def VSR8 ( SOC, SOC, Op_VecX, 8, NULL); + reg_def VSR9 ( SOC, SOC, Op_VecX, 9, NULL); + reg_def VSR10 ( SOC, SOC, Op_VecX, 10, NULL); + reg_def VSR11 ( SOC, SOC, Op_VecX, 11, NULL); + reg_def VSR12 ( SOC, SOC, Op_VecX, 12, NULL); + reg_def VSR13 ( SOC, SOC, Op_VecX, 13, NULL); + reg_def VSR14 ( SOC, SOC, Op_VecX, 14, NULL); + reg_def VSR15 ( SOC, SOC, Op_VecX, 15, NULL); + reg_def VSR16 ( SOC, SOC, Op_VecX, 16, NULL); + reg_def VSR17 ( SOC, SOC, Op_VecX, 17, NULL); + reg_def VSR18 ( SOC, SOC, Op_VecX, 18, NULL); + reg_def VSR19 ( SOC, SOC, Op_VecX, 19, NULL); + reg_def VSR20 ( SOC, SOC, Op_VecX, 20, NULL); + reg_def VSR21 ( SOC, SOC, Op_VecX, 21, NULL); + reg_def VSR22 ( SOC, SOC, Op_VecX, 22, NULL); + reg_def VSR23 ( SOC, SOC, Op_VecX, 23, NULL); + reg_def VSR24 ( SOC, SOC, Op_VecX, 24, NULL); + reg_def VSR25 ( SOC, SOC, Op_VecX, 25, NULL); + reg_def VSR26 ( SOC, SOC, Op_VecX, 26, NULL); + reg_def VSR27 ( SOC, SOC, Op_VecX, 27, NULL); + reg_def VSR28 ( SOC, SOC, Op_VecX, 28, NULL); + reg_def VSR29 ( SOC, SOC, Op_VecX, 29, NULL); + reg_def VSR30 ( SOC, SOC, Op_VecX, 30, NULL); + reg_def VSR31 ( SOC, SOC, Op_VecX, 31, NULL); + reg_def VSR32 ( SOC, SOC, Op_VecX, 32, NULL); + reg_def VSR33 ( SOC, SOC, Op_VecX, 33, NULL); + reg_def VSR34 ( SOC, SOC, Op_VecX, 34, NULL); + reg_def VSR35 ( SOC, SOC, Op_VecX, 35, NULL); + reg_def VSR36 ( SOC, SOC, Op_VecX, 36, NULL); + reg_def VSR37 ( SOC, SOC, Op_VecX, 37, NULL); + reg_def VSR38 ( SOC, SOC, Op_VecX, 38, NULL); + reg_def VSR39 ( SOC, SOC, Op_VecX, 39, NULL); + reg_def VSR40 ( SOC, SOC, Op_VecX, 40, NULL); + reg_def VSR41 ( SOC, SOC, Op_VecX, 41, NULL); + reg_def VSR42 ( SOC, SOC, Op_VecX, 42, NULL); + reg_def VSR43 ( SOC, SOC, Op_VecX, 43, NULL); + reg_def VSR44 ( SOC, SOC, Op_VecX, 44, NULL); + reg_def VSR45 ( SOC, SOC, Op_VecX, 45, NULL); + reg_def VSR46 ( SOC, SOC, Op_VecX, 46, NULL); + reg_def VSR47 ( SOC, SOC, Op_VecX, 47, NULL); + reg_def VSR48 ( SOC, SOC, Op_VecX, 48, NULL); + reg_def VSR49 ( SOC, SOC, Op_VecX, 49, NULL); + reg_def VSR50 ( SOC, SOC, Op_VecX, 50, NULL); + reg_def VSR51 ( SOC, SOC, Op_VecX, 51, NULL); + reg_def VSR52 ( SOC, SOC, Op_VecX, 52, NULL); + reg_def VSR53 ( SOC, SOC, Op_VecX, 53, NULL); + reg_def VSR54 ( SOC, SOC, Op_VecX, 54, NULL); + reg_def VSR55 ( SOC, SOC, Op_VecX, 55, NULL); + reg_def VSR56 ( SOC, SOC, Op_VecX, 56, NULL); + reg_def VSR57 ( SOC, SOC, Op_VecX, 57, NULL); + reg_def VSR58 ( SOC, SOC, Op_VecX, 58, NULL); + reg_def VSR59 ( SOC, SOC, Op_VecX, 59, NULL); + reg_def VSR60 ( SOC, SOC, Op_VecX, 60, NULL); + reg_def VSR61 ( SOC, SOC, Op_VecX, 61, NULL); + reg_def VSR62 ( SOC, SOC, Op_VecX, 62, NULL); + reg_def VSR63 ( SOC, SOC, Op_VecX, 63, NULL); // ---------------------------- // Specify priority of register selection within phases of register @@ -395,6 +462,73 @@ alloc_class chunk3 ( SR_PPR ); +alloc_class chunk4 ( + VSR0, + VSR1, + VSR2, + VSR3, + VSR4, + VSR5, + VSR6, + VSR7, + VSR8, + VSR9, + VSR10, + VSR11, + VSR12, + VSR13, + VSR14, + VSR15, + VSR16, + VSR17, + VSR18, + VSR19, + VSR20, + VSR21, + VSR22, + VSR23, + VSR24, + VSR25, + VSR26, + VSR27, + VSR28, + VSR29, + VSR30, + VSR31, + VSR32, + VSR33, + VSR34, + VSR35, + VSR36, + VSR37, + VSR38, + VSR39, + VSR40, + VSR41, + VSR42, + VSR43, + VSR44, + VSR45, + VSR46, + VSR47, + VSR48, + VSR49, + VSR50, + VSR51, + VSR52, + VSR53, + VSR54, + VSR55, + VSR56, + VSR57, + VSR58, + VSR59, + VSR60, + VSR61, + VSR62, + VSR63 +); + //-------Architecture Description Register Classes----------------------- // Several register classes are automatically defined based upon @@ -769,6 +903,73 @@ reg_class dbl_reg( F31, F31_H // nv! ); +// Class for all 128bit vector registers +reg_class vectorx_reg(VSR0, + VSR1, + VSR2, + VSR3, + VSR4, + VSR5, + VSR6, + VSR7, + VSR8, + VSR9, + VSR10, + VSR11, + VSR12, + VSR13, + VSR14, + VSR15, + VSR16, + VSR17, + VSR18, + VSR19, + VSR20, + VSR21, + VSR22, + VSR23, + VSR24, + VSR25, + VSR26, + VSR27, + VSR28, + VSR29, + VSR30, + VSR31, + VSR32, + VSR33, + VSR34, + VSR35, + VSR36, + VSR37, + VSR38, + VSR39, + VSR40, + VSR41, + VSR42, + VSR43, + VSR44, + VSR45, + VSR46, + VSR47, + VSR48, + VSR49, + VSR50, + VSR51, + VSR52, + VSR53, + VSR54, + VSR55, + VSR56, + VSR57, + VSR58, + VSR59, + VSR60, + VSR61, + VSR62, + VSR63 +); + %} //----------DEFINITION BLOCK--------------------------------------------------- @@ -2048,14 +2249,24 @@ const bool Matcher::convL2FSupported(void) { // Vector width in bytes. const int Matcher::vector_width_in_bytes(BasicType bt) { - assert(MaxVectorSize == 8, ""); - return 8; + if (VM_Version::has_vsx()) { + assert(MaxVectorSize == 16, ""); + return 16; + } else { + assert(MaxVectorSize == 8, ""); + return 8; + } } // Vector ideal reg. const uint Matcher::vector_ideal_reg(int size) { - assert(MaxVectorSize == 8 && size == 8, ""); - return Op_RegL; + if (VM_Version::has_vsx()) { + assert(MaxVectorSize == 16 && size == 16, ""); + return Op_VecX; + } else { + assert(MaxVectorSize == 8 && size == 8, ""); + return Op_RegL; + } } const uint Matcher::vector_shift_count_ideal_reg(int size) { @@ -2075,7 +2286,10 @@ const int Matcher::min_vector_size(const BasicType bt) { // PPC doesn't support misaligned vectors store/load. const bool Matcher::misaligned_vectors_ok() { - return false; + if (VM_Version::has_vsx()) + return !AlignVector; // can be changed by flag + else + return false; } // PPC AES support not yet implemented @@ -2217,10 +2431,31 @@ const MachRegisterNumbers farg_reg[13] = { F13_num }; +const MachRegisterNumbers vsarg_reg[64] = { + VSR0_num, VSR1_num, VSR2_num, VSR3_num, + VSR4_num, VSR5_num, VSR6_num, VSR7_num, + VSR8_num, VSR9_num, VSR10_num, VSR11_num, + VSR12_num, VSR13_num, VSR14_num, VSR15_num, + VSR16_num, VSR17_num, VSR18_num, VSR19_num, + VSR20_num, VSR21_num, VSR22_num, VSR23_num, + VSR24_num, VSR23_num, VSR24_num, VSR25_num, + VSR28_num, VSR29_num, VSR30_num, VSR31_num, + VSR32_num, VSR33_num, VSR34_num, VSR35_num, + VSR36_num, VSR37_num, VSR38_num, VSR39_num, + VSR40_num, VSR41_num, VSR42_num, VSR43_num, + VSR44_num, VSR45_num, VSR46_num, VSR47_num, + VSR48_num, VSR49_num, VSR50_num, VSR51_num, + VSR52_num, VSR53_num, VSR54_num, VSR55_num, + VSR56_num, VSR57_num, VSR58_num, VSR59_num, + VSR60_num, VSR61_num, VSR62_num, VSR63_num +}; + const int num_iarg_registers = sizeof(iarg_reg) / sizeof(iarg_reg[0]); const int num_farg_registers = sizeof(farg_reg) / sizeof(farg_reg[0]); +const int num_vsarg_registers = sizeof(vsarg_reg) / sizeof(vsarg_reg[0]); + // Return whether or not this register is ever used as an argument. This // function is used on startup to build the trampoline stubs in generateOptoStub. // Registers not mentioned will be killed by the VM call in the trampoline, and @@ -2552,6 +2787,115 @@ loadConLNodesTuple loadConLNodesTuple_create(PhaseRegAlloc *ra_, Node *toc, immL return nodes; } +typedef struct { + loadConL_hiNode *_large_hi; + loadConL_loNode *_large_lo; + mtvsrdNode *_moved; + xxspltdNode *_replicated; + loadConLNode *_small; + MachNode *_last; +} loadConLReplicatedNodesTuple; + +loadConLReplicatedNodesTuple loadConLReplicatedNodesTuple_create(Compile *C, PhaseRegAlloc *ra_, Node *toc, immLOper *immSrc, + vecXOper *dst, immI_0Oper *zero, + OptoReg::Name reg_second, OptoReg::Name reg_first, + OptoReg::Name reg_vec_second, OptoReg::Name reg_vec_first) { + loadConLReplicatedNodesTuple nodes; + + const bool large_constant_pool = true; // TODO: PPC port C->cfg()->_consts_size > 4000; + if (large_constant_pool) { + // Create new nodes. + loadConL_hiNode *m1 = new loadConL_hiNode(); + loadConL_loNode *m2 = new loadConL_loNode(); + mtvsrdNode *m3 = new mtvsrdNode(); + xxspltdNode *m4 = new xxspltdNode(); + + // inputs for new nodes + m1->add_req(NULL, toc); + m2->add_req(NULL, m1); + m3->add_req(NULL, m2); + m4->add_req(NULL, m3); + + // operands for new nodes + m1->_opnds[0] = new iRegLdstOper(); // dst + m1->_opnds[1] = immSrc; // src + m1->_opnds[2] = new iRegPdstOper(); // toc + + m2->_opnds[0] = new iRegLdstOper(); // dst + m2->_opnds[1] = immSrc; // src + m2->_opnds[2] = new iRegLdstOper(); // base + + m3->_opnds[0] = new vecXOper(); // dst + m3->_opnds[1] = new iRegLdstOper(); // src + + m4->_opnds[0] = new vecXOper(); // dst + m4->_opnds[1] = new vecXOper(); // src + m4->_opnds[2] = zero; + + // Initialize ins_attrib TOC fields. + m1->_const_toc_offset = -1; + m2->_const_toc_offset_hi_node = m1; + + // Initialize ins_attrib instruction offset. + m1->_cbuf_insts_offset = -1; + + // register allocation for new nodes + ra_->set_pair(m1->_idx, reg_second, reg_first); + ra_->set_pair(m2->_idx, reg_second, reg_first); + ra_->set1(m3->_idx, reg_second); + ra_->set2(m3->_idx, reg_vec_first); + ra_->set_pair(m4->_idx, reg_vec_second, reg_vec_first); + + // Create result. + nodes._large_hi = m1; + nodes._large_lo = m2; + nodes._moved = m3; + nodes._replicated = m4; + nodes._small = NULL; + nodes._last = nodes._replicated; + assert(m2->bottom_type()->isa_long(), "must be long"); + } else { + loadConLNode *m2 = new loadConLNode(); + mtvsrdNode *m3 = new mtvsrdNode(); + xxspltdNode *m4 = new xxspltdNode(); + + // inputs for new nodes + m2->add_req(NULL, toc); + + // operands for new nodes + m2->_opnds[0] = new iRegLdstOper(); // dst + m2->_opnds[1] = immSrc; // src + m2->_opnds[2] = new iRegPdstOper(); // toc + + m3->_opnds[0] = new vecXOper(); // dst + m3->_opnds[1] = new iRegLdstOper(); // src + + m4->_opnds[0] = new vecXOper(); // dst + m4->_opnds[1] = new vecXOper(); // src + m4->_opnds[2] = zero; + + // Initialize ins_attrib instruction offset. + m2->_cbuf_insts_offset = -1; + ra_->set1(m3->_idx, reg_second); + ra_->set2(m3->_idx, reg_vec_first); + ra_->set_pair(m4->_idx, reg_vec_second, reg_vec_first); + + // register allocation for new nodes + ra_->set_pair(m2->_idx, reg_second, reg_first); + + // Create result. + nodes._large_hi = NULL; + nodes._large_lo = NULL; + nodes._small = m2; + nodes._moved = m3; + nodes._replicated = m4; + nodes._last = nodes._replicated; + assert(m2->bottom_type()->isa_long(), "must be long"); + } + + return nodes; +} + %} // source encode %{ @@ -3212,6 +3556,27 @@ encode %{ assert(loadConLNodes._last->bottom_type()->isa_long(), "must be long"); %} + enc_class postalloc_expand_load_replF_constant_vsx(vecX dst, immF src, iRegLdst toc) %{ + // Create new nodes. + + // Make an operand with the bit pattern to load as float. + immLOper *op_repl = new immLOper((jlong)replicate_immF(op_src->constantF())); + immI_0Oper *op_zero = new immI_0Oper(0); + + loadConLReplicatedNodesTuple loadConLNodes = + loadConLReplicatedNodesTuple_create(C, ra_, n_toc, op_repl, op_dst, op_zero, + OptoReg::Name(R20_H_num), OptoReg::Name(R20_num), + OptoReg::Name(VSR11_num), OptoReg::Name(VSR10_num)); + + // Push new nodes. + if (loadConLNodes._large_hi) { nodes->push(loadConLNodes._large_hi); } + if (loadConLNodes._large_lo) { nodes->push(loadConLNodes._large_lo); } + if (loadConLNodes._moved) { nodes->push(loadConLNodes._moved); } + if (loadConLNodes._last) { nodes->push(loadConLNodes._last); } + + assert(nodes->length() >= 1, "must have created at least 1 node"); + %} + // This enc_class is needed so that scheduler gets proper // input mapping for latency computation. enc_class enc_poll(immI dst, iRegLdst poll) %{ @@ -3840,6 +4205,14 @@ ins_attrib ins_field_load_ic_node(0); // // Formats are generated automatically for constants and base registers. +operand vecX() %{ + constraint(ALLOC_IN_RC(vectorx_reg)); + match(VecX); + + format %{ %} + interface(REG_INTER); +%} + //----------Simple Operands---------------------------------------------------- // Immediate Operands @@ -5372,6 +5745,20 @@ instruct loadV8(iRegLdst dst, memoryAlg4 mem) %{ ins_pipe(pipe_class_memory); %} +// Load Aligned Packed Byte +instruct loadV16(vecX dst, indirect mem) %{ + predicate(n->as_LoadVector()->memory_size() == 16); + match(Set dst (LoadVector mem)); + ins_cost(MEMORY_REF_COST); + + format %{ "LXVD2X $dst, $mem \t// load 16-byte Vector" %} + size(4); + ins_encode %{ + __ lxvd2x($dst$$VectorSRegister, $mem$$Register); + %} + ins_pipe(pipe_class_default); +%} + // Load Range, range = array length (=jint) instruct loadRange(iRegIdst dst, memory mem) %{ match(Set dst (LoadRange mem)); @@ -6368,6 +6755,20 @@ instruct storeA8B(memoryAlg4 mem, iRegLsrc src) %{ ins_pipe(pipe_class_memory); %} +// Store Packed Byte long register to memory +instruct storeV16(indirect mem, vecX src) %{ + predicate(n->as_StoreVector()->memory_size() == 16); + match(Set mem (StoreVector mem src)); + ins_cost(MEMORY_REF_COST); + + format %{ "STXVD2X $mem, $src \t// store 16-byte Vector" %} + size(4); + ins_encode %{ + __ stxvd2x($src$$VectorSRegister, $mem$$Register); + %} + ins_pipe(pipe_class_default); +%} + // Store Compressed Oop instruct storeN(memory dst, iRegN_P2N src) %{ match(Set dst (StoreN dst src)); @@ -13239,6 +13640,26 @@ instruct storeS_reversed(iRegIsrc src, indirect mem) %{ ins_pipe(pipe_class_default); %} +instruct mtvsrwz(vecX temp1, iRegIsrc src) %{ + effect(DEF temp1, USE src); + + size(4); + ins_encode %{ + __ mtvsrwz($temp1$$VectorSRegister, $src$$Register); + %} + ins_pipe(pipe_class_default); +%} + +instruct xxspltw(vecX dst, vecX src, immI8 imm1) %{ + effect(DEF dst, USE src, USE imm1); + + size(4); + ins_encode %{ + __ xxspltw($dst$$VectorSRegister, $src$$VectorSRegister, $imm1$$constant); + %} + ins_pipe(pipe_class_default); +%} + //---------- Replicate Vector Instructions ------------------------------------ // Insrdi does replicate if src == dst. @@ -13318,6 +13739,46 @@ instruct repl8B_immIminus1(iRegLdst dst, immI_minus1 src) %{ ins_pipe(pipe_class_default); %} +instruct repl16B_reg_Ex(vecX dst, iRegIsrc src) %{ + match(Set dst (ReplicateB src)); + predicate(n->as_Vector()->length() == 16); + + expand %{ + iRegLdst tmpL; + vecX tmpV; + immI8 imm1 %{ (int) 1 %} + moveReg(tmpL, src); + repl56(tmpL); + repl48(tmpL); + mtvsrwz(tmpV, tmpL); + xxspltw(dst, tmpV, imm1); + %} +%} + +instruct repl16B_immI0(vecX dst, immI_0 zero) %{ + match(Set dst (ReplicateB zero)); + predicate(n->as_Vector()->length() == 16); + + format %{ "XXLXOR $dst, $zero \t// replicate16B" %} + size(4); + ins_encode %{ + __ xxlxor($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + +instruct repl16B_immIminus1(vecX dst, immI_minus1 src) %{ + match(Set dst (ReplicateB src)); + predicate(n->as_Vector()->length() == 16); + + format %{ "XXLEQV $dst, $src \t// replicate16B" %} + size(4); + ins_encode %{ + __ xxleqv($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + instruct repl4S_reg_Ex(iRegLdst dst, iRegIsrc src) %{ match(Set dst (ReplicateS src)); predicate(n->as_Vector()->length() == 4); @@ -13352,6 +13813,46 @@ instruct repl4S_immIminus1(iRegLdst dst, immI_minus1 src) %{ ins_pipe(pipe_class_default); %} +instruct repl8S_reg_Ex(vecX dst, iRegIsrc src) %{ + match(Set dst (ReplicateS src)); + predicate(n->as_Vector()->length() == 8); + + expand %{ + iRegLdst tmpL; + vecX tmpV; + immI8 zero %{ (int) 0 %} + moveReg(tmpL, src); + repl48(tmpL); + repl32(tmpL); + mtvsrd(tmpV, tmpL); + xxpermdi(dst, tmpV, tmpV, zero); + %} +%} + +instruct repl8S_immI0(vecX dst, immI_0 zero) %{ + match(Set dst (ReplicateS zero)); + predicate(n->as_Vector()->length() == 8); + + format %{ "XXLXOR $dst, $zero \t// replicate8S" %} + size(4); + ins_encode %{ + __ xxlxor($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + +instruct repl8S_immIminus1(vecX dst, immI_minus1 src) %{ + match(Set dst (ReplicateS src)); + predicate(n->as_Vector()->length() == 8); + + format %{ "XXLEQV $dst, $src \t// replicate16B" %} + size(4); + ins_encode %{ + __ xxleqv($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + instruct repl2I_reg_Ex(iRegLdst dst, iRegIsrc src) %{ match(Set dst (ReplicateI src)); predicate(n->as_Vector()->length() == 2); @@ -13386,6 +13887,46 @@ instruct repl2I_immIminus1(iRegLdst dst, immI_minus1 src) %{ ins_pipe(pipe_class_default); %} +instruct repl4I_reg_Ex(vecX dst, iRegIsrc src) %{ + match(Set dst (ReplicateI src)); + predicate(n->as_Vector()->length() == 4); + ins_cost(2 * DEFAULT_COST); + + expand %{ + iRegLdst tmpL; + vecX tmpV; + immI8 zero %{ (int) 0 %} + moveReg(tmpL, src); + repl32(tmpL); + mtvsrd(tmpV, tmpL); + xxpermdi(dst, tmpV, tmpV, zero); + %} +%} + +instruct repl4I_immI0(vecX dst, immI_0 zero) %{ + match(Set dst (ReplicateI zero)); + predicate(n->as_Vector()->length() == 4); + + format %{ "XXLXOR $dst, $zero \t// replicate4I" %} + size(4); + ins_encode %{ + __ xxlxor($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + +instruct repl4I_immIminus1(vecX dst, immI_minus1 src) %{ + match(Set dst (ReplicateI src)); + predicate(n->as_Vector()->length() == 4); + + format %{ "XXLEQV $dst, $dst, $dst \t// replicate4I" %} + size(4); + ins_encode %{ + __ xxleqv($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + // Move float to int register via stack, replicate. instruct repl2F_reg_Ex(iRegLdst dst, regF src) %{ match(Set dst (ReplicateF src)); @@ -13484,6 +14025,154 @@ instruct overflowMulL_reg_reg(flagsRegCR0 cr0, iRegLsrc op1, iRegLsrc op2) %{ %} +instruct repl4F_reg_Ex(vecX dst, regF src) %{ + match(Set dst (ReplicateF src)); + predicate(n->as_Vector()->length() == 4); + ins_cost(2 * MEMORY_REF_COST + DEFAULT_COST); + expand %{ + stackSlotL tmpS; + iRegIdst tmpI; + iRegLdst tmpL; + vecX tmpV; + immI8 zero %{ (int) 0 %} + + moveF2I_reg_stack(tmpS, src); // Move float to stack. + moveF2I_stack_reg(tmpI, tmpS); // Move stack to int reg. + moveReg(tmpL, tmpI); // Move int to long reg. + repl32(tmpL); // Replicate bitpattern. + mtvsrd(tmpV, tmpL); + xxpermdi(dst, tmpV, tmpV, zero); + %} +%} + +instruct repl4F_immF_Ex(vecX dst, immF src) %{ + match(Set dst (ReplicateF src)); + predicate(n->as_Vector()->length() == 4); + ins_cost(10 * DEFAULT_COST); + + postalloc_expand( postalloc_expand_load_replF_constant_vsx(dst, src, constanttablebase) ); +%} + +instruct repl4F_immF0(vecX dst, immF_0 zero) %{ + match(Set dst (ReplicateF zero)); + predicate(n->as_Vector()->length() == 4); + + format %{ "XXLXOR $dst, $zero \t// replicate4F" %} + ins_encode %{ + __ xxlxor($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + +instruct repl2D_reg_Ex(vecX dst, regD src) %{ + match(Set dst (ReplicateD src)); + predicate(n->as_Vector()->length() == 2); + expand %{ + stackSlotL tmpS; + iRegLdst tmpL; + iRegLdst tmp; + vecX tmpV; + immI8 zero %{ (int) 0 %} + moveD2L_reg_stack(tmpS, src); + moveD2L_stack_reg(tmpL, tmpS); + mtvsrd(tmpV, tmpL); + xxpermdi(dst, tmpV, tmpV, zero); + %} +%} + +instruct repl2D_immI0(vecX dst, immI_0 zero) %{ + match(Set dst (ReplicateD zero)); + predicate(n->as_Vector()->length() == 2); + + format %{ "XXLXOR $dst, $zero \t// replicate2D" %} + size(4); + ins_encode %{ + __ xxlxor($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + +instruct repl2D_immIminus1(vecX dst, immI_minus1 src) %{ + match(Set dst (ReplicateD src)); + predicate(n->as_Vector()->length() == 2); + + format %{ "XXLEQV $dst, $src \t// replicate16B" %} + size(4); + ins_encode %{ + __ xxleqv($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + +instruct mtvsrd(vecX dst, iRegLsrc src) %{ + predicate(false); + effect(DEF dst, USE src); + + format %{ "MTVSRD $dst, $src \t// Move to 16-byte register"%} + size(4); + ins_encode %{ + __ mtvsrd($dst$$VectorSRegister, $src$$Register); + %} + ins_pipe(pipe_class_default); +%} + +instruct xxspltd(vecX dst, vecX src, immI8 zero) %{ + effect(DEF dst, USE src, USE zero); + + format %{ "XXSPLATD $dst, $src, $zero \t// Permute 16-byte register"%} + size(4); + ins_encode %{ + __ xxpermdi($dst$$VectorSRegister, $src$$VectorSRegister, $src$$VectorSRegister, $zero$$constant); + %} + ins_pipe(pipe_class_default); +%} + +instruct xxpermdi(vecX dst, vecX src1, vecX src2, immI8 zero) %{ + effect(DEF dst, USE src1, USE src2, USE zero); + + format %{ "XXPERMDI $dst, $src1, $src2, $zero \t// Permute 16-byte register"%} + size(4); + ins_encode %{ + __ xxpermdi($dst$$VectorSRegister, $src1$$VectorSRegister, $src2$$VectorSRegister, $zero$$constant); + %} + ins_pipe(pipe_class_default); +%} + +instruct repl2L_reg_Ex(vecX dst, iRegLsrc src) %{ + match(Set dst (ReplicateL src)); + predicate(n->as_Vector()->length() == 2); + expand %{ + vecX tmpV; + immI8 zero %{ (int) 0 %} + mtvsrd(tmpV, src); + xxpermdi(dst, tmpV, tmpV, zero); + %} +%} + +instruct repl2L_immI0(vecX dst, immI_0 zero) %{ + match(Set dst (ReplicateL zero)); + predicate(n->as_Vector()->length() == 2); + + format %{ "XXLXOR $dst, $zero \t// replicate2L" %} + size(4); + ins_encode %{ + __ xxlxor($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + +instruct repl2L_immIminus1(vecX dst, immI_minus1 src) %{ + match(Set dst (ReplicateL src)); + predicate(n->as_Vector()->length() == 2); + + format %{ "XXLEQV $dst, $src \t// replicate16B" %} + size(4); + ins_encode %{ + __ xxleqv($dst$$VectorSRegister, $dst$$VectorSRegister, $dst$$VectorSRegister); + %} + ins_pipe(pipe_class_default); +%} + // ============================================================================ // Safepoint Instruction diff --git a/src/hotspot/cpu/ppc/register_definitions_ppc.cpp b/src/hotspot/cpu/ppc/register_definitions_ppc.cpp index 2a2d968e44d..d5a064b169f 100644 --- a/src/hotspot/cpu/ppc/register_definitions_ppc.cpp +++ b/src/hotspot/cpu/ppc/register_definitions_ppc.cpp @@ -31,3 +31,5 @@ REGISTER_DEFINITION(Register, noreg); REGISTER_DEFINITION(FloatRegister, fnoreg); + +REGISTER_DEFINITION(VectorSRegister, vsnoreg); diff --git a/src/hotspot/cpu/ppc/register_ppc.hpp b/src/hotspot/cpu/ppc/register_ppc.hpp index c554f88619d..af516ce2d8f 100644 --- a/src/hotspot/cpu/ppc/register_ppc.hpp +++ b/src/hotspot/cpu/ppc/register_ppc.hpp @@ -677,7 +677,7 @@ class ConcreteRegisterImpl : public AbstractRegisterImpl { * 2 // register halves + ConditionRegisterImpl::number_of_registers // condition code registers + SpecialRegisterImpl::number_of_registers // special registers - + VectorRegisterImpl::number_of_registers // VSX registers + + VectorSRegisterImpl::number_of_registers // VSX registers }; static const int max_gpr; diff --git a/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp b/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp index 20a1a963abc..6c6649be948 100644 --- a/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp +++ b/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp @@ -479,8 +479,12 @@ void RegisterSaver::restore_result_registers(MacroAssembler* masm, int frame_siz // Is vector's size (in bytes) bigger than a size saved by default? bool SharedRuntime::is_wide_vector(int size) { - // Note, MaxVectorSize == 8 on PPC64. - assert(size <= 8, "%d bytes vectors are not supported", size); + // Note, MaxVectorSize == 8/16 on PPC64. + if (VM_Version::has_vsx()) { + assert(size <= 16, "%d bytes vectors are not supported", size); + } else { + assert(size <= 8, "%d bytes vectors are not supported", size); + } return size > 8; } diff --git a/src/hotspot/cpu/ppc/vm_version_ppc.cpp b/src/hotspot/cpu/ppc/vm_version_ppc.cpp index c4d3041183d..0bb6aeab787 100644 --- a/src/hotspot/cpu/ppc/vm_version_ppc.cpp +++ b/src/hotspot/cpu/ppc/vm_version_ppc.cpp @@ -107,7 +107,10 @@ void VM_Version::initialize() { // TODO: PPC port PdScheduling::power6SectorSize = 0x20; } - MaxVectorSize = 8; + if (VM_Version::has_vsx()) + MaxVectorSize = 16; + else + MaxVectorSize = 8; #endif // Create and print feature-string. diff --git a/src/hotspot/share/adlc/output_c.cpp b/src/hotspot/share/adlc/output_c.cpp index 3e78d62e5d7..302e67bf5fb 100644 --- a/src/hotspot/share/adlc/output_c.cpp +++ b/src/hotspot/share/adlc/output_c.cpp @@ -2276,6 +2276,10 @@ private: if (strcmp(rep_var,"$XMMRegister") == 0) return "as_XMMRegister"; #endif if (strcmp(rep_var,"$CondRegister") == 0) return "as_ConditionRegister"; +#if defined(PPC64) + if (strcmp(rep_var,"$VectorRegister") == 0) return "as_VectorRegister"; + if (strcmp(rep_var,"$VectorSRegister") == 0) return "as_VectorSRegister"; +#endif return NULL; } diff --git a/src/hotspot/share/opto/machnode.hpp b/src/hotspot/share/opto/machnode.hpp index 60bdc9b8768..8bfd1e5b9c8 100644 --- a/src/hotspot/share/opto/machnode.hpp +++ b/src/hotspot/share/opto/machnode.hpp @@ -115,6 +115,18 @@ public: ConditionRegister as_ConditionRegister(PhaseRegAlloc *ra_, const Node *node, int idx) const { return ::as_ConditionRegister(reg(ra_, node, idx)); } + VectorRegister as_VectorRegister(PhaseRegAlloc *ra_, const Node *node) const { + return ::as_VectorRegister(reg(ra_, node)); + } + VectorRegister as_VectorRegister(PhaseRegAlloc *ra_, const Node *node, int idx) const { + return ::as_VectorRegister(reg(ra_, node, idx)); + } + VectorSRegister as_VectorSRegister(PhaseRegAlloc *ra_, const Node *node) const { + return ::as_VectorSRegister(reg(ra_, node)); + } + VectorSRegister as_VectorSRegister(PhaseRegAlloc *ra_, const Node *node, int idx) const { + return ::as_VectorSRegister(reg(ra_, node, idx)); + } #endif virtual intptr_t constant() const; diff --git a/src/hotspot/share/opto/type.cpp b/src/hotspot/share/opto/type.cpp index ce199a2abd7..08b56cd3d14 100644 --- a/src/hotspot/share/opto/type.cpp +++ b/src/hotspot/share/opto/type.cpp @@ -67,7 +67,13 @@ const Type::TypeInfo Type::_type_info[Type::lastype] = { { Bad, T_ILLEGAL, "vectorx:", false, 0, relocInfo::none }, // VectorX { Bad, T_ILLEGAL, "vectory:", false, 0, relocInfo::none }, // VectorY { Bad, T_ILLEGAL, "vectorz:", false, 0, relocInfo::none }, // VectorZ -#elif defined(PPC64) || defined(S390) +#elif defined(PPC64) + { Bad, T_ILLEGAL, "vectors:", false, 0, relocInfo::none }, // VectorS + { Bad, T_ILLEGAL, "vectord:", false, Op_RegL, relocInfo::none }, // VectorD + { Bad, T_ILLEGAL, "vectorx:", false, Op_VecX, relocInfo::none }, // VectorX + { Bad, T_ILLEGAL, "vectory:", false, 0, relocInfo::none }, // VectorY + { Bad, T_ILLEGAL, "vectorz:", false, 0, relocInfo::none }, // VectorZ +#elif defined(S390) { Bad, T_ILLEGAL, "vectors:", false, 0, relocInfo::none }, // VectorS { Bad, T_ILLEGAL, "vectord:", false, Op_RegL, relocInfo::none }, // VectorD { Bad, T_ILLEGAL, "vectorx:", false, 0, relocInfo::none }, // VectorX From febf1d80ea8b368e909792a343aee7fab133e59a Mon Sep 17 00:00:00 2001 From: Michihiro Horie Date: Wed, 4 Oct 2017 14:01:54 +0200 Subject: [PATCH 33/80] 8188757: PPC64: Disable VSR52-63 in ppc.ad Reviewed-by: mdoerr --- src/hotspot/cpu/ppc/assembler_ppc.inline.hpp | 20 ++-- src/hotspot/cpu/ppc/ppc.ad | 104 +++++++------------ 2 files changed, 48 insertions(+), 76 deletions(-) diff --git a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp index 1f1cfb4f2c6..da496abd5d7 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp @@ -759,20 +759,20 @@ inline void Assembler::lvsl( VectorRegister d, Register s1, Register s2) { emit inline void Assembler::lvsr( VectorRegister d, Register s1, Register s2) { emit_int32( LVSR_OPCODE | vrt(d) | ra0mem(s1) | rb(s2)); } // Vector-Scalar (VSX) instructions. -inline void Assembler::lxvd2x( VectorSRegister d, Register s1) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra(0) | rb(s1) | 1u); } -inline void Assembler::lxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra0mem(s1) | rb(s2) | 1u); } -inline void Assembler::stxvd2x( VectorSRegister d, Register s1) { emit_int32( STXVD2X_OPCODE | vsrs(d) | ra(0) | rb(s1) | 1u); } -inline void Assembler::stxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( STXVD2X_OPCODE | vsrs(d) | ra0mem(s1) | rb(s2) | 1u); } -inline void Assembler::mtvsrd( VectorSRegister d, Register a) { emit_int32( MTVSRD_OPCODE | vsrt(d) | ra(a) | 1u); } -inline void Assembler::mtvsrwz( VectorSRegister d, Register a) { emit_int32( MTVSRWZ_OPCODE | vsrt(d) | ra(a) | 1u); } -inline void Assembler::xxspltw( VectorSRegister d, VectorSRegister b, int ui2) { emit_int32( XXSPLTW_OPCODE | vsrt(d) | vsrb(b) | xxsplt_uim(uimm(ui2,2)) | 1u << 1 | 1u); } -inline void Assembler::xxlxor( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXLXOR_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | 1u << 2 | 1u << 1 | 1u); } -inline void Assembler::xxleqv( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXLEQV_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | 1u << 2 | 1u << 1 | 1u); } +inline void Assembler::lxvd2x( VectorSRegister d, Register s1) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra(0) | rb(s1)); } +inline void Assembler::lxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( LXVD2X_OPCODE | vsrt(d) | ra0mem(s1) | rb(s2)); } +inline void Assembler::stxvd2x( VectorSRegister d, Register s1) { emit_int32( STXVD2X_OPCODE | vsrs(d) | ra(0) | rb(s1)); } +inline void Assembler::stxvd2x( VectorSRegister d, Register s1, Register s2) { emit_int32( STXVD2X_OPCODE | vsrs(d) | ra0mem(s1) | rb(s2)); } +inline void Assembler::mtvsrd( VectorSRegister d, Register a) { emit_int32( MTVSRD_OPCODE | vsrt(d) | ra(a)); } +inline void Assembler::mtvsrwz( VectorSRegister d, Register a) { emit_int32( MTVSRWZ_OPCODE | vsrt(d) | ra(a)); } +inline void Assembler::xxspltw( VectorSRegister d, VectorSRegister b, int ui2) { emit_int32( XXSPLTW_OPCODE | vsrt(d) | vsrb(b) | xxsplt_uim(uimm(ui2,2))); } +inline void Assembler::xxlxor( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXLXOR_OPCODE | vsrt(d) | vsra(a) | vsrb(b)); } +inline void Assembler::xxleqv( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXLEQV_OPCODE | vsrt(d) | vsra(a) | vsrb(b)); } inline void Assembler::mtvrd( VectorRegister d, Register a) { emit_int32( MTVSRD_OPCODE | vsrt(d->to_vsr()) | ra(a)); } inline void Assembler::mfvrd( Register a, VectorRegister d) { emit_int32( MFVSRD_OPCODE | vsrt(d->to_vsr()) | ra(a)); } inline void Assembler::mtvrwz( VectorRegister d, Register a) { emit_int32( MTVSRWZ_OPCODE | vsrt(d->to_vsr()) | ra(a)); } inline void Assembler::mfvrwz( Register a, VectorRegister d) { emit_int32( MFVSRWZ_OPCODE | vsrt(d->to_vsr()) | ra(a)); } -inline void Assembler::xxpermdi(VectorSRegister d, VectorSRegister a, VectorSRegister b, int dm) { emit_int32( XXPERMDI_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | 0u << 10 | vsdm(dm) | 1u << 2 | 1u << 1 | 1u); } +inline void Assembler::xxpermdi(VectorSRegister d, VectorSRegister a, VectorSRegister b, int dm) { emit_int32( XXPERMDI_OPCODE | vsrt(d) | vsra(a) | vsrb(b) | vsdm(dm)); } inline void Assembler::xxmrghw( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXMRGHW_OPCODE | vsrt(d) | vsra(a) | vsrb(b)); } inline void Assembler::xxmrglw( VectorSRegister d, VectorSRegister a, VectorSRegister b) { emit_int32( XXMRGHW_OPCODE | vsrt(d) | vsra(a) | vsrb(b)); } diff --git a/src/hotspot/cpu/ppc/ppc.ad b/src/hotspot/cpu/ppc/ppc.ad index 68e7060f910..477aedf496f 100644 --- a/src/hotspot/cpu/ppc/ppc.ad +++ b/src/hotspot/cpu/ppc/ppc.ad @@ -903,71 +903,43 @@ reg_class dbl_reg( F31, F31_H // nv! ); -// Class for all 128bit vector registers -reg_class vectorx_reg(VSR0, - VSR1, - VSR2, - VSR3, - VSR4, - VSR5, - VSR6, - VSR7, - VSR8, - VSR9, - VSR10, - VSR11, - VSR12, - VSR13, - VSR14, - VSR15, - VSR16, - VSR17, - VSR18, - VSR19, - VSR20, - VSR21, - VSR22, - VSR23, - VSR24, - VSR25, - VSR26, - VSR27, - VSR28, - VSR29, - VSR30, - VSR31, - VSR32, - VSR33, - VSR34, - VSR35, - VSR36, - VSR37, - VSR38, - VSR39, - VSR40, - VSR41, - VSR42, - VSR43, - VSR44, - VSR45, - VSR46, - VSR47, - VSR48, - VSR49, - VSR50, - VSR51, - VSR52, - VSR53, - VSR54, - VSR55, - VSR56, - VSR57, - VSR58, - VSR59, - VSR60, - VSR61, - VSR62, - VSR63 +// ---------------------------- +// Vector-Scalar Register Class +// ---------------------------- + +reg_class vs_reg( + VSR32, + VSR33, + VSR34, + VSR35, + VSR36, + VSR37, + VSR38, + VSR39, + VSR40, + VSR41, + VSR42, + VSR43, + VSR44, + VSR45, + VSR46, + VSR47, + VSR48, + VSR49, + VSR50, + VSR51 +// VSR52, // nv! +// VSR53, // nv! +// VSR54, // nv! +// VSR55, // nv! +// VSR56, // nv! +// VSR57, // nv! +// VSR58, // nv! +// VSR59, // nv! +// VSR60, // nv! +// VSR61, // nv! +// VSR62, // nv! +// VSR63 // nv! ); %} @@ -4206,7 +4178,7 @@ ins_attrib ins_field_load_ic_node(0); // Formats are generated automatically for constants and base registers. operand vecX() %{ - constraint(ALLOC_IN_RC(vectorx_reg)); + constraint(ALLOC_IN_RC(vs_reg)); match(VecX); format %{ %} From bdb303aa4230d84360727f6b640ff56512aea7d4 Mon Sep 17 00:00:00 2001 From: Lutz Schmidt Date: Wed, 4 Oct 2017 14:25:53 +0200 Subject: [PATCH 34/80] 8187969: [s390] z/Architecture Vector Facility Support. Part II Reviewed-by: mdoerr --- src/hotspot/cpu/s390/assembler_s390.hpp | 61 ++++++++-- .../cpu/s390/assembler_s390.inline.hpp | 107 +++++++++++------- 2 files changed, 119 insertions(+), 49 deletions(-) diff --git a/src/hotspot/cpu/s390/assembler_s390.hpp b/src/hotspot/cpu/s390/assembler_s390.hpp index 6e2820ce980..7b431307458 100644 --- a/src/hotspot/cpu/s390/assembler_s390.hpp +++ b/src/hotspot/cpu/s390/assembler_s390.hpp @@ -1276,6 +1276,13 @@ class Assembler : public AbstractAssembler { // Test under Mask #define VTM_ZOPC (unsigned long)(0xe7L << 40 | 0xd8L << 0) // Like TM, set CC according to state of selected bits. +//---< Vector String Instructions >--- +#define VFAE_ZOPC (unsigned long)(0xe7L << 40 | 0x82L << 0) // Find any element +#define VFEE_ZOPC (unsigned long)(0xe7L << 40 | 0x80L << 0) // Find element equal +#define VFENE_ZOPC (unsigned long)(0xe7L << 40 | 0x81L << 0) // Find element not equal +#define VSTRC_ZOPC (unsigned long)(0xe7L << 40 | 0x8aL << 0) // String range compare +#define VISTR_ZOPC (unsigned long)(0xe7L << 40 | 0x5cL << 0) // Isolate String + //-------------------------------- //-- Miscellaneous Operations -- @@ -1475,10 +1482,18 @@ class Assembler : public AbstractAssembler { VRET_QW = 4 }; - // Vector Operation Condition Code Control. - enum VOpCCC { - VOP_CCIGN = 0, // ignore, don't set CC - VOP_CCSET = 1 // set the CC + // Vector Operation Result Control. + // This is a set of flags used in some vector instructions to control + // the result (side) effects of instruction execution. + enum VOpRC { + VOPRC_CCSET = 0b0001, // set the CC. + VOPRC_CCIGN = 0b0000, // ignore, don't set CC. + VOPRC_ZS = 0b0010, // Zero Search. Additional, elementwise, comparison against zero. + VOPRC_NOZS = 0b0000, // No Zero Search. + VOPRC_RTBYTEIX = 0b0100, // generate byte index to lowest element with true comparison. + VOPRC_RTBITVEC = 0b0000, // generate bit vector, all 1s for true, all 0s for false element comparisons. + VOPRC_INVERT = 0b1000, // invert comparison results. + VOPRC_NOINVERT = 0b0000 // use comparison results as is, do not invert. }; // Inverse condition code, i.e. determine "15 - cc" for a given condition code cc. @@ -1625,10 +1640,15 @@ class Assembler : public AbstractAssembler { return uimm4(ix, pos, 48); } - // Vector Operation Condition Code Control. 4-bit field, one bit of which indicates if the condition code is to be set by the operation. - static int64_t vccc_mask(int64_t flag, int pos) { - assert((flag == VOP_CCIGN) || (flag == VOP_CCSET), "VCCC flag value out of range"); - return uimm4(flag, pos, 48); + // Vector Operation Result Control. 4-bit field. + static int64_t voprc_any(int64_t flags, int pos, int64_t allowed_flags = 0b1111) { + assert((flags & allowed_flags) == flags, "Invalid VOPRC_* flag combination: %d", (int)flags); + return uimm4(flags, pos, 48); + } + + // Vector Operation Result Control. Condition code setting. + static int64_t voprc_ccmask(int64_t flags, int pos) { + return voprc_any(flags, pos, VOPRC_CCIGN | VOPRC_CCSET); } public: @@ -2772,6 +2792,31 @@ class Assembler : public AbstractAssembler { // Test under Mask inline void z_vtm( VectorRegister v1, VectorRegister v2); + //---< Vector String Instructions >--- + inline void z_vfae( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t cc5); // Find any element + inline void z_vfaeb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfaeh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfaef( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfee( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t cc5); // Find element equal + inline void z_vfeeb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfeeh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfeef( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfene( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t cc5); // Find element not equal + inline void z_vfeneb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfeneh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vfenef( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5); + inline void z_vstrc( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t imm5, int64_t cc6); // String range compare + inline void z_vstrcb( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t cc6); + inline void z_vstrch( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t cc6); + inline void z_vstrcf( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t cc6); + inline void z_vistr( VectorRegister v1, VectorRegister v2, int64_t imm3, int64_t cc5); // Isolate String + inline void z_vistrb( VectorRegister v1, VectorRegister v2, int64_t cc5); + inline void z_vistrh( VectorRegister v1, VectorRegister v2, int64_t cc5); + inline void z_vistrf( VectorRegister v1, VectorRegister v2, int64_t cc5); + inline void z_vistrbs(VectorRegister v1, VectorRegister v2); + inline void z_vistrhs(VectorRegister v1, VectorRegister v2); + inline void z_vistrfs(VectorRegister v1, VectorRegister v2); + // Floatingpoint instructions // ========================== diff --git a/src/hotspot/cpu/s390/assembler_s390.inline.hpp b/src/hotspot/cpu/s390/assembler_s390.inline.hpp index a9d4c078b38..bfa4646a42a 100644 --- a/src/hotspot/cpu/s390/assembler_s390.inline.hpp +++ b/src/hotspot/cpu/s390/assembler_s390.inline.hpp @@ -762,21 +762,21 @@ inline void Assembler::z_vpkh( VectorRegister v1, VectorRegister v2, VectorReg inline void Assembler::z_vpkf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpk(v1, v2, v3, VRET_FW); } // vector element type 'F' inline void Assembler::z_vpkg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpk(v1, v2, v3, VRET_DW); } // vector element type 'G' -inline void Assembler::z_vpks( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VPKS_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_DW, 32) | vccc_mask(cc5, 24)); } -inline void Assembler::z_vpksh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC -inline void Assembler::z_vpksf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC -inline void Assembler::z_vpksg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC -inline void Assembler::z_vpkshs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', set CC -inline void Assembler::z_vpksfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', set CC -inline void Assembler::z_vpksgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', set CC +inline void Assembler::z_vpks( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VPKS_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_DW, 32) | voprc_ccmask(cc5, 24)); } +inline void Assembler::z_vpksh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_HW, VOPRC_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vpksf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_FW, VOPRC_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vpksg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_DW, VOPRC_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vpkshs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_HW, VOPRC_CCSET); } // vector element type 'H', set CC +inline void Assembler::z_vpksfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_FW, VOPRC_CCSET); } // vector element type 'F', set CC +inline void Assembler::z_vpksgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpks(v1, v2, v3, VRET_DW, VOPRC_CCSET); } // vector element type 'G', set CC -inline void Assembler::z_vpkls( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VPKLS_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_DW, 32) | vccc_mask(cc5, 24)); } -inline void Assembler::z_vpklsh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC -inline void Assembler::z_vpklsf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC -inline void Assembler::z_vpklsg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC -inline void Assembler::z_vpklshs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', set CC -inline void Assembler::z_vpklsfs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', set CC -inline void Assembler::z_vpklsgs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', set CC +inline void Assembler::z_vpkls( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VPKLS_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_HW, VRET_DW, 32) | voprc_ccmask(cc5, 24)); } +inline void Assembler::z_vpklsh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_HW, VOPRC_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vpklsf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_FW, VOPRC_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vpklsg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_DW, VOPRC_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vpklshs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_HW, VOPRC_CCSET); } // vector element type 'H', set CC +inline void Assembler::z_vpklsfs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_FW, VOPRC_CCSET); } // vector element type 'F', set CC +inline void Assembler::z_vpklsgs(VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vpkls(v1, v2, v3, VRET_DW, VOPRC_CCSET); } // vector element type 'G', set CC // vector register unpack (sign-extended) inline void Assembler::z_vuph( VectorRegister v1, VectorRegister v2, int64_t m3) {emit_48(VUPH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(m3, VRET_BYTE, VRET_FW, 32)); } @@ -967,33 +967,33 @@ inline void Assembler::z_vno( VectorRegister v1, VectorRegister v2, VectorReg inline void Assembler::z_vo( VectorRegister v1, VectorRegister v2, VectorRegister v3) {emit_48(VO_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16)); } // Comparison (element-wise) -inline void Assembler::z_vceq( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCEQ_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | vccc_mask(cc5, 24)); } -inline void Assembler::z_vceqb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_BYTE, VOP_CCIGN); } // vector element type 'B', don't set CC -inline void Assembler::z_vceqh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC -inline void Assembler::z_vceqf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC -inline void Assembler::z_vceqg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC -inline void Assembler::z_vceqbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_BYTE, VOP_CCSET); } // vector element type 'B', don't set CC -inline void Assembler::z_vceqhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', don't set CC -inline void Assembler::z_vceqfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', don't set CC -inline void Assembler::z_vceqgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', don't set CC -inline void Assembler::z_vch( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | vccc_mask(cc5, 24)); } -inline void Assembler::z_vchb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_BYTE, VOP_CCIGN); } // vector element type 'B', don't set CC -inline void Assembler::z_vchh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC -inline void Assembler::z_vchf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC -inline void Assembler::z_vchg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC -inline void Assembler::z_vchbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_BYTE, VOP_CCSET); } // vector element type 'B', don't set CC -inline void Assembler::z_vchhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', don't set CC -inline void Assembler::z_vchfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', don't set CC -inline void Assembler::z_vchgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', don't set CC -inline void Assembler::z_vchl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCHL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | vccc_mask(cc5, 24)); } -inline void Assembler::z_vchlb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_BYTE, VOP_CCIGN); } // vector element type 'B', don't set CC -inline void Assembler::z_vchlh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_HW, VOP_CCIGN); } // vector element type 'H', don't set CC -inline void Assembler::z_vchlf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_FW, VOP_CCIGN); } // vector element type 'F', don't set CC -inline void Assembler::z_vchlg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_DW, VOP_CCIGN); } // vector element type 'G', don't set CC -inline void Assembler::z_vchlbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_BYTE, VOP_CCSET); } // vector element type 'B', don't set CC -inline void Assembler::z_vchlhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_HW, VOP_CCSET); } // vector element type 'H', don't set CC -inline void Assembler::z_vchlfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_FW, VOP_CCSET); } // vector element type 'F', don't set CC -inline void Assembler::z_vchlgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_DW, VOP_CCSET); } // vector element type 'G', don't set CC +inline void Assembler::z_vceq( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCEQ_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | voprc_ccmask(cc5, 24)); } +inline void Assembler::z_vceqb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_BYTE, VOPRC_CCIGN); } // vector element type 'B', don't set CC +inline void Assembler::z_vceqh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_HW, VOPRC_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vceqf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_FW, VOPRC_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vceqg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_DW, VOPRC_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vceqbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_BYTE, VOPRC_CCSET); } // vector element type 'B', don't set CC +inline void Assembler::z_vceqhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_HW, VOPRC_CCSET); } // vector element type 'H', don't set CC +inline void Assembler::z_vceqfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_FW, VOPRC_CCSET); } // vector element type 'F', don't set CC +inline void Assembler::z_vceqgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vceq(v1, v2, v3, VRET_DW, VOPRC_CCSET); } // vector element type 'G', don't set CC +inline void Assembler::z_vch( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCH_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | voprc_ccmask(cc5, 24)); } +inline void Assembler::z_vchb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_BYTE, VOPRC_CCIGN); } // vector element type 'B', don't set CC +inline void Assembler::z_vchh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_HW, VOPRC_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vchf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_FW, VOPRC_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vchg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_DW, VOPRC_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vchbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_BYTE, VOPRC_CCSET); } // vector element type 'B', don't set CC +inline void Assembler::z_vchhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_HW, VOPRC_CCSET); } // vector element type 'H', don't set CC +inline void Assembler::z_vchfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_FW, VOPRC_CCSET); } // vector element type 'F', don't set CC +inline void Assembler::z_vchgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vch(v1, v2, v3, VRET_DW, VOPRC_CCSET); } // vector element type 'G', don't set CC +inline void Assembler::z_vchl( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4, int64_t cc5) {emit_48(VCHL_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32) | voprc_ccmask(cc5, 24)); } +inline void Assembler::z_vchlb( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_BYTE, VOPRC_CCIGN); } // vector element type 'B', don't set CC +inline void Assembler::z_vchlh( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_HW, VOPRC_CCIGN); } // vector element type 'H', don't set CC +inline void Assembler::z_vchlf( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_FW, VOPRC_CCIGN); } // vector element type 'F', don't set CC +inline void Assembler::z_vchlg( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_DW, VOPRC_CCIGN); } // vector element type 'G', don't set CC +inline void Assembler::z_vchlbs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_BYTE, VOPRC_CCSET); } // vector element type 'B', don't set CC +inline void Assembler::z_vchlhs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_HW, VOPRC_CCSET); } // vector element type 'H', don't set CC +inline void Assembler::z_vchlfs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_FW, VOPRC_CCSET); } // vector element type 'F', don't set CC +inline void Assembler::z_vchlgs( VectorRegister v1, VectorRegister v2, VectorRegister v3) {z_vchl(v1, v2, v3, VRET_DW, VOPRC_CCSET); } // vector element type 'G', don't set CC // Max/Min (element-wise) inline void Assembler::z_vmx( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t m4) {emit_48(VMX_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(m4, VRET_BYTE, VRET_DW, 32)); } @@ -1091,6 +1091,31 @@ inline void Assembler::z_vsrlb( VectorRegister v1, VectorRegister v2, VectorReg // Test under Mask inline void Assembler::z_vtm( VectorRegister v1, VectorRegister v2) {emit_48(VTM_ZOPC | vreg(v1, 8) | vreg(v2, 12)); } +//---< Vector String Instructions >--- +inline void Assembler::z_vfae( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t cc5) {emit_48(VFAE_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(imm4, VRET_BYTE, VRET_FW, 32) | voprc_any(cc5, 24) ); } // Find any element +inline void Assembler::z_vfaeb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfae(v1, v2, v3, VRET_BYTE, cc5); } +inline void Assembler::z_vfaeh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfae(v1, v2, v3, VRET_HW, cc5); } +inline void Assembler::z_vfaef( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfae(v1, v2, v3, VRET_FW, cc5); } +inline void Assembler::z_vfee( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t cc5) {emit_48(VFEE_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(imm4, VRET_BYTE, VRET_FW, 32) | voprc_any(cc5, 24) ); } // Find element equal +inline void Assembler::z_vfeeb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfee(v1, v2, v3, VRET_BYTE, cc5); } +inline void Assembler::z_vfeeh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfee(v1, v2, v3, VRET_HW, cc5); } +inline void Assembler::z_vfeef( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfee(v1, v2, v3, VRET_FW, cc5); } +inline void Assembler::z_vfene( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t imm4, int64_t cc5) {emit_48(VFENE_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vesc_mask(imm4, VRET_BYTE, VRET_FW, 32) | voprc_any(cc5, 24) ); } // Find element not equal +inline void Assembler::z_vfeneb( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfene(v1, v2, v3, VRET_BYTE, cc5); } +inline void Assembler::z_vfeneh( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfene(v1, v2, v3, VRET_HW, cc5); } +inline void Assembler::z_vfenef( VectorRegister v1, VectorRegister v2, VectorRegister v3, int64_t cc5) {z_vfene(v1, v2, v3, VRET_FW, cc5); } +inline void Assembler::z_vstrc( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t imm5, int64_t cc6) {emit_48(VSTRC_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vreg(v3, 16) | vreg(v4, 32) | vesc_mask(imm5, VRET_BYTE, VRET_FW, 20) | voprc_any(cc6, 24) ); } // String range compare +inline void Assembler::z_vstrcb( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t cc6) {z_vstrc(v1, v2, v3, v4, VRET_BYTE, cc6); } +inline void Assembler::z_vstrch( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t cc6) {z_vstrc(v1, v2, v3, v4, VRET_HW, cc6); } +inline void Assembler::z_vstrcf( VectorRegister v1, VectorRegister v2, VectorRegister v3, VectorRegister v4, int64_t cc6) {z_vstrc(v1, v2, v3, v4, VRET_FW, cc6); } +inline void Assembler::z_vistr( VectorRegister v1, VectorRegister v2, int64_t imm3, int64_t cc5) {emit_48(VISTR_ZOPC | vreg(v1, 8) | vreg(v2, 12) | vesc_mask(imm3, VRET_BYTE, VRET_FW, 32) | voprc_any(cc5, 24) ); } // isolate string +inline void Assembler::z_vistrb( VectorRegister v1, VectorRegister v2, int64_t cc5) {z_vistr(v1, v2, VRET_BYTE, cc5); } +inline void Assembler::z_vistrh( VectorRegister v1, VectorRegister v2, int64_t cc5) {z_vistr(v1, v2, VRET_HW, cc5); } +inline void Assembler::z_vistrf( VectorRegister v1, VectorRegister v2, int64_t cc5) {z_vistr(v1, v2, VRET_FW, cc5); } +inline void Assembler::z_vistrbs(VectorRegister v1, VectorRegister v2) {z_vistr(v1, v2, VRET_BYTE, VOPRC_CCSET); } +inline void Assembler::z_vistrhs(VectorRegister v1, VectorRegister v2) {z_vistr(v1, v2, VRET_HW, VOPRC_CCSET); } +inline void Assembler::z_vistrfs(VectorRegister v1, VectorRegister v2) {z_vistr(v1, v2, VRET_FW, VOPRC_CCSET); } + //------------------------------- // FLOAT INSTRUCTIONS From f651176392eec1e776f6e047309d59ec16358a5a Mon Sep 17 00:00:00 2001 From: Martin Doerr Date: Wed, 4 Oct 2017 16:44:45 +0200 Subject: [PATCH 35/80] 8188773: PPC64 and s390: Fix UseMembar and enable ShareVtableStubs Reviewed-by: goetz --- src/hotspot/cpu/ppc/globals_ppc.hpp | 2 +- src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp | 6 ------ src/hotspot/cpu/ppc/templateInterpreterGenerator_ppc.cpp | 7 ------- src/hotspot/cpu/s390/globals_s390.hpp | 6 +++--- src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp | 6 +++--- 5 files changed, 7 insertions(+), 20 deletions(-) diff --git a/src/hotspot/cpu/ppc/globals_ppc.hpp b/src/hotspot/cpu/ppc/globals_ppc.hpp index 0bc041e9188..56232e2ae30 100644 --- a/src/hotspot/cpu/ppc/globals_ppc.hpp +++ b/src/hotspot/cpu/ppc/globals_ppc.hpp @@ -32,7 +32,7 @@ // Sets the default values for platform dependent flags used by the runtime system. // (see globals.hpp) -define_pd_global(bool, ShareVtableStubs, false); // Improves performance markedly for mtrt and compress. +define_pd_global(bool, ShareVtableStubs, true); define_pd_global(bool, NeedsDeoptSuspend, false); // Only register window machines need this. diff --git a/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp b/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp index 6c6649be948..f68058e237e 100644 --- a/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp +++ b/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp @@ -2238,9 +2238,6 @@ nmethod *SharedRuntime::generate_native_wrapper(MacroAssembler *masm, __ release(); // TODO: PPC port assert(4 == JavaThread::sz_thread_state(), "unexpected field size"); __ stw(R0, thread_(thread_state)); - if (UseMembar) { - __ fence(); - } // The JNI call @@ -2397,9 +2394,6 @@ nmethod *SharedRuntime::generate_native_wrapper(MacroAssembler *masm, __ release(); // TODO: PPC port assert(4 == JavaThread::sz_thread_state(), "unexpected field size"); __ stw(R0, thread_(thread_state)); - if (UseMembar) { - __ fence(); - } __ bind(after_transition); // Reguard any pages if necessary. diff --git a/src/hotspot/cpu/ppc/templateInterpreterGenerator_ppc.cpp b/src/hotspot/cpu/ppc/templateInterpreterGenerator_ppc.cpp index 32e25e9038c..2216890dd6b 100644 --- a/src/hotspot/cpu/ppc/templateInterpreterGenerator_ppc.cpp +++ b/src/hotspot/cpu/ppc/templateInterpreterGenerator_ppc.cpp @@ -1470,10 +1470,6 @@ address TemplateInterpreterGenerator::generate_native_entry(bool synchronized) { // TODO PPC port assert(4 == JavaThread::sz_thread_state(), "unexpected field size"); __ stw(R0, thread_(thread_state)); - if (UseMembar) { - __ fence(); - } - //============================================================================= // Call the native method. Argument registers must not have been // overwritten since "__ call_stub(signature_handler);" (except for @@ -1594,9 +1590,6 @@ address TemplateInterpreterGenerator::generate_native_entry(bool synchronized) { __ li(R0/*thread_state*/, _thread_in_Java); __ release(); __ stw(R0/*thread_state*/, thread_(thread_state)); - if (UseMembar) { - __ fence(); - } if (CheckJNICalls) { // clear_pending_jni_exception_check diff --git a/src/hotspot/cpu/s390/globals_s390.hpp b/src/hotspot/cpu/s390/globals_s390.hpp index cb5adff3ef5..fef2dbec99b 100644 --- a/src/hotspot/cpu/s390/globals_s390.hpp +++ b/src/hotspot/cpu/s390/globals_s390.hpp @@ -1,6 +1,6 @@ /* - * Copyright (c) 2016, Oracle and/or its affiliates. All rights reserved. - * Copyright (c) 2016 SAP SE. All rights reserved. + * Copyright (c) 2016, 2017 Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -34,7 +34,7 @@ // Sorted according to sparc. // z/Architecture remembers branch targets, so don't share vtables. -define_pd_global(bool, ShareVtableStubs, false); +define_pd_global(bool, ShareVtableStubs, true); define_pd_global(bool, NeedsDeoptSuspend, false); // Only register window machines need this. define_pd_global(bool, ImplicitNullChecks, true); // Generate code for implicit null checks. diff --git a/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp b/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp index fa53de045d0..f7ab305f709 100644 --- a/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp +++ b/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp @@ -1,6 +1,6 @@ /* - * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. - * Copyright (c) 2016 SAP SE. All rights reserved. + * Copyright (c) 2016, 2017, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2016, 2017 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -471,7 +471,7 @@ JVM_handle_linux_signal(int sig, // Info->si_addr need not be the exact address, it is only // guaranteed to be on the same page as the address that caused // the SIGSEGV. - if ((sig == SIGSEGV) && + if ((sig == SIGSEGV) && !UseMembar && (os::get_memory_serialize_page() == (address)((uintptr_t)info->si_addr & ~(os::vm_page_size()-1)))) { return true; From 949f6779574366a2415e2de2a91fba14835c7c19 Mon Sep 17 00:00:00 2001 From: Dmitrij Pochepko Date: Wed, 4 Oct 2017 11:52:07 -0700 Subject: [PATCH 36/80] 8187684: Intrinsify Math.multiplyHigh(long, long) Reviewed-by: kvn, aph, lucy --- src/hotspot/share/classfile/vmSymbols.hpp | 2 ++ src/hotspot/share/opto/c2compiler.cpp | 3 +++ src/hotspot/share/opto/library_call.cpp | 7 +++++++ src/java.base/share/classes/java/lang/Math.java | 1 + 4 files changed, 13 insertions(+) diff --git a/src/hotspot/share/classfile/vmSymbols.hpp b/src/hotspot/share/classfile/vmSymbols.hpp index 9551124f7df..65001d4cce9 100644 --- a/src/hotspot/share/classfile/vmSymbols.hpp +++ b/src/hotspot/share/classfile/vmSymbols.hpp @@ -781,6 +781,7 @@ do_name(decrementExact_name,"decrementExact") \ do_name(incrementExact_name,"incrementExact") \ do_name(multiplyExact_name,"multiplyExact") \ + do_name(multiplyHigh_name,"multiplyHigh") \ do_name(negateExact_name,"negateExact") \ do_name(subtractExact_name,"subtractExact") \ do_name(fma_name, "fma") \ @@ -805,6 +806,7 @@ do_intrinsic(_incrementExactL, java_lang_Math, incrementExact_name, long_long_signature, F_S) \ do_intrinsic(_multiplyExactI, java_lang_Math, multiplyExact_name, int2_int_signature, F_S) \ do_intrinsic(_multiplyExactL, java_lang_Math, multiplyExact_name, long2_long_signature, F_S) \ + do_intrinsic(_multiplyHigh, java_lang_Math, multiplyHigh_name, long2_long_signature, F_S) \ do_intrinsic(_negateExactI, java_lang_Math, negateExact_name, int_int_signature, F_S) \ do_intrinsic(_negateExactL, java_lang_Math, negateExact_name, long_long_signature, F_S) \ do_intrinsic(_subtractExactI, java_lang_Math, subtractExact_name, int2_int_signature, F_S) \ diff --git a/src/hotspot/share/opto/c2compiler.cpp b/src/hotspot/share/opto/c2compiler.cpp index 9f823784824..7170a0bee93 100644 --- a/src/hotspot/share/opto/c2compiler.cpp +++ b/src/hotspot/share/opto/c2compiler.cpp @@ -410,6 +410,9 @@ bool C2Compiler::is_intrinsic_supported(const methodHandle& method, bool is_virt case vmIntrinsics::_multiplyExactL: if (!Matcher::match_rule_supported(Op_OverflowMulL)) return false; break; + case vmIntrinsics::_multiplyHigh: + if (!Matcher::match_rule_supported(Op_MulHiL)) return false; + break; case vmIntrinsics::_getCallerClass: if (SystemDictionary::reflect_CallerSensitive_klass() == NULL) return false; break; diff --git a/src/hotspot/share/opto/library_call.cpp b/src/hotspot/share/opto/library_call.cpp index 5de3c62b3aa..bb4ed6cef8e 100644 --- a/src/hotspot/share/opto/library_call.cpp +++ b/src/hotspot/share/opto/library_call.cpp @@ -231,6 +231,7 @@ class LibraryCallKit : public GraphKit { bool inline_math_addExactL(bool is_increment); bool inline_math_multiplyExactI(); bool inline_math_multiplyExactL(); + bool inline_math_multiplyHigh(); bool inline_math_negateExactI(); bool inline_math_negateExactL(); bool inline_math_subtractExactI(bool is_decrement); @@ -549,6 +550,7 @@ bool LibraryCallKit::try_to_inline(int predicate) { case vmIntrinsics::_incrementExactL: return inline_math_addExactL(true /* increment */); case vmIntrinsics::_multiplyExactI: return inline_math_multiplyExactI(); case vmIntrinsics::_multiplyExactL: return inline_math_multiplyExactL(); + case vmIntrinsics::_multiplyHigh: return inline_math_multiplyHigh(); case vmIntrinsics::_negateExactI: return inline_math_negateExactI(); case vmIntrinsics::_negateExactL: return inline_math_negateExactL(); case vmIntrinsics::_subtractExactI: return inline_math_subtractExactI(false /* subtract */); @@ -1897,6 +1899,11 @@ bool LibraryCallKit::inline_math_multiplyExactL() { return inline_math_overflow(argument(0), argument(2)); } +bool LibraryCallKit::inline_math_multiplyHigh() { + set_result(_gvn.transform(new MulHiLNode(argument(0), argument(2)))); + return true; +} + Node* LibraryCallKit::generate_min_max(vmIntrinsics::ID id, Node* x0, Node* y0) { // These are the candidate return value: diff --git a/src/java.base/share/classes/java/lang/Math.java b/src/java.base/share/classes/java/lang/Math.java index 14093908c6e..dffce353746 100644 --- a/src/java.base/share/classes/java/lang/Math.java +++ b/src/java.base/share/classes/java/lang/Math.java @@ -1094,6 +1094,7 @@ public final class Math { * @return the result * @since 9 */ + @HotSpotIntrinsicCandidate public static long multiplyHigh(long x, long y) { if (x < 0 || y < 0) { // Use technique from section 8-2 of Henry S. Warren, Jr., From 844e594fec72d9d55896992af962e39c4895207c Mon Sep 17 00:00:00 2001 From: Roland Westrelin Date: Wed, 27 Sep 2017 16:17:47 +0200 Subject: [PATCH 37/80] 8187822: C2 conditonal move optimization might create broken graph Reviewed-by: kvn --- src/hotspot/share/opto/loopopts.cpp | 24 ++++--- .../loopopts/TestCMovSplitThruPhi.java | 67 +++++++++++++++++++ 2 files changed, 82 insertions(+), 9 deletions(-) create mode 100644 test/hotspot/jtreg/compiler/loopopts/TestCMovSplitThruPhi.java diff --git a/src/hotspot/share/opto/loopopts.cpp b/src/hotspot/share/opto/loopopts.cpp index 06818e71e3a..8bbb2c45e8d 100644 --- a/src/hotspot/share/opto/loopopts.cpp +++ b/src/hotspot/share/opto/loopopts.cpp @@ -311,6 +311,7 @@ Node *PhaseIdealLoop::has_local_phi_input( Node *n ) { } return NULL; } + assert(m->is_Phi() || is_dominator(get_ctrl(m), n_ctrl), "m has strange control"); } return n_ctrl; @@ -615,6 +616,7 @@ Node *PhaseIdealLoop::conditional_move( Node *region ) { // Now replace all Phis with CMOV's Node *cmov_ctrl = iff->in(0); uint flip = (lp->Opcode() == Op_IfTrue); + Node_List wq; while (1) { PhiNode* phi = NULL; for (DUIterator_Fast imax, i = region->fast_outs(imax); i < imax; i++) { @@ -627,17 +629,21 @@ Node *PhaseIdealLoop::conditional_move( Node *region ) { if (phi == NULL) break; if (PrintOpto && VerifyLoopOptimizations) { tty->print_cr("CMOV"); } // Move speculative ops - for (uint j = 1; j < region->req(); j++) { - Node *proj = region->in(j); - Node *inp = phi->in(j); - if (get_ctrl(inp) == proj) { // Found local op + wq.push(phi); + while (wq.size() > 0) { + Node *n = wq.pop(); + for (uint j = 1; j < n->req(); j++) { + Node* m = n->in(j); + if (m != NULL && !is_dominator(get_ctrl(m), cmov_ctrl)) { #ifndef PRODUCT - if (PrintOpto && VerifyLoopOptimizations) { - tty->print(" speculate: "); - inp->dump(); - } + if (PrintOpto && VerifyLoopOptimizations) { + tty->print(" speculate: "); + m->dump(); + } #endif - set_ctrl(inp, cmov_ctrl); + set_ctrl(m, cmov_ctrl); + wq.push(m); + } } } Node *cmov = CMoveNode::make(cmov_ctrl, iff->in(1), phi->in(1+flip), phi->in(2-flip), _igvn.type(phi)); diff --git a/test/hotspot/jtreg/compiler/loopopts/TestCMovSplitThruPhi.java b/test/hotspot/jtreg/compiler/loopopts/TestCMovSplitThruPhi.java new file mode 100644 index 00000000000..03df3c0b810 --- /dev/null +++ b/test/hotspot/jtreg/compiler/loopopts/TestCMovSplitThruPhi.java @@ -0,0 +1,67 @@ +/* + * Copyright (c) 2017, Red Hat, Inc. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/** + * @test + * @bug 8187822 + * @summary C2 conditonal move optimization might create broken graph + * @run main/othervm -XX:-UseOnStackReplacement -XX:-BackgroundCompilation -XX:CompileCommand=dontinline,TestCMovSplitThruPhi::not_inlined -XX:CompileOnly=TestCMovSplitThruPhi::test -XX:-LoopUnswitching TestCMovSplitThruPhi + * + */ + +public class TestCMovSplitThruPhi { + static int f; + + static int test(boolean flag1, boolean flag2, boolean flag3, boolean flag4) { + int v3 = 0; + if (flag4) { + for (int i = 0; i < 10; i++) { + int v1 = 0; + if (flag1) { + v1 = not_inlined(); + } + // AddI below will be candidate for split through Phi + int v2 = v1; + if (flag2) { + v2 = f + v1; + } + // test above will be converted to CMovI + if (flag3) { + v3 = v2 * 2; + break; + } + } + } + return v3; + } + + private static int not_inlined() { + return 0; + } + + public static void main(String[] args) { + for (int i = 0; i < 20000; i++) { + test((i % 2) == 0, (i % 2) == 0, (i % 100) == 1, (i % 1000) == 1); + } + } +} From 2990ce80127aa7a9db90090a93b64f586b2b2c36 Mon Sep 17 00:00:00 2001 From: Zhongwei Yao Date: Wed, 20 Sep 2017 18:30:32 +0800 Subject: [PATCH 38/80] 8187601: Unrolling more when SLP auto-vectorization failed Reviewed-by: kvn --- src/hotspot/share/opto/loopTransform.cpp | 2 +- src/hotspot/share/opto/superword.cpp | 15 +++++++++++---- 2 files changed, 12 insertions(+), 5 deletions(-) diff --git a/src/hotspot/share/opto/loopTransform.cpp b/src/hotspot/share/opto/loopTransform.cpp index c00dda397db..4737a8ffe9e 100644 --- a/src/hotspot/share/opto/loopTransform.cpp +++ b/src/hotspot/share/opto/loopTransform.cpp @@ -666,7 +666,7 @@ bool IdealLoopTree::policy_unroll(PhaseIdealLoop *phase) { _local_loop_unroll_limit = LoopUnrollLimit; _local_loop_unroll_factor = 4; int future_unroll_ct = cl->unrolled_count() * 2; - if (!cl->do_unroll_only()) { + if (!cl->is_vectorized_loop()) { if (future_unroll_ct > LoopMaxUnroll) return false; } else { // obey user constraints on vector mapped loops with additional unrolling applied diff --git a/src/hotspot/share/opto/superword.cpp b/src/hotspot/share/opto/superword.cpp index bbc30e32b02..b35f9b1da67 100644 --- a/src/hotspot/share/opto/superword.cpp +++ b/src/hotspot/share/opto/superword.cpp @@ -145,6 +145,8 @@ void SuperWord::transform_loop(IdealLoopTree* lpt, bool do_optimization) { // Skip any loops already optimized by slp if (cl->is_vectorized_loop()) return; + if (cl->do_unroll_only()) return; + if (cl->is_main_loop()) { // Check for pre-loop ending with CountedLoopEnd(Bool(Cmp(x,Opaque1(limit)))) CountedLoopEndNode* pre_end = get_pre_loop_end(cl); @@ -2163,7 +2165,15 @@ void SuperWord::print_loop(bool whole) { //------------------------------output--------------------------- // Convert packs into vector node operations void SuperWord::output() { - if (_packset.length() == 0) return; + CountedLoopNode *cl = lpt()->_head->as_CountedLoop(); + Compile* C = _phase->C; + if (_packset.length() == 0) { + // Instigate more unrolling for optimization when vectorization fails. + C->set_major_progress(); + cl->set_notpassed_slp(); + cl->mark_do_unroll_only(); + return; + } #ifndef PRODUCT if (TraceLoopOpts) { @@ -2172,7 +2182,6 @@ void SuperWord::output() { } #endif - CountedLoopNode *cl = lpt()->_head->as_CountedLoop(); if (cl->is_main_loop()) { // MUST ENSURE main loop's initial value is properly aligned: // (iv_initial_value + min_iv_offset) % vector_width_in_bytes() == 0 @@ -2185,7 +2194,6 @@ void SuperWord::output() { } } - Compile* C = _phase->C; uint max_vlen_in_bytes = 0; uint max_vlen = 0; bool can_process_post_loop = (PostLoopMultiversioning && Matcher::has_predicated_vectors() && cl->is_post_loop()); @@ -4493,4 +4501,3 @@ bool SuperWord::hoist_loads_in_graph() { return true; } - From 8afe0e3b01c1294b8fd00ab00e971224fe66e86f Mon Sep 17 00:00:00 2001 From: Igor Ignatyev Date: Wed, 20 Sep 2017 20:53:22 -0700 Subject: [PATCH 39/80] 8188117: jdk/test/lib/FileInstaller doesn't work for directories Reviewed-by: mseledtsov, sspitsyn --- test/lib/jdk/test/lib/FileInstaller.java | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/test/lib/jdk/test/lib/FileInstaller.java b/test/lib/jdk/test/lib/FileInstaller.java index 1247deedcb1..5e16b315153 100644 --- a/test/lib/jdk/test/lib/FileInstaller.java +++ b/test/lib/jdk/test/lib/FileInstaller.java @@ -45,10 +45,12 @@ public class FileInstaller { if (args.length != 2) { throw new IllegalArgumentException("Unexpected number of arguments for file copy"); } - Path src = Paths.get(Utils.TEST_SRC, args[0]).toAbsolutePath(); - Path dst = Paths.get(args[1]).toAbsolutePath(); + Path src = Paths.get(Utils.TEST_SRC, args[0]).toAbsolutePath().normalize(); + Path dst = Paths.get(args[1]).toAbsolutePath().normalize(); if (src.toFile().exists()) { + System.out.printf("copying %s to %s%n", src, dst); if (src.toFile().isDirectory()) { + // can't use Files::copy for dirs, as 'dst' might exist already Files.walkFileTree(src, new CopyFileVisitor(src, dst)); } else { Path dstDir = dst.getParent(); @@ -74,7 +76,7 @@ public class FileInstaller { @Override public FileVisitResult preVisitDirectory(Path file, BasicFileAttributes attrs) throws IOException { - Path relativePath = file.relativize(copyFrom); + Path relativePath = copyFrom.relativize(file); Path destination = copyTo.resolve(relativePath); if (!destination.toFile().exists()) { Files.createDirectories(destination); From a17ce440a56a294c9f43f46cc50694f4b56d4727 Mon Sep 17 00:00:00 2001 From: Goetz Lindenmaier Date: Mon, 25 Sep 2017 08:43:43 +0200 Subject: [PATCH 40/80] 8187547: PPC64: icache invalidation is incorrect in some places Reviewed-by: mdoerr, goetz --- src/hotspot/cpu/ppc/macroAssembler_ppc.cpp | 8 +++--- src/hotspot/cpu/ppc/macroAssembler_ppc.hpp | 6 +++-- src/hotspot/cpu/ppc/nativeInst_ppc.cpp | 30 +++++++++++----------- 3 files changed, 23 insertions(+), 21 deletions(-) diff --git a/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp b/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp index 9ce7be54a84..bc34768dd70 100644 --- a/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp +++ b/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp @@ -129,7 +129,7 @@ void MacroAssembler::calculate_address_from_global_toc(Register dst, address add } } -int MacroAssembler::patch_calculate_address_from_global_toc_at(address a, address bound, address addr) { +address MacroAssembler::patch_calculate_address_from_global_toc_at(address a, address bound, address addr) { const int offset = MacroAssembler::offset_to_global_toc(addr); const address inst2_addr = a; @@ -155,7 +155,7 @@ int MacroAssembler::patch_calculate_address_from_global_toc_at(address a, addres assert(is_addis(inst1) && inv_ra_field(inst1) == 29 /* R29 */, "source must be global TOC"); set_imm((int *)inst1_addr, MacroAssembler::largeoffset_si16_si16_hi(offset)); set_imm((int *)inst2_addr, MacroAssembler::largeoffset_si16_si16_lo(offset)); - return (int)((intptr_t)addr - (intptr_t)inst1_addr); + return inst1_addr; } address MacroAssembler::get_address_of_calculate_address_from_global_toc_at(address a, address bound) { @@ -201,7 +201,7 @@ address MacroAssembler::get_address_of_calculate_address_from_global_toc_at(addr // clrldi rx = rx & 0xFFFFffff // clearMS32b, optional // ori rx = rx | const.lo // Clrldi will be passed by. -int MacroAssembler::patch_set_narrow_oop(address a, address bound, narrowOop data) { +address MacroAssembler::patch_set_narrow_oop(address a, address bound, narrowOop data) { assert(UseCompressedOops, "Should only patch compressed oops"); const address inst2_addr = a; @@ -227,7 +227,7 @@ int MacroAssembler::patch_set_narrow_oop(address a, address bound, narrowOop dat set_imm((int *)inst1_addr, (short)(xc)); // see enc_load_con_narrow_hi/_lo set_imm((int *)inst2_addr, (xd)); // unsigned int - return (int)((intptr_t)inst2_addr - (intptr_t)inst1_addr); + return inst1_addr; } // Get compressed oop or klass constant. diff --git a/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp b/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp index db04a3700e7..f096299538c 100644 --- a/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp +++ b/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp @@ -105,13 +105,15 @@ class MacroAssembler: public Assembler { }; inline static bool is_calculate_address_from_global_toc_at(address a, address bound); - static int patch_calculate_address_from_global_toc_at(address a, address addr, address bound); + // Returns address of first instruction in sequence. + static address patch_calculate_address_from_global_toc_at(address a, address bound, address addr); static address get_address_of_calculate_address_from_global_toc_at(address a, address addr); #ifdef _LP64 // Patch narrow oop constant. inline static bool is_set_narrow_oop(address a, address bound); - static int patch_set_narrow_oop(address a, address bound, narrowOop data); + // Returns address of first instruction in sequence. + static address patch_set_narrow_oop(address a, address bound, narrowOop data); static narrowOop get_narrow_oop(address a, address bound); #endif diff --git a/src/hotspot/cpu/ppc/nativeInst_ppc.cpp b/src/hotspot/cpu/ppc/nativeInst_ppc.cpp index 70cd4ebbd91..6d6128d416e 100644 --- a/src/hotspot/cpu/ppc/nativeInst_ppc.cpp +++ b/src/hotspot/cpu/ppc/nativeInst_ppc.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 1997, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved. * Copyright (c) 2012, 2015 SAP SE. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * @@ -221,13 +221,13 @@ address NativeMovConstReg::set_data_plain(intptr_t data, CodeBlob *cb) { // A calculation relative to the global TOC. if (MacroAssembler::get_address_of_calculate_address_from_global_toc_at(addr, cb->content_begin()) != (address)data) { - const int invalidated_range = - MacroAssembler::patch_calculate_address_from_global_toc_at(addr, cb->content_begin(), + const address inst2_addr = addr; + const address inst1_addr = + MacroAssembler::patch_calculate_address_from_global_toc_at(inst2_addr, cb->content_begin(), (address)data); - const address start = invalidated_range < 0 ? addr + invalidated_range : addr; - // FIXME: - const int range = invalidated_range < 0 ? 4 - invalidated_range : 8; - ICache::ppc64_flush_icache_bytes(start, range); + assert(inst1_addr != NULL && inst1_addr < inst2_addr, "first instruction must be found"); + const int range = inst2_addr - inst1_addr + BytesPerInstWord; + ICache::ppc64_flush_icache_bytes(inst1_addr, range); } next_address = addr + 1 * BytesPerInstWord; } else if (MacroAssembler::is_load_const_at(addr)) { @@ -288,15 +288,15 @@ void NativeMovConstReg::set_data(intptr_t data) { } void NativeMovConstReg::set_narrow_oop(narrowOop data, CodeBlob *code /* = NULL */) { - address addr = addr_at(0); + address inst2_addr = addr_at(0); CodeBlob* cb = (code) ? code : CodeCache::find_blob(instruction_address()); - if (MacroAssembler::get_narrow_oop(addr, cb->content_begin()) == (long)data) return; - const int invalidated_range = - MacroAssembler::patch_set_narrow_oop(addr, cb->content_begin(), (long)data); - const address start = invalidated_range < 0 ? addr + invalidated_range : addr; - // FIXME: - const int range = invalidated_range < 0 ? 4 - invalidated_range : 8; - ICache::ppc64_flush_icache_bytes(start, range); + if (MacroAssembler::get_narrow_oop(inst2_addr, cb->content_begin()) == (long)data) + return; + const address inst1_addr = + MacroAssembler::patch_set_narrow_oop(inst2_addr, cb->content_begin(), (long)data); + assert(inst1_addr != NULL && inst1_addr < inst2_addr, "first instruction must be found"); + const int range = inst2_addr - inst1_addr + BytesPerInstWord; + ICache::ppc64_flush_icache_bytes(inst1_addr, range); } // Do not use an assertion here. Let clients decide whether they only From 521c3ea430a134c7e446b63805fec78e310fb3e6 Mon Sep 17 00:00:00 2001 From: Gustavo Serra Scalet Date: Mon, 25 Sep 2017 09:37:43 +0200 Subject: [PATCH 41/80] 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics This implementation is based on the algorithm implemented in java. It yields a performance speedup of: JDK8: 23% JDK9: 5% JDK10: 5% Reviewed-by: mdoerr, goetz --- src/hotspot/cpu/ppc/assembler_ppc.hpp | 1 + src/hotspot/cpu/ppc/assembler_ppc.inline.hpp | 1 + src/hotspot/cpu/ppc/macroAssembler_ppc.cpp | 34 +++ src/hotspot/cpu/ppc/macroAssembler_ppc.hpp | 2 + src/hotspot/cpu/ppc/stubGenerator_ppc.cpp | 267 +++++++++++++++++++ src/hotspot/cpu/ppc/vm_version_ppc.cpp | 6 + 6 files changed, 311 insertions(+) diff --git a/src/hotspot/cpu/ppc/assembler_ppc.hpp b/src/hotspot/cpu/ppc/assembler_ppc.hpp index 26b77b8cbc3..176b911ffd3 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.hpp @@ -1308,6 +1308,7 @@ class Assembler : public AbstractAssembler { inline void li( Register d, int si16); inline void lis( Register d, int si16); inline void addir(Register d, int si16, Register a); + inline void subi( Register d, Register a, int si16); static bool is_addi(int x) { return ADDI_OPCODE == (x & ADDI_OPCODE_MASK); diff --git a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp index d21ffaf8fcb..b3a6b89d864 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp @@ -164,6 +164,7 @@ inline void Assembler::divwo_( Register d, Register a, Register b) { emit_int32 inline void Assembler::li( Register d, int si16) { Assembler::addi_r0ok( d, R0, si16); } inline void Assembler::lis( Register d, int si16) { Assembler::addis_r0ok(d, R0, si16); } inline void Assembler::addir(Register d, int si16, Register a) { Assembler::addi(d, a, si16); } +inline void Assembler::subi( Register d, Register a, int si16) { Assembler::addi(d, a, -si16); } // PPC 1, section 3.3.9, Fixed-Point Compare Instructions inline void Assembler::cmpi( ConditionRegister f, int l, Register a, int si16) { emit_int32( CMPI_OPCODE | bf(f) | l10(l) | ra(a) | simm(si16,16)); } diff --git a/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp b/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp index bc34768dd70..31dcfa7beba 100644 --- a/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp +++ b/src/hotspot/cpu/ppc/macroAssembler_ppc.cpp @@ -5234,6 +5234,40 @@ void MacroAssembler::multiply_128_x_128_loop(Register x_xstart, bind(L_post_third_loop_done); } // multiply_128_x_128_loop +void MacroAssembler::muladd(Register out, Register in, + Register offset, Register len, Register k, + Register tmp1, Register tmp2, Register carry) { + + // Labels + Label LOOP, SKIP; + + // Make sure length is positive. + cmpdi (CCR0, len, 0); + + // Prepare variables + subi (offset, offset, 4); + li (carry, 0); + ble (CCR0, SKIP); + + mtctr (len); + subi (len, len, 1 ); + sldi (len, len, 2 ); + + // Main loop + bind(LOOP); + lwzx (tmp1, len, in ); + lwzx (tmp2, offset, out ); + mulld (tmp1, tmp1, k ); + add (tmp2, carry, tmp2 ); + add (tmp2, tmp1, tmp2 ); + stwx (tmp2, offset, out ); + srdi (carry, tmp2, 32 ); + subi (offset, offset, 4 ); + subi (len, len, 4 ); + bdnz (LOOP); + bind(SKIP); +} + void MacroAssembler::multiply_to_len(Register x, Register xlen, Register y, Register ylen, Register z, Register zlen, diff --git a/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp b/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp index f096299538c..63c377b6c0a 100644 --- a/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp +++ b/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp @@ -815,6 +815,8 @@ class MacroAssembler: public Assembler { Register yz_idx, Register idx, Register carry, Register product_high, Register product, Register carry2, Register tmp); + void muladd(Register out, Register in, Register offset, Register len, Register k, + Register tmp1, Register tmp2, Register carry); void multiply_to_len(Register x, Register xlen, Register y, Register ylen, Register z, Register zlen, diff --git a/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp b/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp index 2eb4937a6fa..2a149432520 100644 --- a/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp +++ b/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp @@ -3306,6 +3306,267 @@ class StubGenerator: public StubCodeGenerator { BLOCK_COMMENT("} Stub body"); } + /** + * Arguments: + * + * Input: + * R3_ARG1 - out address + * R4_ARG2 - in address + * R5_ARG3 - offset + * R6_ARG4 - len + * R7_ARG5 - k + * Output: + * R3_RET - carry + */ + address generate_mulAdd() { + __ align(CodeEntryAlignment); + StubCodeMark mark(this, "StubRoutines", "mulAdd"); + + address start = __ function_entry(); + + // C2 does not sign extend signed parameters to full 64 bits registers: + __ rldic (R5_ARG3, R5_ARG3, 2, 32); // always positive + __ clrldi(R6_ARG4, R6_ARG4, 32); // force zero bits on higher word + __ clrldi(R7_ARG5, R7_ARG5, 32); // force zero bits on higher word + + __ muladd(R3_ARG1, R4_ARG2, R5_ARG3, R6_ARG4, R7_ARG5, R8, R9, R10); + + // Moves output carry to return register + __ mr (R3_RET, R10); + + __ blr(); + + return start; + } + + /** + * Arguments: + * + * Input: + * R3_ARG1 - in address + * R4_ARG2 - in length + * R5_ARG3 - out address + * R6_ARG4 - out length + */ + address generate_squareToLen() { + __ align(CodeEntryAlignment); + StubCodeMark mark(this, "StubRoutines", "squareToLen"); + + address start = __ function_entry(); + + // args - higher word is cleaned (unsignedly) due to int to long casting + const Register in = R3_ARG1; + const Register in_len = R4_ARG2; + __ clrldi(in_len, in_len, 32); + const Register out = R5_ARG3; + const Register out_len = R6_ARG4; + __ clrldi(out_len, out_len, 32); + + // output + const Register ret = R3_RET; + + // temporaries + const Register lplw_s = R7; + const Register in_aux = R8; + const Register out_aux = R9; + const Register piece = R10; + const Register product = R14; + const Register lplw = R15; + const Register i_minus1 = R16; + const Register carry = R17; + const Register offset = R18; + const Register off_aux = R19; + const Register t = R20; + const Register mlen = R21; + const Register len = R22; + const Register a = R23; + const Register b = R24; + const Register i = R25; + const Register c = R26; + const Register cs = R27; + + // Labels + Label SKIP_LSHIFT, SKIP_DIAGONAL_SUM, SKIP_ADDONE, SKIP_MULADD, SKIP_LOOP_SQUARE; + Label LOOP_LSHIFT, LOOP_DIAGONAL_SUM, LOOP_ADDONE, LOOP_MULADD, LOOP_SQUARE; + + // Save non-volatile regs (frameless). + int current_offs = -8; + __ std(R28, current_offs, R1_SP); current_offs -= 8; + __ std(R27, current_offs, R1_SP); current_offs -= 8; + __ std(R26, current_offs, R1_SP); current_offs -= 8; + __ std(R25, current_offs, R1_SP); current_offs -= 8; + __ std(R24, current_offs, R1_SP); current_offs -= 8; + __ std(R23, current_offs, R1_SP); current_offs -= 8; + __ std(R22, current_offs, R1_SP); current_offs -= 8; + __ std(R21, current_offs, R1_SP); current_offs -= 8; + __ std(R20, current_offs, R1_SP); current_offs -= 8; + __ std(R19, current_offs, R1_SP); current_offs -= 8; + __ std(R18, current_offs, R1_SP); current_offs -= 8; + __ std(R17, current_offs, R1_SP); current_offs -= 8; + __ std(R16, current_offs, R1_SP); current_offs -= 8; + __ std(R15, current_offs, R1_SP); current_offs -= 8; + __ std(R14, current_offs, R1_SP); + + // Store the squares, right shifted one bit (i.e., divided by 2) + __ subi (out_aux, out, 8); + __ subi (in_aux, in, 4); + __ cmpwi (CCR0, in_len, 0); + // Initialize lplw outside of the loop + __ xorr (lplw, lplw, lplw); + __ ble (CCR0, SKIP_LOOP_SQUARE); // in_len <= 0 + __ mtctr (in_len); + + __ bind(LOOP_SQUARE); + __ lwzu (piece, 4, in_aux); + __ mulld (product, piece, piece); + // shift left 63 bits and only keep the MSB + __ rldic (lplw_s, lplw, 63, 0); + __ mr (lplw, product); + // shift right 1 bit without sign extension + __ srdi (product, product, 1); + // join them to the same register and store it + __ orr (product, lplw_s, product); +#ifdef VM_LITTLE_ENDIAN + // Swap low and high words for little endian + __ rldicl (product, product, 32, 0); +#endif + __ stdu (product, 8, out_aux); + __ bdnz (LOOP_SQUARE); + + __ bind(SKIP_LOOP_SQUARE); + + // Add in off-diagonal sums + __ cmpwi (CCR0, in_len, 0); + __ ble (CCR0, SKIP_DIAGONAL_SUM); + // Avoid CTR usage here in order to use it at mulAdd + __ subi (i_minus1, in_len, 1); + __ li (offset, 4); + + __ bind(LOOP_DIAGONAL_SUM); + + __ sldi (off_aux, out_len, 2); + __ sub (off_aux, off_aux, offset); + + __ mr (len, i_minus1); + __ sldi (mlen, i_minus1, 2); + __ lwzx (t, in, mlen); + + __ muladd (out, in, off_aux, len, t, a, b, carry); + + // begin + // off_aux = out_len*4 - 4 - mlen - offset*4 - 4; + __ addi (mlen, mlen, 4); + __ sldi (a, out_len, 2); + __ subi (a, a, 4); + __ sub (a, a, mlen); + __ subi (off_aux, offset, 4); + __ sub (off_aux, a, off_aux); + + __ lwzx (b, off_aux, out); + __ add (b, b, carry); + __ stwx (b, off_aux, out); + + // if (((uint64_t)s >> 32) != 0) { + __ srdi_ (a, b, 32); + __ beq (CCR0, SKIP_ADDONE); + + // while (--mlen >= 0) { + __ bind(LOOP_ADDONE); + __ subi (mlen, mlen, 4); + __ cmpwi (CCR0, mlen, 0); + __ beq (CCR0, SKIP_ADDONE); + + // if (--offset_aux < 0) { // Carry out of number + __ subi (off_aux, off_aux, 4); + __ cmpwi (CCR0, off_aux, 0); + __ blt (CCR0, SKIP_ADDONE); + + // } else { + __ lwzx (b, off_aux, out); + __ addi (b, b, 1); + __ stwx (b, off_aux, out); + __ cmpwi (CCR0, b, 0); + __ bne (CCR0, SKIP_ADDONE); + __ b (LOOP_ADDONE); + + __ bind(SKIP_ADDONE); + // } } } end + + __ addi (offset, offset, 8); + __ subi (i_minus1, i_minus1, 1); + __ cmpwi (CCR0, i_minus1, 0); + __ bge (CCR0, LOOP_DIAGONAL_SUM); + + __ bind(SKIP_DIAGONAL_SUM); + + // Shift back up and set low bit + // Shifts 1 bit left up to len positions. Assumes no leading zeros + // begin + __ cmpwi (CCR0, out_len, 0); + __ ble (CCR0, SKIP_LSHIFT); + __ li (i, 0); + __ lwz (c, 0, out); + __ subi (b, out_len, 1); + __ mtctr (b); + + __ bind(LOOP_LSHIFT); + __ mr (b, c); + __ addi (cs, i, 4); + __ lwzx (c, out, cs); + + __ sldi (b, b, 1); + __ srwi (cs, c, 31); + __ orr (b, b, cs); + __ stwx (b, i, out); + + __ addi (i, i, 4); + __ bdnz (LOOP_LSHIFT); + + __ sldi (c, out_len, 2); + __ subi (c, c, 4); + __ lwzx (b, out, c); + __ sldi (b, b, 1); + __ stwx (b, out, c); + + __ bind(SKIP_LSHIFT); + // end + + // Set low bit + __ sldi (i, in_len, 2); + __ subi (i, i, 4); + __ lwzx (i, in, i); + __ sldi (c, out_len, 2); + __ subi (c, c, 4); + __ lwzx (b, out, c); + + __ andi (i, i, 1); + __ orr (i, b, i); + + __ stwx (i, out, c); + + // Restore non-volatile regs. + current_offs = -8; + __ ld(R28, current_offs, R1_SP); current_offs -= 8; + __ ld(R27, current_offs, R1_SP); current_offs -= 8; + __ ld(R26, current_offs, R1_SP); current_offs -= 8; + __ ld(R25, current_offs, R1_SP); current_offs -= 8; + __ ld(R24, current_offs, R1_SP); current_offs -= 8; + __ ld(R23, current_offs, R1_SP); current_offs -= 8; + __ ld(R22, current_offs, R1_SP); current_offs -= 8; + __ ld(R21, current_offs, R1_SP); current_offs -= 8; + __ ld(R20, current_offs, R1_SP); current_offs -= 8; + __ ld(R19, current_offs, R1_SP); current_offs -= 8; + __ ld(R18, current_offs, R1_SP); current_offs -= 8; + __ ld(R17, current_offs, R1_SP); current_offs -= 8; + __ ld(R16, current_offs, R1_SP); current_offs -= 8; + __ ld(R15, current_offs, R1_SP); current_offs -= 8; + __ ld(R14, current_offs, R1_SP); + + __ mr(ret, out); + __ blr(); + + return start; + } /** * Arguments: @@ -3500,6 +3761,12 @@ class StubGenerator: public StubCodeGenerator { } #endif + if (UseSquareToLenIntrinsic) { + StubRoutines::_squareToLen = generate_squareToLen(); + } + if (UseMulAddIntrinsic) { + StubRoutines::_mulAdd = generate_mulAdd(); + } if (UseMontgomeryMultiplyIntrinsic) { StubRoutines::_montgomeryMultiply = CAST_FROM_FN_PTR(address, SharedRuntime::montgomery_multiply); diff --git a/src/hotspot/cpu/ppc/vm_version_ppc.cpp b/src/hotspot/cpu/ppc/vm_version_ppc.cpp index 4db0a9c20cb..b6c4058c557 100644 --- a/src/hotspot/cpu/ppc/vm_version_ppc.cpp +++ b/src/hotspot/cpu/ppc/vm_version_ppc.cpp @@ -258,6 +258,12 @@ void VM_Version::initialize() { FLAG_SET_DEFAULT(UseSHA512Intrinsics, false); } + if (FLAG_IS_DEFAULT(UseSquareToLenIntrinsic)) { + UseSquareToLenIntrinsic = true; + } + if (FLAG_IS_DEFAULT(UseMulAddIntrinsic)) { + UseMulAddIntrinsic = true; + } if (FLAG_IS_DEFAULT(UseMultiplyToLenIntrinsic)) { UseMultiplyToLenIntrinsic = true; } From d0dc2dd2310c7951943ccc4ce8251d75fc14df55 Mon Sep 17 00:00:00 2001 From: Martin Doerr Date: Mon, 25 Sep 2017 17:40:06 +0200 Subject: [PATCH 42/80] 8185979: PPC64: Implement SHA2 intrinsic Co-authored-by: Bruno Rosa Co-authored-by: Gustavo Serra Scalet Co-authored-by: Igor Nunes Reviewed-by: mdoerr, goetz --- src/hotspot/cpu/ppc/assembler_ppc.hpp | 7 +- src/hotspot/cpu/ppc/assembler_ppc.inline.hpp | 19 +- src/hotspot/cpu/ppc/macroAssembler_ppc.hpp | 34 + .../cpu/ppc/macroAssembler_ppc_sha.cpp | 1136 +++++++++++++++++ src/hotspot/cpu/ppc/stubGenerator_ppc.cpp | 30 + src/hotspot/cpu/ppc/stubRoutines_ppc.hpp | 2 +- src/hotspot/cpu/ppc/vm_version_ppc.cpp | 41 +- src/hotspot/cpu/ppc/vm_version_ppc.hpp | 3 + .../testcases/GenericTestCaseForOtherCPU.java | 3 +- .../sha/predicate/IntrinsicPredicates.java | 8 +- 10 files changed, 1271 insertions(+), 12 deletions(-) create mode 100644 src/hotspot/cpu/ppc/macroAssembler_ppc_sha.cpp diff --git a/src/hotspot/cpu/ppc/assembler_ppc.hpp b/src/hotspot/cpu/ppc/assembler_ppc.hpp index 176b911ffd3..62c395d2a50 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.hpp @@ -2175,7 +2175,8 @@ class Assembler : public AbstractAssembler { inline void vsbox( VectorRegister d, VectorRegister a); // SHA (introduced with Power 8) - // Not yet implemented. + inline void vshasigmad(VectorRegister d, VectorRegister a, bool st, int six); + inline void vshasigmaw(VectorRegister d, VectorRegister a, bool st, int six); // Vector Binary Polynomial Multiplication (introduced with Power 8) inline void vpmsumb( VectorRegister d, VectorRegister a, VectorRegister b); @@ -2286,6 +2287,10 @@ class Assembler : public AbstractAssembler { inline void lvsl( VectorRegister d, Register s2); inline void lvsr( VectorRegister d, Register s2); + // Endianess specific concatenation of 2 loaded vectors. + inline void load_perm(VectorRegister perm, Register addr); + inline void vec_perm(VectorRegister first_dest, VectorRegister second, VectorRegister perm); + // RegisterOrConstant versions. // These emitters choose between the versions using two registers and // those with register and immediate, depending on the content of roc. diff --git a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp index b3a6b89d864..f409c4d0276 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp @@ -926,7 +926,8 @@ inline void Assembler::vncipherlast(VectorRegister d, VectorRegister a, VectorRe inline void Assembler::vsbox( VectorRegister d, VectorRegister a) { emit_int32( VSBOX_OPCODE | vrt(d) | vra(a) ); } // SHA (introduced with Power 8) -// Not yet implemented. +inline void Assembler::vshasigmad(VectorRegister d, VectorRegister a, bool st, int six) { emit_int32( VSHASIGMAD_OPCODE | vrt(d) | vra(a) | vst(st) | vsix(six)); } +inline void Assembler::vshasigmaw(VectorRegister d, VectorRegister a, bool st, int six) { emit_int32( VSHASIGMAW_OPCODE | vrt(d) | vra(a) | vst(st) | vsix(six)); } // Vector Binary Polynomial Multiplication (introduced with Power 8) inline void Assembler::vpmsumb( VectorRegister d, VectorRegister a, VectorRegister b) { emit_int32( VPMSUMB_OPCODE | vrt(d) | vra(a) | vrb(b)); } @@ -1035,6 +1036,22 @@ inline void Assembler::stvxl( VectorRegister d, Register s2) { emit_int32( STVXL inline void Assembler::lvsl( VectorRegister d, Register s2) { emit_int32( LVSL_OPCODE | vrt(d) | rb(s2)); } inline void Assembler::lvsr( VectorRegister d, Register s2) { emit_int32( LVSR_OPCODE | vrt(d) | rb(s2)); } +inline void Assembler::load_perm(VectorRegister perm, Register addr) { +#if defined(VM_LITTLE_ENDIAN) + lvsr(perm, addr); +#else + lvsl(perm, addr); +#endif +} + +inline void Assembler::vec_perm(VectorRegister first_dest, VectorRegister second, VectorRegister perm) { +#if defined(VM_LITTLE_ENDIAN) + vperm(first_dest, second, first_dest, perm); +#else + vperm(first_dest, first_dest, second, perm); +#endif +} + inline void Assembler::load_const(Register d, void* x, Register tmp) { load_const(d, (long)x, tmp); } diff --git a/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp b/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp index 63c377b6c0a..f1fe2385907 100644 --- a/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp +++ b/src/hotspot/cpu/ppc/macroAssembler_ppc.hpp @@ -866,6 +866,40 @@ class MacroAssembler: public Assembler { void kernel_crc32_singleByteReg(Register crc, Register val, Register table, bool invertCRC); + // SHA-2 auxiliary functions and public interfaces + private: + void sha256_deque(const VectorRegister src, + const VectorRegister dst1, const VectorRegister dst2, const VectorRegister dst3); + void sha256_load_h_vec(const VectorRegister a, const VectorRegister e, const Register hptr); + void sha256_round(const VectorRegister* hs, const int total_hs, int& h_cnt, const VectorRegister kpw); + void sha256_load_w_plus_k_vec(const Register buf_in, const VectorRegister* ws, + const int total_ws, const Register k, const VectorRegister* kpws, + const int total_kpws); + void sha256_calc_4w(const VectorRegister w0, const VectorRegister w1, + const VectorRegister w2, const VectorRegister w3, const VectorRegister kpw0, + const VectorRegister kpw1, const VectorRegister kpw2, const VectorRegister kpw3, + const Register j, const Register k); + void sha256_update_sha_state(const VectorRegister a, const VectorRegister b, + const VectorRegister c, const VectorRegister d, const VectorRegister e, + const VectorRegister f, const VectorRegister g, const VectorRegister h, + const Register hptr); + + void sha512_load_w_vec(const Register buf_in, const VectorRegister* ws, const int total_ws); + void sha512_update_sha_state(const Register state, const VectorRegister* hs, const int total_hs); + void sha512_round(const VectorRegister* hs, const int total_hs, int& h_cnt, const VectorRegister kpw); + void sha512_load_h_vec(const Register state, const VectorRegister* hs, const int total_hs); + void sha512_calc_2w(const VectorRegister w0, const VectorRegister w1, + const VectorRegister w2, const VectorRegister w3, + const VectorRegister w4, const VectorRegister w5, + const VectorRegister w6, const VectorRegister w7, + const VectorRegister kpw0, const VectorRegister kpw1, const Register j, + const VectorRegister vRb, const Register k); + + public: + void sha256(bool multi_block); + void sha512(bool multi_block); + + // // Debugging // diff --git a/src/hotspot/cpu/ppc/macroAssembler_ppc_sha.cpp b/src/hotspot/cpu/ppc/macroAssembler_ppc_sha.cpp new file mode 100644 index 00000000000..7a82ed3f99d --- /dev/null +++ b/src/hotspot/cpu/ppc/macroAssembler_ppc_sha.cpp @@ -0,0 +1,1136 @@ +// Copyright (c) 2017 Instituto de Pesquisas Eldorado. All rights reserved. +// DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. +// +// This code is free software; you can redistribute it and/or modify it +// under the terms of the GNU General Public License version 2 only, as +// published by the Free Software Foundation. +// +// This code is distributed in the hope that it will be useful, but WITHOUT +// ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or +// FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +// version 2 for more details (a copy is included in the LICENSE file that +// accompanied this code). +// +// You should have received a copy of the GNU General Public License version +// 2 along with this work; if not, write to the Free Software Foundation, +// Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. +// +// Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA +// or visit www.oracle.com if you need additional information or have any +// questions. + +// Implemented according to "Descriptions of SHA-256, SHA-384, and SHA-512" +// (http://www.iwar.org.uk/comsec/resources/cipher/sha256-384-512.pdf). + +#include "asm/macroAssembler.inline.hpp" +#include "runtime/stubRoutines.hpp" + +/********************************************************************** + * SHA 256 + *********************************************************************/ + +void MacroAssembler::sha256_deque(const VectorRegister src, + const VectorRegister dst1, + const VectorRegister dst2, + const VectorRegister dst3) { + vsldoi (dst1, src, src, 12); + vsldoi (dst2, src, src, 8); + vsldoi (dst3, src, src, 4); +} + +void MacroAssembler::sha256_round(const VectorRegister* hs, + const int total_hs, + int& h_cnt, + const VectorRegister kpw) { + // convenience registers: cycle from 0-7 downwards + const VectorRegister a = hs[(total_hs + 0 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister b = hs[(total_hs + 1 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister c = hs[(total_hs + 2 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister d = hs[(total_hs + 3 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister e = hs[(total_hs + 4 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister f = hs[(total_hs + 5 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister g = hs[(total_hs + 6 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister h = hs[(total_hs + 7 - (h_cnt % total_hs)) % total_hs]; + // temporaries + VectorRegister ch = VR0; + VectorRegister maj = VR1; + VectorRegister bsa = VR2; + VectorRegister bse = VR3; + VectorRegister vt0 = VR4; + VectorRegister vt1 = VR5; + VectorRegister vt2 = VR6; + VectorRegister vt3 = VR7; + + vsel (ch, g, f, e); + vxor (maj, a, b); + vshasigmaw (bse, e, 1, 0xf); + vadduwm (vt2, ch, kpw); + vadduwm (vt1, h, bse); + vsel (maj, b, c, maj); + vadduwm (vt3, vt1, vt2); + vshasigmaw (bsa, a, 1, 0); + vadduwm (vt0, bsa, maj); + + vadduwm (d, d, vt3); + vadduwm (h, vt3, vt0); + + // advance vector pointer to the next iteration + h_cnt++; +} + +void MacroAssembler::sha256_load_h_vec(const VectorRegister a, + const VectorRegister e, + const Register hptr) { + // temporaries + Register tmp = R8; + VectorRegister vt0 = VR0; + VectorRegister vRb = VR6; + // labels + Label sha256_aligned; + + andi_ (tmp, hptr, 0xf); + lvx (a, hptr); + addi (tmp, hptr, 16); + lvx (e, tmp); + beq (CCR0, sha256_aligned); + + // handle unaligned accesses + load_perm(vRb, hptr); + addi (tmp, hptr, 32); + vec_perm(a, e, vRb); + + lvx (vt0, tmp); + vec_perm(e, vt0, vRb); + + // aligned accesses + bind(sha256_aligned); +} + +void MacroAssembler::sha256_load_w_plus_k_vec(const Register buf_in, + const VectorRegister* ws, + const int total_ws, + const Register k, + const VectorRegister* kpws, + const int total_kpws) { + Label w_aligned, after_w_load; + + Register tmp = R8; + VectorRegister vt0 = VR0; + VectorRegister vt1 = VR1; + VectorRegister vRb = VR6; + + andi_ (tmp, buf_in, 0xF); + beq (CCR0, w_aligned); // address ends with 0x0, not 0x8 + + // deal with unaligned addresses + lvx (ws[0], buf_in); + load_perm(vRb, buf_in); + + for (int n = 1; n < total_ws; n++) { + VectorRegister w_cur = ws[n]; + VectorRegister w_prev = ws[n-1]; + + addi (tmp, buf_in, n * 16); + lvx (w_cur, tmp); + vec_perm(w_prev, w_cur, vRb); + } + addi (tmp, buf_in, total_ws * 16); + lvx (vt0, tmp); + vec_perm(ws[total_ws-1], vt0, vRb); + b (after_w_load); + + bind(w_aligned); + + // deal with aligned addresses + lvx(ws[0], buf_in); + for (int n = 1; n < total_ws; n++) { + VectorRegister w = ws[n]; + addi (tmp, buf_in, n * 16); + lvx (w, tmp); + } + + bind(after_w_load); + +#if defined(VM_LITTLE_ENDIAN) + // Byte swapping within int values + li (tmp, 8); + lvsl (vt0, tmp); + vspltisb (vt1, 0xb); + vxor (vt1, vt0, vt1); + for (int n = 0; n < total_ws; n++) { + VectorRegister w = ws[n]; + vec_perm(w, w, vt1); + } +#endif + + // Loading k, which is always aligned to 16-bytes + lvx (kpws[0], k); + for (int n = 1; n < total_kpws; n++) { + VectorRegister kpw = kpws[n]; + addi (tmp, k, 16 * n); + lvx (kpw, tmp); + } + + // Add w to K + assert(total_ws == total_kpws, "Redesign the loop below"); + for (int n = 0; n < total_kpws; n++) { + VectorRegister kpw = kpws[n]; + VectorRegister w = ws[n]; + + vadduwm (kpw, kpw, w); + } +} + +void MacroAssembler::sha256_calc_4w(const VectorRegister w0, + const VectorRegister w1, + const VectorRegister w2, + const VectorRegister w3, + const VectorRegister kpw0, + const VectorRegister kpw1, + const VectorRegister kpw2, + const VectorRegister kpw3, + const Register j, + const Register k) { + // Temporaries + const VectorRegister vt0 = VR0; + const VectorRegister vt1 = VR1; + const VectorSRegister vsrt1 = vt1->to_vsr(); + const VectorRegister vt2 = VR2; + const VectorRegister vt3 = VR3; + const VectorSRegister vst3 = vt3->to_vsr(); + const VectorRegister vt4 = VR4; + + // load to k[j] + lvx (vt0, j, k); + + // advance j + addi (j, j, 16); // 16 bytes were read + +#if defined(VM_LITTLE_ENDIAN) + // b = w[j-15], w[j-14], w[j-13], w[j-12] + vsldoi (vt1, w1, w0, 12); + + // c = w[j-7], w[j-6], w[j-5], w[j-4] + vsldoi (vt2, w3, w2, 12); + +#else + // b = w[j-15], w[j-14], w[j-13], w[j-12] + vsldoi (vt1, w0, w1, 4); + + // c = w[j-7], w[j-6], w[j-5], w[j-4] + vsldoi (vt2, w2, w3, 4); +#endif + + // d = w[j-2], w[j-1], w[j-4], w[j-3] + vsldoi (vt3, w3, w3, 8); + + // b = s0(w[j-15]) , s0(w[j-14]) , s0(w[j-13]) , s0(w[j-12]) + vshasigmaw (vt1, vt1, 0, 0); + + // d = s1(w[j-2]) , s1(w[j-1]) , s1(w[j-4]) , s1(w[j-3]) + vshasigmaw (vt3, vt3, 0, 0xf); + + // c = s0(w[j-15]) + w[j-7], + // s0(w[j-14]) + w[j-6], + // s0(w[j-13]) + w[j-5], + // s0(w[j-12]) + w[j-4] + vadduwm (vt2, vt1, vt2); + + // c = s0(w[j-15]) + w[j-7] + w[j-16], + // s0(w[j-14]) + w[j-6] + w[j-15], + // s0(w[j-13]) + w[j-5] + w[j-14], + // s0(w[j-12]) + w[j-4] + w[j-13] + vadduwm (vt2, vt2, w0); + + // e = s0(w[j-15]) + w[j-7] + w[j-16] + s1(w[j-2]), // w[j] + // s0(w[j-14]) + w[j-6] + w[j-15] + s1(w[j-1]), // w[j+1] + // s0(w[j-13]) + w[j-5] + w[j-14] + s1(w[j-4]), // UNDEFINED + // s0(w[j-12]) + w[j-4] + w[j-13] + s1(w[j-3]) // UNDEFINED + vadduwm (vt4, vt2, vt3); + + // At this point, e[0] and e[1] are the correct values to be stored at w[j] + // and w[j+1]. + // e[2] and e[3] are not considered. + // b = s1(w[j]) , s1(s(w[j+1]) , UNDEFINED , UNDEFINED + vshasigmaw (vt1, vt4, 0, 0xf); + + // v5 = s1(w[j-2]) , s1(w[j-1]) , s1(w[j]) , s1(w[j+1]) +#if defined(VM_LITTLE_ENDIAN) + xxmrgld (vst3, vsrt1, vst3); +#else + xxmrghd (vst3, vst3, vsrt1); +#endif + + // c = s0(w[j-15]) + w[j-7] + w[j-16] + s1(w[j-2]), // w[j] + // s0(w[j-14]) + w[j-6] + w[j-15] + s1(w[j-1]), // w[j+1] + // s0(w[j-13]) + w[j-5] + w[j-14] + s1(w[j]), // w[j+2] + // s0(w[j-12]) + w[j-4] + w[j-13] + s1(w[j+1]) // w[j+4] + vadduwm (vt2, vt2, vt3); + + // Updating w0 to w3 to hold the new previous 16 values from w. + vmr (w0, w1); + vmr (w1, w2); + vmr (w2, w3); + vmr (w3, vt2); + + // store k + w to v9 (4 values at once) +#if defined(VM_LITTLE_ENDIAN) + vadduwm (kpw0, vt2, vt0); + + vsldoi (kpw1, kpw0, kpw0, 12); + vsldoi (kpw2, kpw0, kpw0, 8); + vsldoi (kpw3, kpw0, kpw0, 4); +#else + vadduwm (kpw3, vt2, vt0); + + vsldoi (kpw2, kpw3, kpw3, 12); + vsldoi (kpw1, kpw3, kpw3, 8); + vsldoi (kpw0, kpw3, kpw3, 4); +#endif +} + +void MacroAssembler::sha256_update_sha_state(const VectorRegister a, + const VectorRegister b_, + const VectorRegister c, + const VectorRegister d, + const VectorRegister e, + const VectorRegister f, + const VectorRegister g, + const VectorRegister h, + const Register hptr) { + // temporaries + VectorRegister vt0 = VR0; + VectorRegister vt1 = VR1; + VectorRegister vt2 = VR2; + VectorRegister vt3 = VR3; + VectorRegister vt4 = VR4; + VectorRegister vt5 = VR5; + VectorRegister vaux = VR6; + VectorRegister vRb = VR6; + Register tmp = R8; + Register of16 = R8; + Register of32 = R9; + Label state_load_aligned; + + // Load hptr + andi_ (tmp, hptr, 0xf); + li (of16, 16); + lvx (vt0, hptr); + lvx (vt5, of16, hptr); + beq (CCR0, state_load_aligned); + + // handle unaligned accesses + li (of32, 32); + load_perm(vRb, hptr); + + vec_perm(vt0, vt5, vRb); // vt0 = hptr[0]..hptr[3] + + lvx (vt1, hptr, of32); + vec_perm(vt5, vt1, vRb); // vt5 = hptr[4]..hptr[7] + + // aligned accesses + bind(state_load_aligned); + +#if defined(VM_LITTLE_ENDIAN) + vmrglw (vt1, b_, a); // vt1 = {a, b, ?, ?} + vmrglw (vt2, d, c); // vt2 = {c, d, ?, ?} + vmrglw (vt3, f, e); // vt3 = {e, f, ?, ?} + vmrglw (vt4, h, g); // vt4 = {g, h, ?, ?} + xxmrgld (vt1->to_vsr(), vt2->to_vsr(), vt1->to_vsr()); // vt1 = {a, b, c, d} + xxmrgld (vt3->to_vsr(), vt4->to_vsr(), vt3->to_vsr()); // vt3 = {e, f, g, h} + vadduwm (a, vt0, vt1); // a = {a+hptr[0], b+hptr[1], c+hptr[2], d+hptr[3]} + vadduwm (e, vt5, vt3); // e = {e+hptr[4], f+hptr[5], g+hptr[6], h+hptr[7]} + + // Save hptr back, works for any alignment + xxswapd (vt0->to_vsr(), a->to_vsr()); + stxvd2x (vt0->to_vsr(), hptr); + xxswapd (vt5->to_vsr(), e->to_vsr()); + stxvd2x (vt5->to_vsr(), of16, hptr); +#else + vmrglw (vt1, a, b_); // vt1 = {a, b, ?, ?} + vmrglw (vt2, c, d); // vt2 = {c, d, ?, ?} + vmrglw (vt3, e, f); // vt3 = {e, f, ?, ?} + vmrglw (vt4, g, h); // vt4 = {g, h, ?, ?} + xxmrgld (vt1->to_vsr(), vt1->to_vsr(), vt2->to_vsr()); // vt1 = {a, b, c, d} + xxmrgld (vt3->to_vsr(), vt3->to_vsr(), vt4->to_vsr()); // vt3 = {e, f, g, h} + vadduwm (d, vt0, vt1); // d = {a+hptr[0], b+hptr[1], c+hptr[2], d+hptr[3]} + vadduwm (h, vt5, vt3); // h = {e+hptr[4], f+hptr[5], g+hptr[6], h+hptr[7]} + + // Save hptr back, works for any alignment + stxvd2x (d->to_vsr(), hptr); + stxvd2x (h->to_vsr(), of16, hptr); +#endif +} + +static const uint32_t sha256_round_table[64] __attribute((aligned(16))) = { + 0x428a2f98, 0x71374491, 0xb5c0fbcf, 0xe9b5dba5, + 0x3956c25b, 0x59f111f1, 0x923f82a4, 0xab1c5ed5, + 0xd807aa98, 0x12835b01, 0x243185be, 0x550c7dc3, + 0x72be5d74, 0x80deb1fe, 0x9bdc06a7, 0xc19bf174, + 0xe49b69c1, 0xefbe4786, 0x0fc19dc6, 0x240ca1cc, + 0x2de92c6f, 0x4a7484aa, 0x5cb0a9dc, 0x76f988da, + 0x983e5152, 0xa831c66d, 0xb00327c8, 0xbf597fc7, + 0xc6e00bf3, 0xd5a79147, 0x06ca6351, 0x14292967, + 0x27b70a85, 0x2e1b2138, 0x4d2c6dfc, 0x53380d13, + 0x650a7354, 0x766a0abb, 0x81c2c92e, 0x92722c85, + 0xa2bfe8a1, 0xa81a664b, 0xc24b8b70, 0xc76c51a3, + 0xd192e819, 0xd6990624, 0xf40e3585, 0x106aa070, + 0x19a4c116, 0x1e376c08, 0x2748774c, 0x34b0bcb5, + 0x391c0cb3, 0x4ed8aa4a, 0x5b9cca4f, 0x682e6ff3, + 0x748f82ee, 0x78a5636f, 0x84c87814, 0x8cc70208, + 0x90befffa, 0xa4506ceb, 0xbef9a3f7, 0xc67178f2, +}; +static const uint32_t *sha256_round_consts = sha256_round_table; + +// R3_ARG1 - byte[] Input string with padding but in Big Endian +// R4_ARG2 - int[] SHA.state (at first, the root of primes) +// R5_ARG3 - int offset +// R6_ARG4 - int limit +// +// Internal Register usage: +// R7 - k +// R8 - tmp | j | of16 +// R9 - of32 +// VR0-VR8 - ch, maj, bsa, bse, vt0-vt3 | vt0-vt5, vaux/vRb +// VR9-VR16 - a-h +// VR17-VR20 - w0-w3 +// VR21-VR23 - vRb | vaux0-vaux2 +// VR24-VR27 - kpw0-kpw3 +void MacroAssembler::sha256(bool multi_block) { + static const ssize_t buf_size = 64; + static const uint8_t w_size = sizeof(sha256_round_table)/sizeof(uint32_t); +#ifdef AIX + // malloc provides 16 byte alignment + if (((uintptr_t)sha256_round_consts & 0xF) != 0) { + uint32_t *new_round_consts = (uint32_t*)malloc(sizeof(sha256_round_table)); + guarantee(new_round_consts, "oom"); + memcpy(new_round_consts, sha256_round_consts, sizeof(sha256_round_table)); + sha256_round_consts = (const uint32_t*)new_round_consts; + } +#endif + + Register buf_in = R3_ARG1; + Register state = R4_ARG2; + Register ofs = R5_ARG3; + Register limit = R6_ARG4; + + Label sha_loop, core_loop; + + // Save non-volatile vector registers in the red zone + static const VectorRegister nv[] = { + VR20, VR21, VR22, VR23, VR24, VR25, VR26, VR27/*, VR28, VR29, VR30, VR31*/ + }; + static const uint8_t nv_size = sizeof(nv) / sizeof (VectorRegister); + + for (int c = 0; c < nv_size; c++) { + Register tmp = R8; + li (tmp, (c - (nv_size)) * 16); + stvx(nv[c], tmp, R1); + } + + // Load hash state to registers + VectorRegister a = VR9; + VectorRegister b = VR10; + VectorRegister c = VR11; + VectorRegister d = VR12; + VectorRegister e = VR13; + VectorRegister f = VR14; + VectorRegister g = VR15; + VectorRegister h = VR16; + static const VectorRegister hs[] = {a, b, c, d, e, f, g, h}; + static const int total_hs = sizeof(hs)/sizeof(VectorRegister); + // counter for cycling through hs vector to avoid register moves between iterations + int h_cnt = 0; + + // Load a-h registers from the memory pointed by state +#if defined(VM_LITTLE_ENDIAN) + sha256_load_h_vec(a, e, state); +#else + sha256_load_h_vec(d, h, state); +#endif + + // keep k loaded also during MultiBlock loops + Register k = R7; + assert(((uintptr_t)sha256_round_consts & 0xF) == 0, "k alignment"); + load_const_optimized(k, (address)sha256_round_consts, R0); + + // Avoiding redundant loads + if (multi_block) { + align(OptoLoopAlignment); + } + bind(sha_loop); +#if defined(VM_LITTLE_ENDIAN) + sha256_deque(a, b, c, d); + sha256_deque(e, f, g, h); +#else + sha256_deque(d, c, b, a); + sha256_deque(h, g, f, e); +#endif + + // Load 16 elements from w out of the loop. + // Order of the int values is Endianess specific. + VectorRegister w0 = VR17; + VectorRegister w1 = VR18; + VectorRegister w2 = VR19; + VectorRegister w3 = VR20; + static const VectorRegister ws[] = {w0, w1, w2, w3}; + static const int total_ws = sizeof(ws)/sizeof(VectorRegister); + + VectorRegister kpw0 = VR24; + VectorRegister kpw1 = VR25; + VectorRegister kpw2 = VR26; + VectorRegister kpw3 = VR27; + static const VectorRegister kpws[] = {kpw0, kpw1, kpw2, kpw3}; + static const int total_kpws = sizeof(kpws)/sizeof(VectorRegister); + + sha256_load_w_plus_k_vec(buf_in, ws, total_ws, k, kpws, total_kpws); + + // Cycle through the first 16 elements + assert(total_ws == total_kpws, "Redesign the loop below"); + for (int n = 0; n < total_ws; n++) { + VectorRegister vaux0 = VR21; + VectorRegister vaux1 = VR22; + VectorRegister vaux2 = VR23; + + sha256_deque(kpws[n], vaux0, vaux1, vaux2); + +#if defined(VM_LITTLE_ENDIAN) + sha256_round(hs, total_hs, h_cnt, kpws[n]); + sha256_round(hs, total_hs, h_cnt, vaux0); + sha256_round(hs, total_hs, h_cnt, vaux1); + sha256_round(hs, total_hs, h_cnt, vaux2); +#else + sha256_round(hs, total_hs, h_cnt, vaux2); + sha256_round(hs, total_hs, h_cnt, vaux1); + sha256_round(hs, total_hs, h_cnt, vaux0); + sha256_round(hs, total_hs, h_cnt, kpws[n]); +#endif + } + + Register tmp = R8; + // loop the 16th to the 64th iteration by 8 steps + li (tmp, (w_size - 16) / total_hs); + mtctr(tmp); + + // j will be aligned to 4 for loading words. + // Whenever read, advance the pointer (e.g: when j is used in a function) + Register j = R8; + li (j, 16*4); + + align(OptoLoopAlignment); + bind(core_loop); + + // due to VectorRegister rotate, always iterate in multiples of total_hs + for (int n = 0; n < total_hs/4; n++) { + sha256_calc_4w(w0, w1, w2, w3, kpw0, kpw1, kpw2, kpw3, j, k); + sha256_round(hs, total_hs, h_cnt, kpw0); + sha256_round(hs, total_hs, h_cnt, kpw1); + sha256_round(hs, total_hs, h_cnt, kpw2); + sha256_round(hs, total_hs, h_cnt, kpw3); + } + + bdnz (core_loop); + + // Update hash state + sha256_update_sha_state(a, b, c, d, e, f, g, h, state); + + if (multi_block) { + addi(buf_in, buf_in, buf_size); + addi(ofs, ofs, buf_size); + cmplw(CCR0, ofs, limit); + ble(CCR0, sha_loop); + + // return ofs + mr(R3_RET, ofs); + } + + // Restore non-volatile registers + for (int c = 0; c < nv_size; c++) { + Register tmp = R8; + li (tmp, (c - (nv_size)) * 16); + lvx(nv[c], tmp, R1); + } +} + + +/********************************************************************** + * SHA 512 + *********************************************************************/ + +void MacroAssembler::sha512_load_w_vec(const Register buf_in, + const VectorRegister* ws, + const int total_ws) { + Register tmp = R8; + VectorRegister vRb = VR8; + VectorRegister aux = VR9; + Label is_aligned, after_alignment; + + andi_ (tmp, buf_in, 0xF); + beq (CCR0, is_aligned); // address ends with 0x0, not 0x8 + + // deal with unaligned addresses + lvx (ws[0], buf_in); + load_perm(vRb, buf_in); + + for (int n = 1; n < total_ws; n++) { + VectorRegister w_cur = ws[n]; + VectorRegister w_prev = ws[n-1]; + addi (tmp, buf_in, n * 16); + lvx (w_cur, tmp); + vec_perm(w_prev, w_cur, vRb); + } + addi (tmp, buf_in, total_ws * 16); + lvx (aux, tmp); + vec_perm(ws[total_ws-1], aux, vRb); + b (after_alignment); + + bind(is_aligned); + lvx (ws[0], buf_in); + for (int n = 1; n < total_ws; n++) { + VectorRegister w = ws[n]; + addi (tmp, buf_in, n * 16); + lvx (w, tmp); + } + + bind(after_alignment); +} + +// Update hash state +void MacroAssembler::sha512_update_sha_state(const Register state, + const VectorRegister* hs, + const int total_hs) { + +#if defined(VM_LITTLE_ENDIAN) + int start_idx = 0; +#else + int start_idx = 1; +#endif + + // load initial hash from the memory pointed by state + VectorRegister ini_a = VR10; + VectorRegister ini_c = VR12; + VectorRegister ini_e = VR14; + VectorRegister ini_g = VR16; + static const VectorRegister inis[] = {ini_a, ini_c, ini_e, ini_g}; + static const int total_inis = sizeof(inis)/sizeof(VectorRegister); + + Label state_save_aligned, after_state_save_aligned; + + Register addr = R7; + Register tmp = R8; + VectorRegister vRb = VR8; + VectorRegister aux = VR9; + + andi_(tmp, state, 0xf); + beq(CCR0, state_save_aligned); + // deal with unaligned addresses + + { + VectorRegister a = hs[0]; + VectorRegister b_ = hs[1]; + VectorRegister c = hs[2]; + VectorRegister d = hs[3]; + VectorRegister e = hs[4]; + VectorRegister f = hs[5]; + VectorRegister g = hs[6]; + VectorRegister h = hs[7]; + load_perm(vRb, state); + lvx (ini_a, state); + addi (addr, state, 16); + + lvx (ini_c, addr); + addi (addr, state, 32); + vec_perm(ini_a, ini_c, vRb); + + lvx (ini_e, addr); + addi (addr, state, 48); + vec_perm(ini_c, ini_e, vRb); + + lvx (ini_g, addr); + addi (addr, state, 64); + vec_perm(ini_e, ini_g, vRb); + + lvx (aux, addr); + vec_perm(ini_g, aux, vRb); + +#if defined(VM_LITTLE_ENDIAN) + xxmrgld(a->to_vsr(), b_->to_vsr(), a->to_vsr()); + xxmrgld(c->to_vsr(), d->to_vsr(), c->to_vsr()); + xxmrgld(e->to_vsr(), f->to_vsr(), e->to_vsr()); + xxmrgld(g->to_vsr(), h->to_vsr(), g->to_vsr()); +#else + xxmrgld(b_->to_vsr(), a->to_vsr(), b_->to_vsr()); + xxmrgld(d->to_vsr(), c->to_vsr(), d->to_vsr()); + xxmrgld(f->to_vsr(), e->to_vsr(), f->to_vsr()); + xxmrgld(h->to_vsr(), g->to_vsr(), h->to_vsr()); +#endif + + for (int n = start_idx; n < total_hs; n += 2) { + VectorRegister h_cur = hs[n]; + VectorRegister ini_cur = inis[n/2]; + + vaddudm(h_cur, ini_cur, h_cur); + } + + for (int n = start_idx; n < total_hs; n += 2) { + VectorRegister h_cur = hs[n]; + + mfvrd (tmp, h_cur); +#if defined(VM_LITTLE_ENDIAN) + std (tmp, 8*n + 8, state); +#else + std (tmp, 8*n - 8, state); +#endif + vsldoi (aux, h_cur, h_cur, 8); + mfvrd (tmp, aux); + std (tmp, 8*n + 0, state); + } + + b (after_state_save_aligned); + } + + bind(state_save_aligned); + { + for (int n = 0; n < total_hs; n += 2) { +#if defined(VM_LITTLE_ENDIAN) + VectorRegister h_cur = hs[n]; + VectorRegister h_next = hs[n+1]; +#else + VectorRegister h_cur = hs[n+1]; + VectorRegister h_next = hs[n]; +#endif + VectorRegister ini_cur = inis[n/2]; + + if (n/2 == 0) { + lvx(ini_cur, state); + } else { + addi(addr, state, (n/2) * 16); + lvx(ini_cur, addr); + } + xxmrgld(h_cur->to_vsr(), h_next->to_vsr(), h_cur->to_vsr()); + } + + for (int n = start_idx; n < total_hs; n += 2) { + VectorRegister h_cur = hs[n]; + VectorRegister ini_cur = inis[n/2]; + + vaddudm(h_cur, ini_cur, h_cur); + } + + for (int n = start_idx; n < total_hs; n += 2) { + VectorRegister h_cur = hs[n]; + + if (n/2 == 0) { + stvx(h_cur, state); + } else { + addi(addr, state, (n/2) * 16); + stvx(h_cur, addr); + } + } + } + + bind(after_state_save_aligned); +} + +// Use h_cnt to cycle through hs elements but also increment it at the end +void MacroAssembler::sha512_round(const VectorRegister* hs, + const int total_hs, int& h_cnt, + const VectorRegister kpw) { + + // convenience registers: cycle from 0-7 downwards + const VectorRegister a = hs[(total_hs + 0 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister b = hs[(total_hs + 1 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister c = hs[(total_hs + 2 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister d = hs[(total_hs + 3 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister e = hs[(total_hs + 4 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister f = hs[(total_hs + 5 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister g = hs[(total_hs + 6 - (h_cnt % total_hs)) % total_hs]; + const VectorRegister h = hs[(total_hs + 7 - (h_cnt % total_hs)) % total_hs]; + // temporaries + const VectorRegister Ch = VR20; + const VectorRegister Maj = VR21; + const VectorRegister bsa = VR22; + const VectorRegister bse = VR23; + const VectorRegister tmp1 = VR24; + const VectorRegister tmp2 = VR25; + + vsel (Ch, g, f, e); + vxor (Maj, a, b); + vshasigmad(bse, e, 1, 0xf); + vaddudm (tmp2, Ch, kpw); + vaddudm (tmp1, h, bse); + vsel (Maj, b, c, Maj); + vaddudm (tmp1, tmp1, tmp2); + vshasigmad(bsa, a, 1, 0); + vaddudm (tmp2, bsa, Maj); + vaddudm (d, d, tmp1); + vaddudm (h, tmp1, tmp2); + + // advance vector pointer to the next iteration + h_cnt++; +} + +void MacroAssembler::sha512_calc_2w(const VectorRegister w0, + const VectorRegister w1, + const VectorRegister w2, + const VectorRegister w3, + const VectorRegister w4, + const VectorRegister w5, + const VectorRegister w6, + const VectorRegister w7, + const VectorRegister kpw0, + const VectorRegister kpw1, + const Register j, + const VectorRegister vRb, + const Register k) { + // Temporaries + const VectorRegister VR_a = VR20; + const VectorRegister VR_b = VR21; + const VectorRegister VR_c = VR22; + const VectorRegister VR_d = VR23; + + // load to k[j] + lvx (VR_a, j, k); + // advance j + addi (j, j, 16); // 16 bytes were read + +#if defined(VM_LITTLE_ENDIAN) + // v6 = w[j-15], w[j-14] + vperm (VR_b, w1, w0, vRb); + // v12 = w[j-7], w[j-6] + vperm (VR_c, w5, w4, vRb); +#else + // v6 = w[j-15], w[j-14] + vperm (VR_b, w0, w1, vRb); + // v12 = w[j-7], w[j-6] + vperm (VR_c, w4, w5, vRb); +#endif + + // v6 = s0(w[j-15]) , s0(w[j-14]) + vshasigmad (VR_b, VR_b, 0, 0); + // v5 = s1(w[j-2]) , s1(w[j-1]) + vshasigmad (VR_d, w7, 0, 0xf); + // v6 = s0(w[j-15]) + w[j-7] , s0(w[j-14]) + w[j-6] + vaddudm (VR_b, VR_b, VR_c); + // v8 = s1(w[j-2]) + w[j-16] , s1(w[j-1]) + w[j-15] + vaddudm (VR_d, VR_d, w0); + // v9 = s0(w[j-15]) + w[j-7] + w[j-16] + s1(w[j-2]), // w[j] + // s0(w[j-14]) + w[j-6] + w[j-15] + s1(w[j-1]), // w[j+1] + vaddudm (VR_c, VR_d, VR_b); + // Updating w0 to w7 to hold the new previous 16 values from w. + vmr (w0, w1); + vmr (w1, w2); + vmr (w2, w3); + vmr (w3, w4); + vmr (w4, w5); + vmr (w5, w6); + vmr (w6, w7); + vmr (w7, VR_c); + +#if defined(VM_LITTLE_ENDIAN) + // store k + w to kpw0 (2 values at once) + vaddudm (kpw0, VR_c, VR_a); + // kpw1 holds (k + w)[1] + vsldoi (kpw1, kpw0, kpw0, 8); +#else + // store k + w to kpw0 (2 values at once) + vaddudm (kpw1, VR_c, VR_a); + // kpw1 holds (k + w)[1] + vsldoi (kpw0, kpw1, kpw1, 8); +#endif +} + +void MacroAssembler::sha512_load_h_vec(const Register state, + const VectorRegister* hs, + const int total_hs) { +#if defined(VM_LITTLE_ENDIAN) + VectorRegister a = hs[0]; + VectorRegister g = hs[6]; + int start_idx = 0; +#else + VectorRegister a = hs[1]; + VectorRegister g = hs[7]; + int start_idx = 1; +#endif + + Register addr = R7; + VectorRegister vRb = VR8; + Register tmp = R8; + Label state_aligned, after_state_aligned; + + andi_(tmp, state, 0xf); + beq(CCR0, state_aligned); + + // deal with unaligned addresses + VectorRegister aux = VR9; + + lvx(hs[start_idx], state); + load_perm(vRb, state); + + for (int n = start_idx + 2; n < total_hs; n += 2) { + VectorRegister h_cur = hs[n]; + VectorRegister h_prev2 = hs[n - 2]; + addi(addr, state, (n/2) * 16); + lvx(h_cur, addr); + vec_perm(h_prev2, h_cur, vRb); + } + addi(addr, state, (total_hs/2) * 16); + lvx (aux, addr); + vec_perm(hs[total_hs - 2 + start_idx], aux, vRb); + b (after_state_aligned); + + bind(state_aligned); + + // deal with aligned addresses + lvx(hs[start_idx], state); + + for (int n = start_idx + 2; n < total_hs; n += 2) { + VectorRegister h_cur = hs[n]; + addi(addr, state, (n/2) * 16); + lvx(h_cur, addr); + } + + bind(after_state_aligned); +} + +static const uint64_t sha512_round_table[80] __attribute((aligned(16))) = { + 0x428a2f98d728ae22, 0x7137449123ef65cd, + 0xb5c0fbcfec4d3b2f, 0xe9b5dba58189dbbc, + 0x3956c25bf348b538, 0x59f111f1b605d019, + 0x923f82a4af194f9b, 0xab1c5ed5da6d8118, + 0xd807aa98a3030242, 0x12835b0145706fbe, + 0x243185be4ee4b28c, 0x550c7dc3d5ffb4e2, + 0x72be5d74f27b896f, 0x80deb1fe3b1696b1, + 0x9bdc06a725c71235, 0xc19bf174cf692694, + 0xe49b69c19ef14ad2, 0xefbe4786384f25e3, + 0x0fc19dc68b8cd5b5, 0x240ca1cc77ac9c65, + 0x2de92c6f592b0275, 0x4a7484aa6ea6e483, + 0x5cb0a9dcbd41fbd4, 0x76f988da831153b5, + 0x983e5152ee66dfab, 0xa831c66d2db43210, + 0xb00327c898fb213f, 0xbf597fc7beef0ee4, + 0xc6e00bf33da88fc2, 0xd5a79147930aa725, + 0x06ca6351e003826f, 0x142929670a0e6e70, + 0x27b70a8546d22ffc, 0x2e1b21385c26c926, + 0x4d2c6dfc5ac42aed, 0x53380d139d95b3df, + 0x650a73548baf63de, 0x766a0abb3c77b2a8, + 0x81c2c92e47edaee6, 0x92722c851482353b, + 0xa2bfe8a14cf10364, 0xa81a664bbc423001, + 0xc24b8b70d0f89791, 0xc76c51a30654be30, + 0xd192e819d6ef5218, 0xd69906245565a910, + 0xf40e35855771202a, 0x106aa07032bbd1b8, + 0x19a4c116b8d2d0c8, 0x1e376c085141ab53, + 0x2748774cdf8eeb99, 0x34b0bcb5e19b48a8, + 0x391c0cb3c5c95a63, 0x4ed8aa4ae3418acb, + 0x5b9cca4f7763e373, 0x682e6ff3d6b2b8a3, + 0x748f82ee5defb2fc, 0x78a5636f43172f60, + 0x84c87814a1f0ab72, 0x8cc702081a6439ec, + 0x90befffa23631e28, 0xa4506cebde82bde9, + 0xbef9a3f7b2c67915, 0xc67178f2e372532b, + 0xca273eceea26619c, 0xd186b8c721c0c207, + 0xeada7dd6cde0eb1e, 0xf57d4f7fee6ed178, + 0x06f067aa72176fba, 0x0a637dc5a2c898a6, + 0x113f9804bef90dae, 0x1b710b35131c471b, + 0x28db77f523047d84, 0x32caab7b40c72493, + 0x3c9ebe0a15c9bebc, 0x431d67c49c100d4c, + 0x4cc5d4becb3e42b6, 0x597f299cfc657e2a, + 0x5fcb6fab3ad6faec, 0x6c44198c4a475817, +}; +static const uint64_t *sha512_round_consts = sha512_round_table; + +// R3_ARG1 - byte[] Input string with padding but in Big Endian +// R4_ARG2 - int[] SHA.state (at first, the root of primes) +// R5_ARG3 - int offset +// R6_ARG4 - int limit +// +// Internal Register usage: +// R7 R8 R9 - volatile temporaries +// VR0-VR7 - a-h +// VR8 - vRb +// VR9 - aux (highly volatile, use with care) +// VR10-VR17 - w0-w7 | ini_a-ini_h +// VR18 - vsp16 | kplusw0 +// VR19 - vsp32 | kplusw1 +// VR20-VR25 - sha512_calc_2w and sha512_round temporaries +void MacroAssembler::sha512(bool multi_block) { + static const ssize_t buf_size = 128; + static const uint8_t w_size = sizeof(sha512_round_table)/sizeof(uint64_t); +#ifdef AIX + // malloc provides 16 byte alignment + if (((uintptr_t)sha512_round_consts & 0xF) != 0) { + uint64_t *new_round_consts = (uint64_t*)malloc(sizeof(sha512_round_table)); + guarantee(new_round_consts, "oom"); + memcpy(new_round_consts, sha512_round_consts, sizeof(sha512_round_table)); + sha512_round_consts = (const uint64_t*)new_round_consts; + } +#endif + + Register buf_in = R3_ARG1; + Register state = R4_ARG2; + Register ofs = R5_ARG3; + Register limit = R6_ARG4; + + Label sha_loop, core_loop; + + // Save non-volatile vector registers in the red zone + static const VectorRegister nv[] = { + VR20, VR21, VR22, VR23, VR24, VR25/*, VR26, VR27, VR28, VR29, VR30, VR31*/ + }; + static const uint8_t nv_size = sizeof(nv) / sizeof (VectorRegister); + + for (int c = 0; c < nv_size; c++) { + Register idx = R7; + li (idx, (c - (nv_size)) * 16); + stvx(nv[c], idx, R1); + } + + // Load hash state to registers + VectorRegister a = VR0; + VectorRegister b = VR1; + VectorRegister c = VR2; + VectorRegister d = VR3; + VectorRegister e = VR4; + VectorRegister f = VR5; + VectorRegister g = VR6; + VectorRegister h = VR7; + static const VectorRegister hs[] = {a, b, c, d, e, f, g, h}; + static const int total_hs = sizeof(hs)/sizeof(VectorRegister); + // counter for cycling through hs vector to avoid register moves between iterations + int h_cnt = 0; + + // Load a-h registers from the memory pointed by state + sha512_load_h_vec(state, hs, total_hs); + + Register k = R9; + assert(((uintptr_t)sha512_round_consts & 0xF) == 0, "k alignment"); + load_const_optimized(k, (address)sha512_round_consts, R0); + + if (multi_block) { + align(OptoLoopAlignment); + } + bind(sha_loop); + + for (int n = 0; n < total_hs; n += 2) { +#if defined(VM_LITTLE_ENDIAN) + VectorRegister h_cur = hs[n]; + VectorRegister h_next = hs[n + 1]; +#else + VectorRegister h_cur = hs[n + 1]; + VectorRegister h_next = hs[n]; +#endif + vsldoi (h_next, h_cur, h_cur, 8); + } + + // Load 16 elements from w out of the loop. + // Order of the long values is Endianess specific. + VectorRegister w0 = VR10; + VectorRegister w1 = VR11; + VectorRegister w2 = VR12; + VectorRegister w3 = VR13; + VectorRegister w4 = VR14; + VectorRegister w5 = VR15; + VectorRegister w6 = VR16; + VectorRegister w7 = VR17; + static const VectorRegister ws[] = {w0, w1, w2, w3, w4, w5, w6, w7}; + static const int total_ws = sizeof(ws)/sizeof(VectorRegister); + + // Load 16 w into vectors and setup vsl for vperm + sha512_load_w_vec(buf_in, ws, total_ws); + +#if defined(VM_LITTLE_ENDIAN) + VectorRegister vsp16 = VR18; + VectorRegister vsp32 = VR19; + VectorRegister shiftarg = VR9; + + vspltisw(vsp16, 8); + vspltisw(shiftarg, 1); + vsl (vsp16, vsp16, shiftarg); + vsl (vsp32, vsp16, shiftarg); + + VectorRegister vsp8 = VR9; + vspltish(vsp8, 8); + + // Convert input from Big Endian to Little Endian + for (int c = 0; c < total_ws; c++) { + VectorRegister w = ws[c]; + vrlh (w, w, vsp8); + } + for (int c = 0; c < total_ws; c++) { + VectorRegister w = ws[c]; + vrlw (w, w, vsp16); + } + for (int c = 0; c < total_ws; c++) { + VectorRegister w = ws[c]; + vrld (w, w, vsp32); + } +#endif + + Register Rb = R10; + VectorRegister vRb = VR8; + li (Rb, 8); + load_perm(vRb, Rb); + + VectorRegister kplusw0 = VR18; + VectorRegister kplusw1 = VR19; + + Register addr = R7; + + for (int n = 0; n < total_ws; n++) { + VectorRegister w = ws[n]; + + if (n == 0) { + lvx (kplusw0, k); + } else { + addi (addr, k, n * 16); + lvx (kplusw0, addr); + } +#if defined(VM_LITTLE_ENDIAN) + vaddudm(kplusw0, kplusw0, w); + vsldoi (kplusw1, kplusw0, kplusw0, 8); +#else + vaddudm(kplusw1, kplusw0, w); + vsldoi (kplusw0, kplusw1, kplusw1, 8); +#endif + + sha512_round(hs, total_hs, h_cnt, kplusw0); + sha512_round(hs, total_hs, h_cnt, kplusw1); + } + + Register tmp = R8; + li (tmp, (w_size-16)/total_hs); + mtctr (tmp); + // j will be aligned to 4 for loading words. + // Whenever read, advance the pointer (e.g: when j is used in a function) + Register j = tmp; + li (j, 8*16); + + align(OptoLoopAlignment); + bind(core_loop); + + // due to VectorRegister rotate, always iterate in multiples of total_hs + for (int n = 0; n < total_hs/2; n++) { + sha512_calc_2w(w0, w1, w2, w3, w4, w5, w6, w7, kplusw0, kplusw1, j, vRb, k); + sha512_round(hs, total_hs, h_cnt, kplusw0); + sha512_round(hs, total_hs, h_cnt, kplusw1); + } + + bdnz (core_loop); + + sha512_update_sha_state(state, hs, total_hs); + + if (multi_block) { + addi(buf_in, buf_in, buf_size); + addi(ofs, ofs, buf_size); + cmplw(CCR0, ofs, limit); + ble(CCR0, sha_loop); + + // return ofs + mr(R3_RET, ofs); + } + + // Restore non-volatile registers + for (int c = 0; c < nv_size; c++) { + Register idx = R7; + li (idx, (c - (nv_size)) * 16); + lvx(nv[c], idx, R1); + } +} diff --git a/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp b/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp index 2a149432520..acfae9cfcba 100644 --- a/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp +++ b/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp @@ -3095,6 +3095,28 @@ class StubGenerator: public StubCodeGenerator { return start; } + address generate_sha256_implCompress(bool multi_block, const char *name) { + assert(UseSHA, "need SHA instructions"); + StubCodeMark mark(this, "StubRoutines", name); + address start = __ function_entry(); + + __ sha256 (multi_block); + + __ blr(); + return start; + } + + address generate_sha512_implCompress(bool multi_block, const char *name) { + assert(UseSHA, "need SHA instructions"); + StubCodeMark mark(this, "StubRoutines", name); + address start = __ function_entry(); + + __ sha512 (multi_block); + + __ blr(); + return start; + } + void generate_arraycopy_stubs() { // Note: the disjoint stubs must be generated first, some of // the conjoint stubs use them. @@ -3781,6 +3803,14 @@ class StubGenerator: public StubCodeGenerator { StubRoutines::_aescrypt_decryptBlock = generate_aescrypt_decryptBlock(); } + if (UseSHA256Intrinsics) { + StubRoutines::_sha256_implCompress = generate_sha256_implCompress(false, "sha256_implCompress"); + StubRoutines::_sha256_implCompressMB = generate_sha256_implCompress(true, "sha256_implCompressMB"); + } + if (UseSHA512Intrinsics) { + StubRoutines::_sha512_implCompress = generate_sha512_implCompress(false, "sha512_implCompress"); + StubRoutines::_sha512_implCompressMB = generate_sha512_implCompress(true, "sha512_implCompressMB"); + } } public: diff --git a/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp b/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp index dcda6be8a76..a012175c493 100644 --- a/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp +++ b/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp @@ -34,7 +34,7 @@ static bool returns_to_call_stub(address return_pc) { return return_pc == _call_ enum platform_dependent_constants { code_size1 = 20000, // simply increase if too small (assembler will crash if too small) - code_size2 = 20000 // simply increase if too small (assembler will crash if too small) + code_size2 = 22000 // simply increase if too small (assembler will crash if too small) }; // CRC32 Intrinsics. diff --git a/src/hotspot/cpu/ppc/vm_version_ppc.cpp b/src/hotspot/cpu/ppc/vm_version_ppc.cpp index b6c4058c557..c4d3041183d 100644 --- a/src/hotspot/cpu/ppc/vm_version_ppc.cpp +++ b/src/hotspot/cpu/ppc/vm_version_ppc.cpp @@ -113,7 +113,7 @@ void VM_Version::initialize() { // Create and print feature-string. char buf[(num_features+1) * 16]; // Max 16 chars per feature. jio_snprintf(buf, sizeof(buf), - "ppc64%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s", + "ppc64%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s", (has_fsqrt() ? " fsqrt" : ""), (has_isel() ? " isel" : ""), (has_lxarxeh() ? " lxarxeh" : ""), @@ -130,7 +130,8 @@ void VM_Version::initialize() { (has_mfdscr() ? " mfdscr" : ""), (has_vsx() ? " vsx" : ""), (has_ldbrx() ? " ldbrx" : ""), - (has_stdbrx() ? " stdbrx" : "") + (has_stdbrx() ? " stdbrx" : ""), + (has_vshasig() ? " sha" : "") // Make sure number of %s matches num_features! ); _features_string = os::strdup(buf); @@ -247,17 +248,43 @@ void VM_Version::initialize() { FLAG_SET_DEFAULT(UseFMA, true); } - if (UseSHA) { - warning("SHA instructions are not available on this CPU"); + if (has_vshasig()) { + if (FLAG_IS_DEFAULT(UseSHA)) { + UseSHA = true; + } + } else if (UseSHA) { + if (!FLAG_IS_DEFAULT(UseSHA)) + warning("SHA instructions are not available on this CPU"); FLAG_SET_DEFAULT(UseSHA, false); } - if (UseSHA1Intrinsics || UseSHA256Intrinsics || UseSHA512Intrinsics) { - warning("SHA intrinsics are not available on this CPU"); + + if (UseSHA1Intrinsics) { + warning("Intrinsics for SHA-1 crypto hash functions not available on this CPU."); FLAG_SET_DEFAULT(UseSHA1Intrinsics, false); + } + + if (UseSHA && has_vshasig()) { + if (FLAG_IS_DEFAULT(UseSHA256Intrinsics)) { + FLAG_SET_DEFAULT(UseSHA256Intrinsics, true); + } + } else if (UseSHA256Intrinsics) { + warning("Intrinsics for SHA-224 and SHA-256 crypto hash functions not available on this CPU."); FLAG_SET_DEFAULT(UseSHA256Intrinsics, false); + } + + if (UseSHA && has_vshasig()) { + if (FLAG_IS_DEFAULT(UseSHA512Intrinsics)) { + FLAG_SET_DEFAULT(UseSHA512Intrinsics, true); + } + } else if (UseSHA512Intrinsics) { + warning("Intrinsics for SHA-384 and SHA-512 crypto hash functions not available on this CPU."); FLAG_SET_DEFAULT(UseSHA512Intrinsics, false); } + if (!(UseSHA1Intrinsics || UseSHA256Intrinsics || UseSHA512Intrinsics)) { + FLAG_SET_DEFAULT(UseSHA, false); + } + if (FLAG_IS_DEFAULT(UseSquareToLenIntrinsic)) { UseSquareToLenIntrinsic = true; } @@ -663,6 +690,7 @@ void VM_Version::determine_features() { a->lxvd2x(VSR0, R3_ARG1); // code[14] -> vsx a->ldbrx(R7, R3_ARG1, R4_ARG2); // code[15] -> ldbrx a->stdbrx(R7, R3_ARG1, R4_ARG2); // code[16] -> stdbrx + a->vshasigmaw(VR0, VR1, 1, 0xF); // code[17] -> vshasig a->blr(); // Emit function to set one cache line to zero. Emit function descriptor and get pointer to it. @@ -714,6 +742,7 @@ void VM_Version::determine_features() { if (code[feature_cntr++]) features |= vsx_m; if (code[feature_cntr++]) features |= ldbrx_m; if (code[feature_cntr++]) features |= stdbrx_m; + if (code[feature_cntr++]) features |= vshasig_m; // Print the detection code. if (PrintAssembly) { diff --git a/src/hotspot/cpu/ppc/vm_version_ppc.hpp b/src/hotspot/cpu/ppc/vm_version_ppc.hpp index f7d5ea73aca..eec629f1d3e 100644 --- a/src/hotspot/cpu/ppc/vm_version_ppc.hpp +++ b/src/hotspot/cpu/ppc/vm_version_ppc.hpp @@ -49,6 +49,7 @@ protected: vsx, ldbrx, stdbrx, + vshasig, num_features // last entry to count features }; enum Feature_Flag_Set { @@ -64,6 +65,7 @@ protected: vand_m = (1 << vand ), lqarx_m = (1 << lqarx ), vcipher_m = (1 << vcipher), + vshasig_m = (1 << vshasig), vpmsumb_m = (1 << vpmsumb), tcheck_m = (1 << tcheck ), mfdscr_m = (1 << mfdscr ), @@ -106,6 +108,7 @@ public: static bool has_vsx() { return (_features & vsx_m) != 0; } static bool has_ldbrx() { return (_features & ldbrx_m) != 0; } static bool has_stdbrx() { return (_features & stdbrx_m) != 0; } + static bool has_vshasig() { return (_features & vshasig_m) != 0; } static bool has_mtfprd() { return has_vpmsumb(); } // alias for P8 // Assembler testing diff --git a/test/hotspot/jtreg/compiler/intrinsics/sha/cli/testcases/GenericTestCaseForOtherCPU.java b/test/hotspot/jtreg/compiler/intrinsics/sha/cli/testcases/GenericTestCaseForOtherCPU.java index 698afa06de0..2ecaf5f9d28 100644 --- a/test/hotspot/jtreg/compiler/intrinsics/sha/cli/testcases/GenericTestCaseForOtherCPU.java +++ b/test/hotspot/jtreg/compiler/intrinsics/sha/cli/testcases/GenericTestCaseForOtherCPU.java @@ -42,7 +42,8 @@ public class GenericTestCaseForOtherCPU extends new OrPredicate(Platform::isAArch64, new OrPredicate(Platform::isS390x, new OrPredicate(Platform::isSparc, - new OrPredicate(Platform::isX64, Platform::isX86)))))); + new OrPredicate(Platform::isPPC, + new OrPredicate(Platform::isX64, Platform::isX86))))))); } @Override diff --git a/test/hotspot/jtreg/compiler/testlibrary/sha/predicate/IntrinsicPredicates.java b/test/hotspot/jtreg/compiler/testlibrary/sha/predicate/IntrinsicPredicates.java index d866377049b..5dce9a1fb4b 100644 --- a/test/hotspot/jtreg/compiler/testlibrary/sha/predicate/IntrinsicPredicates.java +++ b/test/hotspot/jtreg/compiler/testlibrary/sha/predicate/IntrinsicPredicates.java @@ -71,23 +71,27 @@ public class IntrinsicPredicates { = new OrPredicate(new CPUSpecificPredicate("aarch64.*", new String[] { "sha256" }, null), new OrPredicate(new CPUSpecificPredicate("s390.*", new String[] { "sha256" }, null), new OrPredicate(new CPUSpecificPredicate("sparc.*", new String[] { "sha256" }, null), + new OrPredicate(new CPUSpecificPredicate("ppc64.*", new String[] { "sha" }, null), + new OrPredicate(new CPUSpecificPredicate("ppc64le.*", new String[] { "sha" }, null), // x86 variants new OrPredicate(new CPUSpecificPredicate("amd64.*", new String[] { "sha" }, null), new OrPredicate(new CPUSpecificPredicate("i386.*", new String[] { "sha" }, null), new OrPredicate(new CPUSpecificPredicate("x86.*", new String[] { "sha" }, null), new OrPredicate(new CPUSpecificPredicate("amd64.*", new String[] { "avx2", "bmi2" }, null), - new CPUSpecificPredicate("x86_64", new String[] { "avx2", "bmi2" }, null)))))))); + new CPUSpecificPredicate("x86_64", new String[] { "avx2", "bmi2" }, null)))))))))); public static final BooleanSupplier SHA512_INSTRUCTION_AVAILABLE = new OrPredicate(new CPUSpecificPredicate("aarch64.*", new String[] { "sha512" }, null), new OrPredicate(new CPUSpecificPredicate("s390.*", new String[] { "sha512" }, null), new OrPredicate(new CPUSpecificPredicate("sparc.*", new String[] { "sha512" }, null), + new OrPredicate(new CPUSpecificPredicate("ppc64.*", new String[] { "sha" }, null), + new OrPredicate(new CPUSpecificPredicate("ppc64le.*", new String[] { "sha" }, null), // x86 variants new OrPredicate(new CPUSpecificPredicate("amd64.*", new String[] { "sha" }, null), new OrPredicate(new CPUSpecificPredicate("i386.*", new String[] { "sha" }, null), new OrPredicate(new CPUSpecificPredicate("x86.*", new String[] { "sha" }, null), new OrPredicate(new CPUSpecificPredicate("amd64.*", new String[] { "avx2", "bmi2" }, null), - new CPUSpecificPredicate("x86_64", new String[] { "avx2", "bmi2" }, null)))))))); + new CPUSpecificPredicate("x86_64", new String[] { "avx2", "bmi2" }, null)))))))))); public static final BooleanSupplier ANY_SHA_INSTRUCTION_AVAILABLE = new OrPredicate(IntrinsicPredicates.SHA1_INSTRUCTION_AVAILABLE, From 7a446900dace4c4b006546d6f82050cd48bcc565 Mon Sep 17 00:00:00 2001 From: Calvin Cheung Date: Mon, 25 Sep 2017 14:23:18 -0700 Subject: [PATCH 43/80] 8187884: [TESTBUG] compiler/classUnloading/anonymousClass/TestAnonymousClassUnloading failed with ClassNotFoundException Reviewed-by: kvn --- .../anonymousClass/TestAnonymousClassUnloading.java | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/test/hotspot/jtreg/compiler/classUnloading/anonymousClass/TestAnonymousClassUnloading.java b/test/hotspot/jtreg/compiler/classUnloading/anonymousClass/TestAnonymousClassUnloading.java index 0c41ba78d3a..76559944c7c 100644 --- a/test/hotspot/jtreg/compiler/classUnloading/anonymousClass/TestAnonymousClassUnloading.java +++ b/test/hotspot/jtreg/compiler/classUnloading/anonymousClass/TestAnonymousClassUnloading.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2014, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2014, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -22,13 +22,16 @@ */ /* - * @test TestAnonymousClassUnloading + * @test * @bug 8054402 * @summary "Tests unloading of anonymous classes." * @library /test/lib / * @modules java.base/jdk.internal.misc + * @build sun.hotspot.WhiteBox + * @run driver ClassFileInstaller sun.hotspot.WhiteBox + * sun.hotspot.WhiteBox$WhiteBoxPermission * - * @run main/othervm/bootclasspath -XX:+UnlockDiagnosticVMOptions -XX:+WhiteBoxAPI + * @run main/othervm -Xbootclasspath/a:. -XX:+UnlockDiagnosticVMOptions -XX:+WhiteBoxAPI * -XX:-BackgroundCompilation * compiler.classUnloading.anonymousClass.TestAnonymousClassUnloading */ From 04b79fa8f36d439ce293d69e2451335cd3850c06 Mon Sep 17 00:00:00 2001 From: Mikael Gerdin Date: Mon, 25 Sep 2017 21:25:46 -0400 Subject: [PATCH 44/80] 8187040: ThreadCritical crashes on Solaris if used between os::init and os::init_2 Reviewed-by: dholmes, stuefe --- src/hotspot/os/aix/os_aix.cpp | 2 -- src/hotspot/os/aix/threadCritical_aix.cpp | 6 ------ src/hotspot/os/bsd/os_bsd.cpp | 2 -- src/hotspot/os/bsd/threadCritical_bsd.cpp | 6 ------ src/hotspot/os/linux/os_linux.cpp | 2 -- src/hotspot/os/linux/threadCritical_linux.cpp | 6 ------ src/hotspot/os/solaris/os_solaris.cpp | 5 ++--- src/hotspot/os/solaris/os_solaris.hpp | 4 ++++ src/hotspot/os/solaris/threadCritical_solaris.cpp | 14 ++------------ src/hotspot/os/windows/threadCritical_windows.cpp | 10 ---------- src/hotspot/share/runtime/threadCritical.hpp | 5 ----- 11 files changed, 8 insertions(+), 54 deletions(-) diff --git a/src/hotspot/os/aix/os_aix.cpp b/src/hotspot/os/aix/os_aix.cpp index 68a206afd14..70441018902 100644 --- a/src/hotspot/os/aix/os_aix.cpp +++ b/src/hotspot/os/aix/os_aix.cpp @@ -3443,8 +3443,6 @@ void os::init(void) { init_random(1234567); - ThreadCritical::initialize(); - // Main_thread points to the aboriginal thread. Aix::_main_thread = pthread_self(); diff --git a/src/hotspot/os/aix/threadCritical_aix.cpp b/src/hotspot/os/aix/threadCritical_aix.cpp index a5d893ba9f1..cd25cb68dc4 100644 --- a/src/hotspot/os/aix/threadCritical_aix.cpp +++ b/src/hotspot/os/aix/threadCritical_aix.cpp @@ -38,12 +38,6 @@ static pthread_t tc_owner = 0; static pthread_mutex_t tc_mutex = PTHREAD_MUTEX_INITIALIZER; static int tc_count = 0; -void ThreadCritical::initialize() { -} - -void ThreadCritical::release() { -} - ThreadCritical::ThreadCritical() { pthread_t self = pthread_self(); if (self != tc_owner) { diff --git a/src/hotspot/os/bsd/os_bsd.cpp b/src/hotspot/os/bsd/os_bsd.cpp index ef83bf31130..bfa7811f8da 100644 --- a/src/hotspot/os/bsd/os_bsd.cpp +++ b/src/hotspot/os/bsd/os_bsd.cpp @@ -3353,8 +3353,6 @@ void os::init(void) { init_random(1234567); - ThreadCritical::initialize(); - Bsd::set_page_size(getpagesize()); if (Bsd::page_size() == -1) { fatal("os_bsd.cpp: os::init: sysconf failed (%s)", os::strerror(errno)); diff --git a/src/hotspot/os/bsd/threadCritical_bsd.cpp b/src/hotspot/os/bsd/threadCritical_bsd.cpp index 7cac3ca228b..71c51df599d 100644 --- a/src/hotspot/os/bsd/threadCritical_bsd.cpp +++ b/src/hotspot/os/bsd/threadCritical_bsd.cpp @@ -37,12 +37,6 @@ static pthread_t tc_owner = 0; static pthread_mutex_t tc_mutex = PTHREAD_MUTEX_INITIALIZER; static int tc_count = 0; -void ThreadCritical::initialize() { -} - -void ThreadCritical::release() { -} - ThreadCritical::ThreadCritical() { pthread_t self = pthread_self(); if (self != tc_owner) { diff --git a/src/hotspot/os/linux/os_linux.cpp b/src/hotspot/os/linux/os_linux.cpp index e6ebec3e53e..5eabc870287 100644 --- a/src/hotspot/os/linux/os_linux.cpp +++ b/src/hotspot/os/linux/os_linux.cpp @@ -4768,8 +4768,6 @@ void os::init(void) { init_random(1234567); - ThreadCritical::initialize(); - Linux::set_page_size(sysconf(_SC_PAGESIZE)); if (Linux::page_size() == -1) { fatal("os_linux.cpp: os::init: sysconf failed (%s)", diff --git a/src/hotspot/os/linux/threadCritical_linux.cpp b/src/hotspot/os/linux/threadCritical_linux.cpp index 7cac3ca228b..71c51df599d 100644 --- a/src/hotspot/os/linux/threadCritical_linux.cpp +++ b/src/hotspot/os/linux/threadCritical_linux.cpp @@ -37,12 +37,6 @@ static pthread_t tc_owner = 0; static pthread_mutex_t tc_mutex = PTHREAD_MUTEX_INITIALIZER; static int tc_count = 0; -void ThreadCritical::initialize() { -} - -void ThreadCritical::release() { -} - ThreadCritical::ThreadCritical() { pthread_t self = pthread_self(); if (self != tc_owner) { diff --git a/src/hotspot/os/solaris/os_solaris.cpp b/src/hotspot/os/solaris/os_solaris.cpp index 065fcb4e602..814589d375d 100644 --- a/src/hotspot/os/solaris/os_solaris.cpp +++ b/src/hotspot/os/solaris/os_solaris.cpp @@ -4076,6 +4076,7 @@ int_fnP_cond_tP os::Solaris::_cond_broadcast; int_fnP_cond_tP_i_vP os::Solaris::_cond_init; int_fnP_cond_tP os::Solaris::_cond_destroy; int os::Solaris::_cond_scope = USYNC_THREAD; +bool os::Solaris::_synchronization_initialized; void os::Solaris::synchronization_init() { if (UseLWPSynchronization) { @@ -4125,6 +4126,7 @@ void os::Solaris::synchronization_init() { os::Solaris::set_cond_destroy(::cond_destroy); } } + _synchronization_initialized = true; } bool os::Solaris::liblgrp_init() { @@ -4198,9 +4200,6 @@ void os::init(void) { dladdr1_func = CAST_TO_FN_PTR(dladdr1_func_type, dlsym(hdl, "dladdr1")); } - // (Solaris only) this switches to calls that actually do locking. - ThreadCritical::initialize(); - main_thread = thr_self(); // dynamic lookup of functions that may not be available in our lowest diff --git a/src/hotspot/os/solaris/os_solaris.hpp b/src/hotspot/os/solaris/os_solaris.hpp index 56305846c58..c5fe31847f0 100644 --- a/src/hotspot/os/solaris/os_solaris.hpp +++ b/src/hotspot/os/solaris/os_solaris.hpp @@ -65,6 +65,8 @@ class Solaris { static int_fnP_cond_tP _cond_destroy; static int _cond_scope; + static bool _synchronization_initialized; + typedef uintptr_t lgrp_cookie_t; typedef id_t lgrp_id_t; typedef int lgrp_rsrc_t; @@ -227,6 +229,8 @@ class Solaris { static void set_cond_destroy(int_fnP_cond_tP func) { _cond_destroy = func; } static void set_cond_scope(int scope) { _cond_scope = scope; } + static bool synchronization_initialized() { return _synchronization_initialized; } + static void set_lgrp_home(lgrp_home_func_t func) { _lgrp_home = func; } static void set_lgrp_init(lgrp_init_func_t func) { _lgrp_init = func; } static void set_lgrp_fini(lgrp_fini_func_t func) { _lgrp_fini = func; } diff --git a/src/hotspot/os/solaris/threadCritical_solaris.cpp b/src/hotspot/os/solaris/threadCritical_solaris.cpp index 53bd865b592..bb2c9e7e875 100644 --- a/src/hotspot/os/solaris/threadCritical_solaris.cpp +++ b/src/hotspot/os/solaris/threadCritical_solaris.cpp @@ -42,10 +42,9 @@ static mutex_t global_mut; static thread_t global_mut_owner = -1; static int global_mut_count = 0; -static bool initialized = false; ThreadCritical::ThreadCritical() { - if (initialized) { + if (os::Solaris::synchronization_initialized()) { thread_t owner = thr_self(); if (global_mut_owner != owner) { if (os::Solaris::mutex_lock(&global_mut)) @@ -62,7 +61,7 @@ ThreadCritical::ThreadCritical() { } ThreadCritical::~ThreadCritical() { - if (initialized) { + if (os::Solaris::synchronization_initialized()) { assert(global_mut_owner == thr_self(), "must have correct owner"); assert(global_mut_count > 0, "must have correct count"); --global_mut_count; @@ -75,12 +74,3 @@ ThreadCritical::~ThreadCritical() { assert (Threads::number_of_threads() == 0, "valid only during initialization"); } } - -void ThreadCritical::initialize() { - // This method is called at the end of os::init(). Until - // then, we don't do real locking. - initialized = true; -} - -void ThreadCritical::release() { -} diff --git a/src/hotspot/os/windows/threadCritical_windows.cpp b/src/hotspot/os/windows/threadCritical_windows.cpp index b432f7bb078..66f19e91fc0 100644 --- a/src/hotspot/os/windows/threadCritical_windows.cpp +++ b/src/hotspot/os/windows/threadCritical_windows.cpp @@ -51,16 +51,6 @@ static DWORD lock_owner = -1; // and found them ~30 times slower than the critical region code. // -void ThreadCritical::initialize() { -} - -void ThreadCritical::release() { - assert(lock_owner == -1, "Mutex being deleted while owned."); - assert(lock_count == -1, "Mutex being deleted while recursively locked"); - assert(lock_event != NULL, "Sanity check"); - CloseHandle(lock_event); -} - ThreadCritical::ThreadCritical() { DWORD current_thread = GetCurrentThreadId(); diff --git a/src/hotspot/share/runtime/threadCritical.hpp b/src/hotspot/share/runtime/threadCritical.hpp index 340c00fa5d1..4ae5086d773 100644 --- a/src/hotspot/share/runtime/threadCritical.hpp +++ b/src/hotspot/share/runtime/threadCritical.hpp @@ -47,11 +47,6 @@ // or CHeapObj, due to initialization issues. class ThreadCritical : public StackObj { - friend class os; - private: - static void initialize(); - static void release(); - public: ThreadCritical(); ~ThreadCritical(); From 195531f73372ec5170e5894528c806ec67216fe1 Mon Sep 17 00:00:00 2001 From: Serguei Spitsyn Date: Tue, 26 Sep 2017 00:52:29 -0700 Subject: [PATCH 45/80] 8177901: JDWP exit error JVMTI_ERROR_WRONG_PHASE(112): on checking for an interface Add synchronization between CommandLoop and cbVMDeath callback Reviewed-by: dholmes, dcubed --- .../share/native/libjdwp/debugInit.c | 3 + .../share/native/libjdwp/eventHandler.c | 10 ++-- .../share/native/libjdwp/eventHelper.c | 55 ++++++++++++++++++- .../share/native/libjdwp/eventHelper.h | 5 +- 4 files changed, 64 insertions(+), 9 deletions(-) diff --git a/src/jdk.jdwp.agent/share/native/libjdwp/debugInit.c b/src/jdk.jdwp.agent/share/native/libjdwp/debugInit.c index 075dedacbb1..4ed1d5abf71 100644 --- a/src/jdk.jdwp.agent/share/native/libjdwp/debugInit.c +++ b/src/jdk.jdwp.agent/share/native/libjdwp/debugInit.c @@ -1301,6 +1301,9 @@ debugInit_exit(jvmtiError error, const char *msg) { enum exit_codes { EXIT_NO_ERRORS = 0, EXIT_JVMTI_ERROR = 1, EXIT_TRANSPORT_ERROR = 2 }; + // Release commandLoop vmDeathLock if necessary + commandLoop_exitVmDeathLockOnError(); + // Prepare to exit. Log error and finish logging LOG_MISC(("Exiting with error %s(%d): %s", jvmtiErrorText(error), error, ((msg == NULL) ? "" : msg))); diff --git a/src/jdk.jdwp.agent/share/native/libjdwp/eventHandler.c b/src/jdk.jdwp.agent/share/native/libjdwp/eventHandler.c index f78232e1229..2fc3d1b82d3 100644 --- a/src/jdk.jdwp.agent/share/native/libjdwp/eventHandler.c +++ b/src/jdk.jdwp.agent/share/native/libjdwp/eventHandler.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 1998, 2007, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1998, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -1287,11 +1287,11 @@ cbVMDeath(jvmtiEnv *jvmti_env, JNIEnv *env) } debugMonitorExit(callbackBlock); /* - * The VM will die soon after the completion of this callback - we - * may need to do a final synchronization with the command loop to - * avoid the VM terminating with replying to the final (resume) - * command. + * The VM will die soon after the completion of this callback - + * we synchronize with both the command loop and the debug loop + * for a more orderly shutdown. */ + commandLoop_sync(); debugLoop_sync(); LOG_MISC(("END cbVMDeath")); diff --git a/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.c b/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.c index bd5f080ba37..f301cdc63e3 100644 --- a/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.c +++ b/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.c @@ -29,6 +29,9 @@ #include "threadControl.h" #include "invoker.h" + +#define COMMAND_LOOP_THREAD_NAME "JDWP Event Helper Thread" + /* * Event helper thread command commandKinds */ @@ -121,6 +124,9 @@ static CommandQueue commandQueue; static jrawMonitorID commandQueueLock; static jrawMonitorID commandCompleteLock; static jrawMonitorID blockCommandLoopLock; +static jrawMonitorID vmDeathLock; +static volatile jboolean commandLoopEnteredVmDeathLock = JNI_FALSE; + static jint maxQueueSize = 50 * 1024; /* TO DO: Make this configurable */ static jboolean holdEvents; static jint currentQueueSize = 0; @@ -700,9 +706,15 @@ commandLoop(jvmtiEnv* jvmti_env, JNIEnv* jni_env, void* arg) * handleCommand() to prevent any races. */ jboolean doBlock = needBlockCommandLoop(command); - log_debugee_location("commandLoop(): command being handled", NULL, NULL, 0); - handleCommand(jni_env, command); + debugMonitorEnter(vmDeathLock); + commandLoopEnteredVmDeathLock = JNI_TRUE; + if (!gdata->vmDead) { + log_debugee_location("commandLoop(): command being handled", NULL, NULL, 0); + handleCommand(jni_env, command); + } completeCommand(command); + debugMonitorExit(vmDeathLock); + commandLoopEnteredVmDeathLock = JNI_FALSE; /* if we just finished a suspend-all cmd, then we block here */ if (doBlock) { doBlockCommandLoop(); @@ -725,10 +737,11 @@ eventHelper_initialize(jbyte sessionID) commandQueueLock = debugMonitorCreate("JDWP Event Helper Queue Monitor"); commandCompleteLock = debugMonitorCreate("JDWP Event Helper Completion Monitor"); blockCommandLoopLock = debugMonitorCreate("JDWP Event Block CommandLoop Monitor"); + vmDeathLock = debugMonitorCreate("JDWP VM_DEATH CommandLoop Monitor"); /* Start the event handler thread */ func = &commandLoop; - (void)spawnNewThread(func, NULL, "JDWP Event Helper Thread"); + (void)spawnNewThread(func, NULL, COMMAND_LOOP_THREAD_NAME); } void @@ -759,6 +772,42 @@ eventHelper_unlock(void) debugMonitorExit(commandQueueLock); } +void commandLoop_exitVmDeathLockOnError() +{ + const char* MSG_BASE = "exitVmDeathLockOnError: error in JVMTI %s: %d\n"; + jthread cur_thread = NULL; + jvmtiThreadInfo thread_info; + jvmtiError err = JVMTI_ERROR_NONE; + + err = JVMTI_FUNC_PTR(gdata->jvmti, GetCurrentThread) + (gdata->jvmti, &cur_thread); + if (err != JVMTI_ERROR_NONE) { + LOG_ERROR((MSG_BASE, "GetCurrentThread", err)); + return; + } + + err = JVMTI_FUNC_PTR(gdata->jvmti, GetThreadInfo) + (gdata->jvmti, cur_thread, &thread_info); + if (err != JVMTI_ERROR_NONE) { + LOG_ERROR((MSG_BASE, "GetThreadInfo", err)); + return; + } + if (strcmp(thread_info.name, COMMAND_LOOP_THREAD_NAME) != 0) { + return; + } + if (commandLoopEnteredVmDeathLock == JNI_TRUE) { + debugMonitorExit(vmDeathLock); + commandLoopEnteredVmDeathLock = JNI_FALSE; + } +} + +void +commandLoop_sync(void) +{ + debugMonitorEnter(vmDeathLock); + debugMonitorExit(vmDeathLock); +} + /* Change all references to global in the EventInfo struct */ static void saveEventInfoRefs(JNIEnv *env, EventInfo *evinfo) diff --git a/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.h b/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.h index fcc4e86f337..8387cb0f3da 100644 --- a/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.h +++ b/src/jdk.jdwp.agent/share/native/libjdwp/eventHelper.h @@ -1,5 +1,5 @@ /* - * Copyright (c) 1998, 2004, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1998, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -54,6 +54,9 @@ void eventHelper_releaseEvents(void); void eventHelper_lock(void); void eventHelper_unlock(void); +void commandLoop_sync(void); /* commandLoop sync with cbVMDeath */ +void commandLoop_exitVmDeathLockOnError(void); + /* * Private interface for coordinating between eventHelper.c: commandLoop() * and ThreadReferenceImpl.c: resume() and VirtualMachineImpl.c: resume(). From 1af1d42ac426276fdfe88f14e5369e58feab700d Mon Sep 17 00:00:00 2001 From: Patric Hedlin Date: Fri, 29 Sep 2017 10:40:49 +0200 Subject: [PATCH 46/80] 8011352: C1: TraceCodeBlobStacks crashes fastdebug Solaris SPARC Handle null correctly Reviewed-by: roland, dlong, rbackman --- src/hotspot/cpu/sparc/frame_sparc.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/hotspot/cpu/sparc/frame_sparc.cpp b/src/hotspot/cpu/sparc/frame_sparc.cpp index 4fa7e6a973b..3985a875c34 100644 --- a/src/hotspot/cpu/sparc/frame_sparc.cpp +++ b/src/hotspot/cpu/sparc/frame_sparc.cpp @@ -119,8 +119,8 @@ address RegisterMap::pd_location(VMReg regname) const { reg = regname->as_Register(); } if (reg->is_out()) { - assert(_younger_window != NULL, "Younger window should be available"); - return second_word + (address)&_younger_window[reg->after_save()->sp_offset_in_saved_window()]; + return _younger_window == NULL ? NULL : + second_word + (address)&_younger_window[reg->after_save()->sp_offset_in_saved_window()]; } if (reg->is_local() || reg->is_in()) { assert(_window != NULL, "Window should be available"); From b125aebb91bd2fcd19aaf440c99ef61743a289b2 Mon Sep 17 00:00:00 2001 From: Patric Hedlin Date: Fri, 29 Sep 2017 10:40:54 +0200 Subject: [PATCH 47/80] 8167199: Add C2 SPARC intrinsic for BigInteger::multiplyToLen() method Preliminary support for intrinsic multiplyToLen, including generalised version based on 'mpmul' instruction (when available). Reviewed-by: kvn, neliasso --- src/hotspot/cpu/sparc/assembler_sparc.hpp | 48 +- .../cpu/sparc/assembler_sparc.inline.hpp | 66 +- src/hotspot/cpu/sparc/globals_sparc.hpp | 5 +- .../cpu/sparc/macroAssembler_sparc.cpp | 26 +- .../cpu/sparc/macroAssembler_sparc.hpp | 17 +- .../cpu/sparc/macroAssembler_sparc.inline.hpp | 2 +- src/hotspot/cpu/sparc/register_sparc.hpp | 8 +- src/hotspot/cpu/sparc/stubGenerator_sparc.cpp | 778 +++++++++++++++++- src/hotspot/cpu/sparc/stubRoutines_sparc.hpp | 2 +- src/hotspot/cpu/sparc/vm_version_sparc.cpp | 19 + 10 files changed, 912 insertions(+), 59 deletions(-) diff --git a/src/hotspot/cpu/sparc/assembler_sparc.hpp b/src/hotspot/cpu/sparc/assembler_sparc.hpp index 69822951928..c3f1ddddbfe 100644 --- a/src/hotspot/cpu/sparc/assembler_sparc.hpp +++ b/src/hotspot/cpu/sparc/assembler_sparc.hpp @@ -122,6 +122,7 @@ class Assembler : public AbstractAssembler { fpop1_op3 = 0x34, fpop2_op3 = 0x35, impdep1_op3 = 0x36, + addx_op3 = 0x36, aes3_op3 = 0x36, sha_op3 = 0x36, bmask_op3 = 0x36, @@ -133,6 +134,8 @@ class Assembler : public AbstractAssembler { fzero_op3 = 0x36, fsrc_op3 = 0x36, fnot_op3 = 0x36, + mpmul_op3 = 0x36, + umulx_op3 = 0x36, xmulx_op3 = 0x36, crc32c_op3 = 0x36, impdep2_op3 = 0x37, @@ -195,6 +198,9 @@ class Assembler : public AbstractAssembler { fnegs_opf = 0x05, fnegd_opf = 0x06, + addxc_opf = 0x11, + addxccc_opf = 0x13, + umulxhi_opf = 0x16, alignaddr_opf = 0x18, bmask_opf = 0x19, @@ -240,7 +246,8 @@ class Assembler : public AbstractAssembler { sha256_opf = 0x142, sha512_opf = 0x143, - crc32c_opf = 0x147 + crc32c_opf = 0x147, + mpmul_opf = 0x148 }; enum op5s { @@ -380,7 +387,7 @@ class Assembler : public AbstractAssembler { assert_signed_range(x, nbits + 2); } - static void assert_unsigned_const(int x, int nbits) { + static void assert_unsigned_range(int x, int nbits) { assert(juint(x) < juint(1 << nbits), "unsigned constant out of range"); } @@ -534,6 +541,12 @@ class Assembler : public AbstractAssembler { return x & ((1 << nbits) - 1); } + // unsigned immediate, in low bits, at most nbits long. + static int uimm(int x, int nbits) { + assert_unsigned_range(x, nbits); + return x & ((1 << nbits) - 1); + } + // compute inverse of wdisp16 static intptr_t inv_wdisp16(int x, intptr_t pos) { int lo = x & ((1 << 14) - 1); @@ -631,6 +644,9 @@ class Assembler : public AbstractAssembler { // FMAf instructions supported only on certain processors static void fmaf_only() { assert(VM_Version::has_fmaf(), "This instruction only works on SPARC with FMAf"); } + // MPMUL instruction supported only on certain processors + static void mpmul_only() { assert( VM_Version::has_mpmul(), "This instruction only works on SPARC with MPMUL"); } + // instruction only in VIS1 static void vis1_only() { assert(VM_Version::has_vis1(), "This instruction only works on SPARC with VIS1"); } @@ -772,11 +788,12 @@ class Assembler : public AbstractAssembler { AbstractAssembler::flush(); } - inline void emit_int32(int); // shadows AbstractAssembler::emit_int32 - inline void emit_data(int); - inline void emit_data(int, RelocationHolder const &rspec); - inline void emit_data(int, relocInfo::relocType rtype); - // helper for above functions + inline void emit_int32(int32_t); // shadows AbstractAssembler::emit_int32 + inline void emit_data(int32_t); + inline void emit_data(int32_t, RelocationHolder const&); + inline void emit_data(int32_t, relocInfo::relocType rtype); + + // Helper for the above functions. inline void check_delay(); @@ -960,6 +977,8 @@ class Assembler : public AbstractAssembler { inline void ldf(FloatRegisterImpl::Width w, Register s1, int simm13a, FloatRegister d, RelocationHolder const &rspec = RelocationHolder()); + inline void ldd(Register s1, Register s2, FloatRegister d); + inline void ldd(Register s1, int simm13a, FloatRegister d); inline void ldfsr(Register s1, Register s2); inline void ldfsr(Register s1, int simm13a); @@ -987,8 +1006,6 @@ class Assembler : public AbstractAssembler { inline void lduw(Register s1, int simm13a, Register d); inline void ldx(Register s1, Register s2, Register d); inline void ldx(Register s1, int simm13a, Register d); - inline void ldd(Register s1, Register s2, Register d); - inline void ldd(Register s1, int simm13a, Register d); // pp 177 @@ -1157,6 +1174,9 @@ class Assembler : public AbstractAssembler { inline void stf(FloatRegisterImpl::Width w, FloatRegister d, Register s1, Register s2); inline void stf(FloatRegisterImpl::Width w, FloatRegister d, Register s1, int simm13a); + inline void std(FloatRegister d, Register s1, Register s2); + inline void std(FloatRegister d, Register s1, int simm13a); + inline void stfsr(Register s1, Register s2); inline void stfsr(Register s1, int simm13a); inline void stxfsr(Register s1, Register s2); @@ -1177,8 +1197,6 @@ class Assembler : public AbstractAssembler { inline void stw(Register d, Register s1, int simm13a); inline void stx(Register d, Register s1, Register s2); inline void stx(Register d, Register s1, int simm13a); - inline void std(Register d, Register s1, Register s2); - inline void std(Register d, Register s1, int simm13a); // pp 177 @@ -1267,6 +1285,9 @@ class Assembler : public AbstractAssembler { // VIS3 instructions + inline void addxc(Register s1, Register s2, Register d); + inline void addxccc(Register s1, Register s2, Register d); + inline void movstosw(FloatRegister s, Register d); inline void movstouw(FloatRegister s, Register d); inline void movdtox(FloatRegister s, Register d); @@ -1276,6 +1297,7 @@ class Assembler : public AbstractAssembler { inline void xmulx(Register s1, Register s2, Register d); inline void xmulxhi(Register s1, Register s2, Register d); + inline void umulxhi(Register s1, Register s2, Register d); // Crypto SHA instructions @@ -1287,6 +1309,10 @@ class Assembler : public AbstractAssembler { inline void crc32c(FloatRegister s1, FloatRegister s2, FloatRegister d); + // MPMUL instruction + + inline void mpmul(int uimm5); + // Creation Assembler(CodeBuffer* code) : AbstractAssembler(code) { #ifdef VALIDATE_PIPELINE diff --git a/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp b/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp index 070a1f80db3..7a87f0c3387 100644 --- a/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp +++ b/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp @@ -59,7 +59,7 @@ inline void Assembler::check_delay() { #endif } -inline void Assembler::emit_int32(int x) { +inline void Assembler::emit_int32(int32_t x) { check_delay(); #ifdef VALIDATE_PIPELINE _hazard_state = NoHazard; @@ -67,16 +67,16 @@ inline void Assembler::emit_int32(int x) { AbstractAssembler::emit_int32(x); } -inline void Assembler::emit_data(int x) { +inline void Assembler::emit_data(int32_t x) { emit_int32(x); } -inline void Assembler::emit_data(int x, relocInfo::relocType rtype) { +inline void Assembler::emit_data(int32_t x, relocInfo::relocType rtype) { relocate(rtype); emit_int32(x); } -inline void Assembler::emit_data(int x, RelocationHolder const &rspec) { +inline void Assembler::emit_data(int32_t x, RelocationHolder const &rspec) { relocate(rspec); emit_int32(x); } @@ -402,6 +402,15 @@ inline void Assembler::ldf(FloatRegisterImpl::Width w, Register s1, int simm13a, emit_data(op(ldst_op) | fd(d, w) | alt_op3(ldf_op3, w) | rs1(s1) | immed(true) | simm(simm13a, 13), rspec); } +inline void Assembler::ldd(Register s1, Register s2, FloatRegister d) { + assert(d->is_even(), "not even"); + ldf(FloatRegisterImpl::D, s1, s2, d); +} +inline void Assembler::ldd(Register s1, int simm13a, FloatRegister d) { + assert(d->is_even(), "not even"); + ldf(FloatRegisterImpl::D, s1, simm13a, d); +} + inline void Assembler::ldxfsr(Register s1, Register s2) { emit_int32(op(ldst_op) | rd(G1) | op3(ldfsr_op3) | rs1(s1) | rs2(s2)); } @@ -460,16 +469,6 @@ inline void Assembler::ldx(Register s1, Register s2, Register d) { inline void Assembler::ldx(Register s1, int simm13a, Register d) { emit_data(op(ldst_op) | rd(d) | op3(ldx_op3) | rs1(s1) | immed(true) | simm(simm13a, 13)); } -inline void Assembler::ldd(Register s1, Register s2, Register d) { - v9_dep(); - assert(d->is_even(), "not even"); - emit_int32(op(ldst_op) | rd(d) | op3(ldd_op3) | rs1(s1) | rs2(s2)); -} -inline void Assembler::ldd(Register s1, int simm13a, Register d) { - v9_dep(); - assert(d->is_even(), "not even"); - emit_data(op(ldst_op) | rd(d) | op3(ldd_op3) | rs1(s1) | immed(true) | simm(simm13a, 13)); -} inline void Assembler::ldsba(Register s1, Register s2, int ia, Register d) { emit_int32(op(ldst_op) | rd(d) | op3(ldsb_op3 | alt_bit_op3) | rs1(s1) | imm_asi(ia) | rs2(s2)); @@ -806,6 +805,15 @@ inline void Assembler::stf(FloatRegisterImpl::Width w, FloatRegister d, Register emit_data(op(ldst_op) | fd(d, w) | alt_op3(stf_op3, w) | rs1(s1) | immed(true) | simm(simm13a, 13)); } +inline void Assembler::std(FloatRegister d, Register s1, Register s2) { + assert(d->is_even(), "not even"); + stf(FloatRegisterImpl::D, d, s1, s2); +} +inline void Assembler::std(FloatRegister d, Register s1, int simm13a) { + assert(d->is_even(), "not even"); + stf(FloatRegisterImpl::D, d, s1, simm13a); +} + inline void Assembler::stxfsr(Register s1, Register s2) { emit_int32(op(ldst_op) | rd(G1) | op3(stfsr_op3) | rs1(s1) | rs2(s2)); } @@ -848,16 +856,6 @@ inline void Assembler::stx(Register d, Register s1, Register s2) { inline void Assembler::stx(Register d, Register s1, int simm13a) { emit_data(op(ldst_op) | rd(d) | op3(stx_op3) | rs1(s1) | immed(true) | simm(simm13a, 13)); } -inline void Assembler::std(Register d, Register s1, Register s2) { - v9_dep(); - assert(d->is_even(), "not even"); - emit_int32(op(ldst_op) | rd(d) | op3(std_op3) | rs1(s1) | rs2(s2)); -} -inline void Assembler::std(Register d, Register s1, int simm13a) { - v9_dep(); - assert(d->is_even(), "not even"); - emit_data(op(ldst_op) | rd(d) | op3(std_op3) | rs1(s1) | immed(true) | simm(simm13a, 13)); -} inline void Assembler::stba(Register d, Register s1, Register s2, int ia) { emit_int32(op(ldst_op) | rd(d) | op3(stb_op3 | alt_bit_op3) | rs1(s1) | imm_asi(ia) | rs2(s2)); @@ -1043,6 +1041,15 @@ inline void Assembler::bshuffle(FloatRegister s1, FloatRegister s2, FloatRegiste // VIS3 instructions +inline void Assembler::addxc(Register s1, Register s2, Register d) { + vis3_only(); + emit_int32(op(arith_op) | rd(d) | op3(addx_op3) | rs1(s1) | opf(addxc_opf) | rs2(s2)); +} +inline void Assembler::addxccc(Register s1, Register s2, Register d) { + vis3_only(); + emit_int32(op(arith_op) | rd(d) | op3(addx_op3) | rs1(s1) | opf(addxccc_opf) | rs2(s2)); +} + inline void Assembler::movstosw(FloatRegister s, Register d) { vis3_only(); emit_int32(op(arith_op) | rd(d) | op3(mftoi_op3) | opf(mstosw_opf) | fs2(s, FloatRegisterImpl::S)); @@ -1073,6 +1080,10 @@ inline void Assembler::xmulxhi(Register s1, Register s2, Register d) { vis3_only(); emit_int32(op(arith_op) | rd(d) | op3(xmulx_op3) | rs1(s1) | opf(xmulxhi_opf) | rs2(s2)); } +inline void Assembler::umulxhi(Register s1, Register s2, Register d) { + vis3_only(); + emit_int32(op(arith_op) | rd(d) | op3(umulx_op3) | rs1(s1) | opf(umulxhi_opf) | rs2(s2)); +} // Crypto SHA instructions @@ -1096,4 +1107,11 @@ inline void Assembler::crc32c(FloatRegister s1, FloatRegister s2, FloatRegister emit_int32(op(arith_op) | fd(d, FloatRegisterImpl::D) | op3(crc32c_op3) | fs1(s1, FloatRegisterImpl::D) | opf(crc32c_opf) | fs2(s2, FloatRegisterImpl::D)); } +// MPMUL instruction + +inline void Assembler::mpmul(int uimm5) { + mpmul_only(); + emit_int32(op(arith_op) | rd(0) | op3(mpmul_op3) | rs1(0) | opf(mpmul_opf) | uimm(uimm5, 5)); +} + #endif // CPU_SPARC_VM_ASSEMBLER_SPARC_INLINE_HPP diff --git a/src/hotspot/cpu/sparc/globals_sparc.hpp b/src/hotspot/cpu/sparc/globals_sparc.hpp index 89361fcddbd..a232649f957 100644 --- a/src/hotspot/cpu/sparc/globals_sparc.hpp +++ b/src/hotspot/cpu/sparc/globals_sparc.hpp @@ -97,12 +97,15 @@ define_pd_global(intx, InitArrayShortSize, 8*BytesPerLong); writeable) \ \ product(intx, UseVIS, 99, \ - "Highest supported VIS instructions set on Sparc") \ + "Highest supported VIS instructions set on SPARC") \ range(0, 99) \ \ product(bool, UseCBCond, false, \ "Use compare and branch instruction on SPARC") \ \ + product(bool, UseMPMUL, false, \ + "Use multi-precision multiply instruction (mpmul) on SPARC") \ + \ product(bool, UseBlockZeroing, false, \ "Use special cpu instructions for block zeroing") \ \ diff --git a/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp b/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp index b667f1b1103..52d7d8c2fb3 100644 --- a/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp +++ b/src/hotspot/cpu/sparc/macroAssembler_sparc.cpp @@ -1574,29 +1574,39 @@ void MacroAssembler::br_null_short(Register s1, Predict p, Label& L) { assert_not_delayed(); if (use_cbcond(L)) { Assembler::cbcond(zero, ptr_cc, s1, 0, L); - return; + } else { + br_null(s1, false, p, L); + delayed()->nop(); } - br_null(s1, false, p, L); - delayed()->nop(); } void MacroAssembler::br_notnull_short(Register s1, Predict p, Label& L) { assert_not_delayed(); if (use_cbcond(L)) { Assembler::cbcond(notZero, ptr_cc, s1, 0, L); - return; + } else { + br_notnull(s1, false, p, L); + delayed()->nop(); } - br_notnull(s1, false, p, L); - delayed()->nop(); } // Unconditional short branch void MacroAssembler::ba_short(Label& L) { + assert_not_delayed(); if (use_cbcond(L)) { Assembler::cbcond(equal, icc, G0, G0, L); - return; + } else { + br(always, false, pt, L); + delayed()->nop(); } - br(always, false, pt, L); +} + +// Branch if 'icc' says zero or not (i.e. icc.z == 1|0). + +void MacroAssembler::br_icc_zero(bool iszero, Predict p, Label &L) { + assert_not_delayed(); + Condition cf = (iszero ? Assembler::zero : Assembler::notZero); + br(cf, false, p, L); delayed()->nop(); } diff --git a/src/hotspot/cpu/sparc/macroAssembler_sparc.hpp b/src/hotspot/cpu/sparc/macroAssembler_sparc.hpp index 4f24d0354ee..db1ebf1ead8 100644 --- a/src/hotspot/cpu/sparc/macroAssembler_sparc.hpp +++ b/src/hotspot/cpu/sparc/macroAssembler_sparc.hpp @@ -606,7 +606,7 @@ class MacroAssembler : public Assembler { // offset. No explicit code generation is needed if the offset is within a certain // range (0 <= offset <= page_size). // - // %%%%%% Currently not done for SPARC + // FIXME: Currently not done for SPARC void null_check(Register reg, int offset = -1); static bool needs_explicit_null_check(intptr_t offset); @@ -648,6 +648,9 @@ class MacroAssembler : public Assembler { // unconditional short branch void ba_short(Label& L); + // Branch on icc.z (true or not). + void br_icc_zero(bool iszero, Predict p, Label &L); + inline void bp( Condition c, bool a, CC cc, Predict p, address d, relocInfo::relocType rt = relocInfo::none ); inline void bp( Condition c, bool a, CC cc, Predict p, Label& L ); @@ -663,19 +666,19 @@ class MacroAssembler : public Assembler { inline void fbp( Condition c, bool a, CC cc, Predict p, Label& L ); // Sparc shorthands(pp 85, V8 manual, pp 289 V9 manual) - inline void cmp( Register s1, Register s2 ); - inline void cmp( Register s1, int simm13a ); + inline void cmp( Register s1, Register s2 ); + inline void cmp( Register s1, int simm13a ); inline void jmp( Register s1, Register s2 ); inline void jmp( Register s1, int simm13a, RelocationHolder const& rspec = RelocationHolder() ); // Check if the call target is out of wdisp30 range (relative to the code cache) static inline bool is_far_target(address d); - inline void call( address d, relocInfo::relocType rt = relocInfo::runtime_call_type ); - inline void call( address d, RelocationHolder const& rspec); + inline void call( address d, relocInfo::relocType rt = relocInfo::runtime_call_type ); + inline void call( address d, RelocationHolder const& rspec); - inline void call( Label& L, relocInfo::relocType rt = relocInfo::runtime_call_type ); - inline void call( Label& L, RelocationHolder const& rspec); + inline void call( Label& L, relocInfo::relocType rt = relocInfo::runtime_call_type ); + inline void call( Label& L, RelocationHolder const& rspec); inline void callr( Register s1, Register s2 ); inline void callr( Register s1, int simm13a, RelocationHolder const& rspec = RelocationHolder() ); diff --git a/src/hotspot/cpu/sparc/macroAssembler_sparc.inline.hpp b/src/hotspot/cpu/sparc/macroAssembler_sparc.inline.hpp index 679bbd30c29..16871d98629 100644 --- a/src/hotspot/cpu/sparc/macroAssembler_sparc.inline.hpp +++ b/src/hotspot/cpu/sparc/macroAssembler_sparc.inline.hpp @@ -185,7 +185,7 @@ inline void MacroAssembler::br( Condition c, bool a, Predict p, address d, reloc } inline void MacroAssembler::br( Condition c, bool a, Predict p, Label& L ) { - // See note[+] on 'avoid_pipeline_stalls()', in "assembler_sparc.inline.hpp". + // See note[+] on 'avoid_pipeline_stall()', in "assembler_sparc.inline.hpp". avoid_pipeline_stall(); br(c, a, p, target(L)); } diff --git a/src/hotspot/cpu/sparc/register_sparc.hpp b/src/hotspot/cpu/sparc/register_sparc.hpp index 22cb0283825..5682b622d9c 100644 --- a/src/hotspot/cpu/sparc/register_sparc.hpp +++ b/src/hotspot/cpu/sparc/register_sparc.hpp @@ -236,7 +236,7 @@ class FloatRegisterImpl: public AbstractRegisterImpl { inline VMReg as_VMReg( ); // accessors - int encoding() const { assert(is_valid(), "invalid register"); return value(); } + int encoding() const { assert(is_valid(), "invalid register"); return value(); } public: int encoding(Width w) const { @@ -258,10 +258,12 @@ class FloatRegisterImpl: public AbstractRegisterImpl { return -1; } - bool is_valid() const { return 0 <= value() && value() < number_of_registers; } + bool is_valid() const { return 0 <= value() && value() < number_of_registers; } + bool is_even() const { return (encoding() & 1) == 0; } + const char* name() const; - FloatRegister successor() const { return as_FloatRegister(encoding() + 1); } + FloatRegister successor() const { return as_FloatRegister(encoding() + 1); } }; diff --git a/src/hotspot/cpu/sparc/stubGenerator_sparc.cpp b/src/hotspot/cpu/sparc/stubGenerator_sparc.cpp index 9c4713e936d..351555dbe51 100644 --- a/src/hotspot/cpu/sparc/stubGenerator_sparc.cpp +++ b/src/hotspot/cpu/sparc/stubGenerator_sparc.cpp @@ -58,7 +58,6 @@ // Note: The register L7 is used as L7_thread_cache, and may not be used // any other way within this module. - static const Register& Lstub_temp = L2; // ------------------------------------------------------------------------------------------------------------------------- @@ -4943,7 +4942,7 @@ class StubGenerator: public StubCodeGenerator { return start; } -/** + /** * Arguments: * * Inputs: @@ -4975,6 +4974,773 @@ class StubGenerator: public StubCodeGenerator { return start; } + /** + * Arguments: + * + * Inputs: + * I0 - int* x-addr + * I1 - int x-len + * I2 - int* y-addr + * I3 - int y-len + * I4 - int* z-addr (output vector) + * I5 - int z-len + */ + address generate_multiplyToLen() { + assert(UseMultiplyToLenIntrinsic, "need VIS3 instructions"); + + __ align(CodeEntryAlignment); + StubCodeMark mark(this, "StubRoutines", "multiplyToLen"); + address start = __ pc(); + + __ save_frame(0); + + const Register xptr = I0; // input address + const Register xlen = I1; // ...and length in 32b-words + const Register yptr = I2; // + const Register ylen = I3; // + const Register zptr = I4; // output address + const Register zlen = I5; // ...and length in 32b-words + + /* The minimal "limb" representation suggest that odd length vectors are as + * likely as even length dittos. This in turn suggests that we need to cope + * with odd/even length arrays and data not aligned properly for 64-bit read + * and write operations. We thus use a number of different kernels: + * + * if (is_even(x.len) && is_even(y.len)) + * if (is_align64(x) && is_align64(y) && is_align64(z)) + * if (x.len == y.len && 16 <= x.len && x.len <= 64) + * memv_mult_mpmul(...) + * else + * memv_mult_64x64(...) + * else + * memv_mult_64x64u(...) + * else + * memv_mult_32x32(...) + * + * Here we assume VIS3 support (for 'umulxhi', 'addxc' and 'addxccc'). + * In case CBCOND instructions are supported, we will use 'cxbX'. If the + * MPMUL instruction is supported, we will generate a kernel using 'mpmul' + * (for vectors with proper characteristics). + */ + const Register tmp0 = L0; + const Register tmp1 = L1; + + Label L_mult_32x32; + Label L_mult_64x64u; + Label L_mult_64x64; + Label L_exit; + + if_both_even(xlen, ylen, tmp0, false, L_mult_32x32); + if_all3_aligned(xptr, yptr, zptr, tmp1, 64, false, L_mult_64x64u); + + if (UseMPMUL) { + if_eq(xlen, ylen, false, L_mult_64x64); + if_in_rng(xlen, 16, 64, tmp0, tmp1, false, L_mult_64x64); + + // 1. Multiply naturally aligned 64b-datums using a generic 'mpmul' kernel, + // operating on equal length vectors of size [16..64]. + gen_mult_mpmul(xlen, xptr, yptr, zptr, L_exit); + } + + // 2. Multiply naturally aligned 64-bit datums (64x64). + __ bind(L_mult_64x64); + gen_mult_64x64(xptr, xlen, yptr, ylen, zptr, zlen, L_exit); + + // 3. Multiply unaligned 64-bit datums (64x64). + __ bind(L_mult_64x64u); + gen_mult_64x64_unaligned(xptr, xlen, yptr, ylen, zptr, zlen, L_exit); + + // 4. Multiply naturally aligned 32-bit datums (32x32). + __ bind(L_mult_32x32); + gen_mult_32x32(xptr, xlen, yptr, ylen, zptr, zlen, L_exit); + + __ bind(L_exit); + __ ret(); + __ delayed()->restore(); + + return start; + } + + // Additional help functions used by multiplyToLen generation. + + void if_both_even(Register r1, Register r2, Register tmp, bool iseven, Label &L) + { + __ or3(r1, r2, tmp); + __ andcc(tmp, 0x1, tmp); + __ br_icc_zero(iseven, Assembler::pn, L); + } + + void if_all3_aligned(Register r1, Register r2, Register r3, + Register tmp, uint align, bool isalign, Label &L) + { + __ or3(r1, r2, tmp); + __ or3(r3, tmp, tmp); + __ andcc(tmp, (align - 1), tmp); + __ br_icc_zero(isalign, Assembler::pn, L); + } + + void if_eq(Register x, Register y, bool iseq, Label &L) + { + Assembler::Condition cf = (iseq ? Assembler::equal : Assembler::notEqual); + __ cmp_and_br_short(x, y, cf, Assembler::pt, L); + } + + void if_in_rng(Register x, int lb, int ub, Register t1, Register t2, bool inrng, Label &L) + { + assert(Assembler::is_simm13(lb), "Small ints only!"); + assert(Assembler::is_simm13(ub), "Small ints only!"); + // Compute (x - lb) * (ub - x) >= 0 + // NOTE: With the local use of this routine, we rely on small integers to + // guarantee that we do not overflow in the multiplication. + __ add(G0, ub, t2); + __ sub(x, lb, t1); + __ sub(t2, x, t2); + __ mulx(t1, t2, t1); + Assembler::Condition cf = (inrng ? Assembler::greaterEqual : Assembler::less); + __ cmp_and_br_short(t1, G0, cf, Assembler::pt, L); + } + + void ldd_entry(Register base, Register offs, FloatRegister dest) + { + __ ldd(base, offs, dest); + __ inc(offs, 8); + } + + void ldx_entry(Register base, Register offs, Register dest) + { + __ ldx(base, offs, dest); + __ inc(offs, 8); + } + + void mpmul_entry(int m, Label &next) + { + __ mpmul(m); + __ cbcond(Assembler::equal, Assembler::icc, G0, G0, next); + } + + void stx_entry(Label &L, Register r1, Register r2, Register base, Register offs) + { + __ bind(L); + __ stx(r1, base, offs); + __ inc(offs, 8); + __ stx(r2, base, offs); + __ inc(offs, 8); + } + + void offs_entry(Label &Lbl0, Label &Lbl1) + { + assert(Lbl0.is_bound(), "must be"); + assert(Lbl1.is_bound(), "must be"); + + int offset = Lbl0.loc_pos() - Lbl1.loc_pos(); + + __ emit_data(offset); + } + + /* Generate the actual multiplication kernels for BigInteger vectors: + * + * 1. gen_mult_mpmul(...) + * + * 2. gen_mult_64x64(...) + * + * 3. gen_mult_64x64_unaligned(...) + * + * 4. gen_mult_32x32(...) + */ + void gen_mult_mpmul(Register len, Register xptr, Register yptr, Register zptr, + Label &L_exit) + { + const Register zero = G0; + const Register gxp = G1; // Need to use global registers across RWs. + const Register gyp = G2; + const Register gzp = G3; + const Register offs = G4; + const Register disp = G5; + + __ mov(xptr, gxp); + __ mov(yptr, gyp); + __ mov(zptr, gzp); + + /* Compute jump vector entry: + * + * 1. mpmul input size (0..31) x 64b + * 2. vector input size in 32b limbs (even number) + * 3. branch entries in reverse order (31..0), using two + * instructions per entry (2 * 4 bytes). + * + * displacement = byte_offset(bra_offset(len)) + * = byte_offset((64 - len)/2) + * = 8 * (64 - len)/2 + * = 4 * (64 - len) + */ + Register temp = I5; // Alright to use input regs. in first batch. + + __ sub(zero, len, temp); + __ add(temp, 64, temp); + __ sllx(temp, 2, disp); // disp := (64 - len) << 2 + + // Dispatch relative current PC, into instruction table below. + __ rdpc(temp); + __ add(temp, 16, temp); + __ jmp(temp, disp); + __ delayed()->clr(offs); + + ldd_entry(gxp, offs, F22); + ldd_entry(gxp, offs, F20); + ldd_entry(gxp, offs, F18); + ldd_entry(gxp, offs, F16); + ldd_entry(gxp, offs, F14); + ldd_entry(gxp, offs, F12); + ldd_entry(gxp, offs, F10); + ldd_entry(gxp, offs, F8); + ldd_entry(gxp, offs, F6); + ldd_entry(gxp, offs, F4); + ldx_entry(gxp, offs, I5); + ldx_entry(gxp, offs, I4); + ldx_entry(gxp, offs, I3); + ldx_entry(gxp, offs, I2); + ldx_entry(gxp, offs, I1); + ldx_entry(gxp, offs, I0); + ldx_entry(gxp, offs, L7); + ldx_entry(gxp, offs, L6); + ldx_entry(gxp, offs, L5); + ldx_entry(gxp, offs, L4); + ldx_entry(gxp, offs, L3); + ldx_entry(gxp, offs, L2); + ldx_entry(gxp, offs, L1); + ldx_entry(gxp, offs, L0); + ldd_entry(gxp, offs, F2); + ldd_entry(gxp, offs, F0); + ldx_entry(gxp, offs, O5); + ldx_entry(gxp, offs, O4); + ldx_entry(gxp, offs, O3); + ldx_entry(gxp, offs, O2); + ldx_entry(gxp, offs, O1); + ldx_entry(gxp, offs, O0); + + __ save(SP, -176, SP); + + const Register addr = gxp; // Alright to reuse 'gxp'. + + // Dispatch relative current PC, into instruction table below. + __ rdpc(addr); + __ add(addr, 16, addr); + __ jmp(addr, disp); + __ delayed()->clr(offs); + + ldd_entry(gyp, offs, F58); + ldd_entry(gyp, offs, F56); + ldd_entry(gyp, offs, F54); + ldd_entry(gyp, offs, F52); + ldd_entry(gyp, offs, F50); + ldd_entry(gyp, offs, F48); + ldd_entry(gyp, offs, F46); + ldd_entry(gyp, offs, F44); + ldd_entry(gyp, offs, F42); + ldd_entry(gyp, offs, F40); + ldd_entry(gyp, offs, F38); + ldd_entry(gyp, offs, F36); + ldd_entry(gyp, offs, F34); + ldd_entry(gyp, offs, F32); + ldd_entry(gyp, offs, F30); + ldd_entry(gyp, offs, F28); + ldd_entry(gyp, offs, F26); + ldd_entry(gyp, offs, F24); + ldx_entry(gyp, offs, O5); + ldx_entry(gyp, offs, O4); + ldx_entry(gyp, offs, O3); + ldx_entry(gyp, offs, O2); + ldx_entry(gyp, offs, O1); + ldx_entry(gyp, offs, O0); + ldx_entry(gyp, offs, L7); + ldx_entry(gyp, offs, L6); + ldx_entry(gyp, offs, L5); + ldx_entry(gyp, offs, L4); + ldx_entry(gyp, offs, L3); + ldx_entry(gyp, offs, L2); + ldx_entry(gyp, offs, L1); + ldx_entry(gyp, offs, L0); + + __ save(SP, -176, SP); + __ save(SP, -176, SP); + __ save(SP, -176, SP); + __ save(SP, -176, SP); + __ save(SP, -176, SP); + + Label L_mpmul_restore_4, L_mpmul_restore_3, L_mpmul_restore_2; + Label L_mpmul_restore_1, L_mpmul_restore_0; + + // Dispatch relative current PC, into instruction table below. + __ rdpc(addr); + __ add(addr, 16, addr); + __ jmp(addr, disp); + __ delayed()->clr(offs); + + mpmul_entry(31, L_mpmul_restore_0); + mpmul_entry(30, L_mpmul_restore_0); + mpmul_entry(29, L_mpmul_restore_0); + mpmul_entry(28, L_mpmul_restore_0); + mpmul_entry(27, L_mpmul_restore_1); + mpmul_entry(26, L_mpmul_restore_1); + mpmul_entry(25, L_mpmul_restore_1); + mpmul_entry(24, L_mpmul_restore_1); + mpmul_entry(23, L_mpmul_restore_1); + mpmul_entry(22, L_mpmul_restore_1); + mpmul_entry(21, L_mpmul_restore_1); + mpmul_entry(20, L_mpmul_restore_2); + mpmul_entry(19, L_mpmul_restore_2); + mpmul_entry(18, L_mpmul_restore_2); + mpmul_entry(17, L_mpmul_restore_2); + mpmul_entry(16, L_mpmul_restore_2); + mpmul_entry(15, L_mpmul_restore_2); + mpmul_entry(14, L_mpmul_restore_2); + mpmul_entry(13, L_mpmul_restore_3); + mpmul_entry(12, L_mpmul_restore_3); + mpmul_entry(11, L_mpmul_restore_3); + mpmul_entry(10, L_mpmul_restore_3); + mpmul_entry( 9, L_mpmul_restore_3); + mpmul_entry( 8, L_mpmul_restore_3); + mpmul_entry( 7, L_mpmul_restore_3); + mpmul_entry( 6, L_mpmul_restore_4); + mpmul_entry( 5, L_mpmul_restore_4); + mpmul_entry( 4, L_mpmul_restore_4); + mpmul_entry( 3, L_mpmul_restore_4); + mpmul_entry( 2, L_mpmul_restore_4); + mpmul_entry( 1, L_mpmul_restore_4); + mpmul_entry( 0, L_mpmul_restore_4); + + Label L_z31, L_z30, L_z29, L_z28, L_z27, L_z26, L_z25, L_z24; + Label L_z23, L_z22, L_z21, L_z20, L_z19, L_z18, L_z17, L_z16; + Label L_z15, L_z14, L_z13, L_z12, L_z11, L_z10, L_z09, L_z08; + Label L_z07, L_z06, L_z05, L_z04, L_z03, L_z02, L_z01, L_z00; + + Label L_zst_base; // Store sequence base address. + __ bind(L_zst_base); + + stx_entry(L_z31, L7, L6, gzp, offs); + stx_entry(L_z30, L5, L4, gzp, offs); + stx_entry(L_z29, L3, L2, gzp, offs); + stx_entry(L_z28, L1, L0, gzp, offs); + __ restore(); + stx_entry(L_z27, O5, O4, gzp, offs); + stx_entry(L_z26, O3, O2, gzp, offs); + stx_entry(L_z25, O1, O0, gzp, offs); + stx_entry(L_z24, L7, L6, gzp, offs); + stx_entry(L_z23, L5, L4, gzp, offs); + stx_entry(L_z22, L3, L2, gzp, offs); + stx_entry(L_z21, L1, L0, gzp, offs); + __ restore(); + stx_entry(L_z20, O5, O4, gzp, offs); + stx_entry(L_z19, O3, O2, gzp, offs); + stx_entry(L_z18, O1, O0, gzp, offs); + stx_entry(L_z17, L7, L6, gzp, offs); + stx_entry(L_z16, L5, L4, gzp, offs); + stx_entry(L_z15, L3, L2, gzp, offs); + stx_entry(L_z14, L1, L0, gzp, offs); + __ restore(); + stx_entry(L_z13, O5, O4, gzp, offs); + stx_entry(L_z12, O3, O2, gzp, offs); + stx_entry(L_z11, O1, O0, gzp, offs); + stx_entry(L_z10, L7, L6, gzp, offs); + stx_entry(L_z09, L5, L4, gzp, offs); + stx_entry(L_z08, L3, L2, gzp, offs); + stx_entry(L_z07, L1, L0, gzp, offs); + __ restore(); + stx_entry(L_z06, O5, O4, gzp, offs); + stx_entry(L_z05, O3, O2, gzp, offs); + stx_entry(L_z04, O1, O0, gzp, offs); + stx_entry(L_z03, L7, L6, gzp, offs); + stx_entry(L_z02, L5, L4, gzp, offs); + stx_entry(L_z01, L3, L2, gzp, offs); + stx_entry(L_z00, L1, L0, gzp, offs); + + __ restore(); + __ restore(); + // Exit out of 'mpmul' routine, back to multiplyToLen. + __ ba_short(L_exit); + + Label L_zst_offs; + __ bind(L_zst_offs); + + offs_entry(L_z31, L_zst_base); // index 31: 2048x2048 + offs_entry(L_z30, L_zst_base); + offs_entry(L_z29, L_zst_base); + offs_entry(L_z28, L_zst_base); + offs_entry(L_z27, L_zst_base); + offs_entry(L_z26, L_zst_base); + offs_entry(L_z25, L_zst_base); + offs_entry(L_z24, L_zst_base); + offs_entry(L_z23, L_zst_base); + offs_entry(L_z22, L_zst_base); + offs_entry(L_z21, L_zst_base); + offs_entry(L_z20, L_zst_base); + offs_entry(L_z19, L_zst_base); + offs_entry(L_z18, L_zst_base); + offs_entry(L_z17, L_zst_base); + offs_entry(L_z16, L_zst_base); + offs_entry(L_z15, L_zst_base); + offs_entry(L_z14, L_zst_base); + offs_entry(L_z13, L_zst_base); + offs_entry(L_z12, L_zst_base); + offs_entry(L_z11, L_zst_base); + offs_entry(L_z10, L_zst_base); + offs_entry(L_z09, L_zst_base); + offs_entry(L_z08, L_zst_base); + offs_entry(L_z07, L_zst_base); + offs_entry(L_z06, L_zst_base); + offs_entry(L_z05, L_zst_base); + offs_entry(L_z04, L_zst_base); + offs_entry(L_z03, L_zst_base); + offs_entry(L_z02, L_zst_base); + offs_entry(L_z01, L_zst_base); + offs_entry(L_z00, L_zst_base); // index 0: 64x64 + + __ bind(L_mpmul_restore_4); + __ restore(); + __ bind(L_mpmul_restore_3); + __ restore(); + __ bind(L_mpmul_restore_2); + __ restore(); + __ bind(L_mpmul_restore_1); + __ restore(); + __ bind(L_mpmul_restore_0); + + // Dispatch via offset vector entry, into z-store sequence. + Label L_zst_rdpc; + __ bind(L_zst_rdpc); + + assert(L_zst_base.is_bound(), "must be"); + assert(L_zst_offs.is_bound(), "must be"); + assert(L_zst_rdpc.is_bound(), "must be"); + + int dbase = L_zst_rdpc.loc_pos() - L_zst_base.loc_pos(); + int doffs = L_zst_rdpc.loc_pos() - L_zst_offs.loc_pos(); + + temp = gyp; // Alright to reuse 'gyp'. + + __ rdpc(addr); + __ sub(addr, doffs, temp); + __ srlx(disp, 1, disp); + __ lduw(temp, disp, offs); + __ sub(addr, dbase, temp); + __ jmp(temp, offs); + __ delayed()->clr(offs); + } + + void gen_mult_64x64(Register xp, Register xn, + Register yp, Register yn, + Register zp, Register zn, Label &L_exit) + { + // Assuming that a stack frame has already been created, i.e. local and + // output registers are available for immediate use. + + const Register ri = L0; // Outer loop index, xv[i] + const Register rj = L1; // Inner loop index, yv[j] + const Register rk = L2; // Output loop index, zv[k] + const Register rx = L4; // x-vector datum [i] + const Register ry = L5; // y-vector datum [j] + const Register rz = L6; // z-vector datum [k] + const Register rc = L7; // carry over (to z-vector datum [k-1]) + + const Register lop = O0; // lo-64b product + const Register hip = O1; // hi-64b product + + const Register zero = G0; + + Label L_loop_i, L_exit_loop_i; + Label L_loop_j; + Label L_loop_i2, L_exit_loop_i2; + + __ srlx(xn, 1, xn); // index for u32 to u64 ditto + __ srlx(yn, 1, yn); // index for u32 to u64 ditto + __ srlx(zn, 1, zn); // index for u32 to u64 ditto + __ dec(xn); // Adjust [0..(N/2)-1] + __ dec(yn); + __ dec(zn); + __ clr(rc); // u64 c = 0 + __ sllx(xn, 3, ri); // int i = xn (byte offset i = 8*xn) + __ sllx(yn, 3, rj); // int j = yn (byte offset i = 8*xn) + __ sllx(zn, 3, rk); // int k = zn (byte offset k = 8*zn) + __ ldx(yp, rj, ry); // u64 y = yp[yn] + + // for (int i = xn; i >= 0; i--) + __ bind(L_loop_i); + + __ cmp_and_br_short(ri, 0, // i >= 0 + Assembler::less, Assembler::pn, L_exit_loop_i); + __ ldx(xp, ri, rx); // x = xp[i] + __ mulx(rx, ry, lop); // lo-64b-part of result 64x64 + __ umulxhi(rx, ry, hip); // hi-64b-part of result 64x64 + __ addcc(rc, lop, lop); // Accumulate lower order bits (producing carry) + __ addxc(hip, zero, rc); // carry over to next datum [k-1] + __ stx(lop, zp, rk); // z[k] = lop + __ dec(rk, 8); // k-- + __ dec(ri, 8); // i-- + __ ba_short(L_loop_i); + + __ bind(L_exit_loop_i); + __ stx(rc, zp, rk); // z[k] = c + + // for (int j = yn - 1; j >= 0; j--) + __ sllx(yn, 3, rj); // int j = yn - 1 (byte offset j = 8*yn) + __ dec(rj, 8); + + __ bind(L_loop_j); + + __ cmp_and_br_short(rj, 0, // j >= 0 + Assembler::less, Assembler::pn, L_exit); + __ clr(rc); // u64 c = 0 + __ ldx(yp, rj, ry); // u64 y = yp[j] + + // for (int i = xn, k = --zn; i >= 0; i--) + __ dec(zn); // --zn + __ sllx(xn, 3, ri); // int i = xn (byte offset i = 8*xn) + __ sllx(zn, 3, rk); // int k = zn (byte offset k = 8*zn) + + __ bind(L_loop_i2); + + __ cmp_and_br_short(ri, 0, // i >= 0 + Assembler::less, Assembler::pn, L_exit_loop_i2); + __ ldx(xp, ri, rx); // x = xp[i] + __ ldx(zp, rk, rz); // z = zp[k], accumulator + __ mulx(rx, ry, lop); // lo-64b-part of result 64x64 + __ umulxhi(rx, ry, hip); // hi-64b-part of result 64x64 + __ addcc(rz, rc, rz); // Accumulate lower order bits, + __ addxc(hip, zero, rc); // Accumulate higher order bits to carry + __ addcc(rz, lop, rz); // z += lo(p) + c + __ addxc(rc, zero, rc); + __ stx(rz, zp, rk); // zp[k] = z + __ dec(rk, 8); // k-- + __ dec(ri, 8); // i-- + __ ba_short(L_loop_i2); + + __ bind(L_exit_loop_i2); + __ stx(rc, zp, rk); // z[k] = c + __ dec(rj, 8); // j-- + __ ba_short(L_loop_j); + } + + void gen_mult_64x64_unaligned(Register xp, Register xn, + Register yp, Register yn, + Register zp, Register zn, Label &L_exit) + { + // Assuming that a stack frame has already been created, i.e. local and + // output registers are available for use. + + const Register xpc = L0; // Outer loop cursor, xp[i] + const Register ypc = L1; // Inner loop cursor, yp[j] + const Register zpc = L2; // Output loop cursor, zp[k] + const Register rx = L4; // x-vector datum [i] + const Register ry = L5; // y-vector datum [j] + const Register rz = L6; // z-vector datum [k] + const Register rc = L7; // carry over (to z-vector datum [k-1]) + const Register rt = O2; + + const Register lop = O0; // lo-64b product + const Register hip = O1; // hi-64b product + + const Register zero = G0; + + Label L_loop_i, L_exit_loop_i; + Label L_loop_j; + Label L_loop_i2, L_exit_loop_i2; + + __ srlx(xn, 1, xn); // index for u32 to u64 ditto + __ srlx(yn, 1, yn); // index for u32 to u64 ditto + __ srlx(zn, 1, zn); // index for u32 to u64 ditto + __ dec(xn); // Adjust [0..(N/2)-1] + __ dec(yn); + __ dec(zn); + __ clr(rc); // u64 c = 0 + __ sllx(xn, 3, xpc); // u32* xpc = &xp[xn] (byte offset 8*xn) + __ add(xp, xpc, xpc); + __ sllx(yn, 3, ypc); // u32* ypc = &yp[yn] (byte offset 8*yn) + __ add(yp, ypc, ypc); + __ sllx(zn, 3, zpc); // u32* zpc = &zp[zn] (byte offset 8*zn) + __ add(zp, zpc, zpc); + __ lduw(ypc, 0, rt); // u64 y = yp[yn] + __ lduw(ypc, 4, ry); // ... + __ sllx(rt, 32, rt); + __ or3(rt, ry, ry); + + // for (int i = xn; i >= 0; i--) + __ bind(L_loop_i); + + __ cmp_and_br_short(xpc, xp,// i >= 0 + Assembler::less, Assembler::pn, L_exit_loop_i); + __ lduw(xpc, 0, rt); // u64 x = xp[i] + __ lduw(xpc, 4, rx); // ... + __ sllx(rt, 32, rt); + __ or3(rt, rx, rx); + __ mulx(rx, ry, lop); // lo-64b-part of result 64x64 + __ umulxhi(rx, ry, hip); // hi-64b-part of result 64x64 + __ addcc(rc, lop, lop); // Accumulate lower order bits (producing carry) + __ addxc(hip, zero, rc); // carry over to next datum [k-1] + __ srlx(lop, 32, rt); + __ stw(rt, zpc, 0); // z[k] = lop + __ stw(lop, zpc, 4); // ... + __ dec(zpc, 8); // k-- (zpc--) + __ dec(xpc, 8); // i-- (xpc--) + __ ba_short(L_loop_i); + + __ bind(L_exit_loop_i); + __ srlx(rc, 32, rt); + __ stw(rt, zpc, 0); // z[k] = c + __ stw(rc, zpc, 4); + + // for (int j = yn - 1; j >= 0; j--) + __ sllx(yn, 3, ypc); // u32* ypc = &yp[yn] (byte offset 8*yn) + __ add(yp, ypc, ypc); + __ dec(ypc, 8); // yn - 1 (ypc--) + + __ bind(L_loop_j); + + __ cmp_and_br_short(ypc, yp,// j >= 0 + Assembler::less, Assembler::pn, L_exit); + __ clr(rc); // u64 c = 0 + __ lduw(ypc, 0, rt); // u64 y = yp[j] (= *ypc) + __ lduw(ypc, 4, ry); // ... + __ sllx(rt, 32, rt); + __ or3(rt, ry, ry); + + // for (int i = xn, k = --zn; i >= 0; i--) + __ sllx(xn, 3, xpc); // u32* xpc = &xp[xn] (byte offset 8*xn) + __ add(xp, xpc, xpc); + __ dec(zn); // --zn + __ sllx(zn, 3, zpc); // u32* zpc = &zp[zn] (byte offset 8*zn) + __ add(zp, zpc, zpc); + + __ bind(L_loop_i2); + + __ cmp_and_br_short(xpc, xp,// i >= 0 + Assembler::less, Assembler::pn, L_exit_loop_i2); + __ lduw(xpc, 0, rt); // u64 x = xp[i] (= *xpc) + __ lduw(xpc, 4, rx); // ... + __ sllx(rt, 32, rt); + __ or3(rt, rx, rx); + + __ lduw(zpc, 0, rt); // u64 z = zp[k] (= *zpc) + __ lduw(zpc, 4, rz); // ... + __ sllx(rt, 32, rt); + __ or3(rt, rz, rz); + + __ mulx(rx, ry, lop); // lo-64b-part of result 64x64 + __ umulxhi(rx, ry, hip); // hi-64b-part of result 64x64 + __ addcc(rz, rc, rz); // Accumulate lower order bits... + __ addxc(hip, zero, rc); // Accumulate higher order bits to carry + __ addcc(rz, lop, rz); // ... z += lo(p) + c + __ addxccc(rc, zero, rc); + __ srlx(rz, 32, rt); + __ stw(rt, zpc, 0); // zp[k] = z (*zpc = z) + __ stw(rz, zpc, 4); + __ dec(zpc, 8); // k-- (zpc--) + __ dec(xpc, 8); // i-- (xpc--) + __ ba_short(L_loop_i2); + + __ bind(L_exit_loop_i2); + __ srlx(rc, 32, rt); + __ stw(rt, zpc, 0); // z[k] = c + __ stw(rc, zpc, 4); + __ dec(ypc, 8); // j-- (ypc--) + __ ba_short(L_loop_j); + } + + void gen_mult_32x32(Register xp, Register xn, + Register yp, Register yn, + Register zp, Register zn, Label &L_exit) + { + // Assuming that a stack frame has already been created, i.e. local and + // output registers are available for use. + + const Register ri = L0; // Outer loop index, xv[i] + const Register rj = L1; // Inner loop index, yv[j] + const Register rk = L2; // Output loop index, zv[k] + const Register rx = L4; // x-vector datum [i] + const Register ry = L5; // y-vector datum [j] + const Register rz = L6; // z-vector datum [k] + const Register rc = L7; // carry over (to z-vector datum [k-1]) + + const Register p64 = O0; // 64b product + const Register z65 = O1; // carry+64b accumulator + const Register c65 = O2; // carry at bit 65 + const Register c33 = O2; // carry at bit 33 (after shift) + + const Register zero = G0; + + Label L_loop_i, L_exit_loop_i; + Label L_loop_j; + Label L_loop_i2, L_exit_loop_i2; + + __ dec(xn); // Adjust [0..N-1] + __ dec(yn); + __ dec(zn); + __ clr(rc); // u32 c = 0 + __ sllx(xn, 2, ri); // int i = xn (byte offset i = 4*xn) + __ sllx(yn, 2, rj); // int j = yn (byte offset i = 4*xn) + __ sllx(zn, 2, rk); // int k = zn (byte offset k = 4*zn) + __ lduw(yp, rj, ry); // u32 y = yp[yn] + + // for (int i = xn; i >= 0; i--) + __ bind(L_loop_i); + + __ cmp_and_br_short(ri, 0, // i >= 0 + Assembler::less, Assembler::pn, L_exit_loop_i); + __ lduw(xp, ri, rx); // x = xp[i] + __ mulx(rx, ry, p64); // 64b result of 32x32 + __ addcc(rc, p64, z65); // Accumulate to 65 bits (producing carry) + __ addxc(zero, zero, c65); // Materialise carry (in bit 65) into lsb, + __ sllx(c65, 32, c33); // and shift into bit 33 + __ srlx(z65, 32, rc); // carry = c33 | hi(z65) >> 32 + __ add(c33, rc, rc); // carry over to next datum [k-1] + __ stw(z65, zp, rk); // z[k] = lo(z65) + __ dec(rk, 4); // k-- + __ dec(ri, 4); // i-- + __ ba_short(L_loop_i); + + __ bind(L_exit_loop_i); + __ stw(rc, zp, rk); // z[k] = c + + // for (int j = yn - 1; j >= 0; j--) + __ sllx(yn, 2, rj); // int j = yn - 1 (byte offset j = 4*yn) + __ dec(rj, 4); + + __ bind(L_loop_j); + + __ cmp_and_br_short(rj, 0, // j >= 0 + Assembler::less, Assembler::pn, L_exit); + __ clr(rc); // u32 c = 0 + __ lduw(yp, rj, ry); // u32 y = yp[j] + + // for (int i = xn, k = --zn; i >= 0; i--) + __ dec(zn); // --zn + __ sllx(xn, 2, ri); // int i = xn (byte offset i = 4*xn) + __ sllx(zn, 2, rk); // int k = zn (byte offset k = 4*zn) + + __ bind(L_loop_i2); + + __ cmp_and_br_short(ri, 0, // i >= 0 + Assembler::less, Assembler::pn, L_exit_loop_i2); + __ lduw(xp, ri, rx); // x = xp[i] + __ lduw(zp, rk, rz); // z = zp[k], accumulator + __ mulx(rx, ry, p64); // 64b result of 32x32 + __ add(rz, rc, rz); // Accumulate lower order bits, + __ addcc(rz, p64, z65); // z += lo(p64) + c + __ addxc(zero, zero, c65); // Materialise carry (in bit 65) into lsb, + __ sllx(c65, 32, c33); // and shift into bit 33 + __ srlx(z65, 32, rc); // carry = c33 | hi(z65) >> 32 + __ add(c33, rc, rc); // carry over to next datum [k-1] + __ stw(z65, zp, rk); // zp[k] = lo(z65) + __ dec(rk, 4); // k-- + __ dec(ri, 4); // i-- + __ ba_short(L_loop_i2); + + __ bind(L_exit_loop_i2); + __ stw(rc, zp, rk); // z[k] = c + __ dec(rj, 4); // j-- + __ ba_short(L_loop_j); + } + + void generate_initial() { // Generates all stubs and initializes the entry points @@ -5073,8 +5839,14 @@ class StubGenerator: public StubCodeGenerator { if (UseAdler32Intrinsics) { StubRoutines::_updateBytesAdler32 = generate_updateBytesAdler32(); } - } +#ifdef COMPILER2 + // Intrinsics supported by C2 only: + if (UseMultiplyToLenIntrinsic) { + StubRoutines::_multiplyToLen = generate_multiplyToLen(); + } +#endif // COMPILER2 + } public: StubGenerator(CodeBuffer* code, bool all) : StubCodeGenerator(code) { diff --git a/src/hotspot/cpu/sparc/stubRoutines_sparc.hpp b/src/hotspot/cpu/sparc/stubRoutines_sparc.hpp index eb6c909c0b3..d41c5b8e4ae 100644 --- a/src/hotspot/cpu/sparc/stubRoutines_sparc.hpp +++ b/src/hotspot/cpu/sparc/stubRoutines_sparc.hpp @@ -41,7 +41,7 @@ static bool returns_to_call_stub(address return_pc) { enum /* platform_dependent_constants */ { // %%%%%%%% May be able to shrink this a lot code_size1 = 20000, // simply increase if too small (assembler will crash if too small) - code_size2 = 27000 // simply increase if too small (assembler will crash if too small) + code_size2 = 29000 // simply increase if too small (assembler will crash if too small) }; class Sparc { diff --git a/src/hotspot/cpu/sparc/vm_version_sparc.cpp b/src/hotspot/cpu/sparc/vm_version_sparc.cpp index 37203221f71..6e1480f459e 100644 --- a/src/hotspot/cpu/sparc/vm_version_sparc.cpp +++ b/src/hotspot/cpu/sparc/vm_version_sparc.cpp @@ -168,6 +168,16 @@ void VM_Version::initialize() { FLAG_SET_DEFAULT(UseCBCond, false); } + // Use 'mpmul' instruction if available. + if (has_mpmul()) { + if (FLAG_IS_DEFAULT(UseMPMUL)) { + FLAG_SET_DEFAULT(UseMPMUL, true); + } + } else if (UseMPMUL) { + warning("MPMUL instruction is not available on this CPU"); + FLAG_SET_DEFAULT(UseMPMUL, false); + } + assert(BlockZeroingLowLimit > 0, "invalid value"); if (has_blk_zeroing() && cache_line_size > 0) { @@ -409,6 +419,15 @@ void VM_Version::initialize() { FLAG_SET_DEFAULT(UseCRC32Intrinsics, false); } + if (UseVIS > 2) { + if (FLAG_IS_DEFAULT(UseMultiplyToLenIntrinsic)) { + FLAG_SET_DEFAULT(UseMultiplyToLenIntrinsic, true); + } + } else if (UseMultiplyToLenIntrinsic) { + warning("SPARC multiplyToLen intrinsics require VIS3 instructions support. Intrinsics will be disabled"); + FLAG_SET_DEFAULT(UseMultiplyToLenIntrinsic, false); + } + if (UseVectorizedMismatchIntrinsic) { warning("UseVectorizedMismatchIntrinsic specified, but not available on this CPU."); FLAG_SET_DEFAULT(UseVectorizedMismatchIntrinsic, false); From d801fa5d9d5f37132b5cd5784aa5a538fde8854a Mon Sep 17 00:00:00 2001 From: Patric Hedlin Date: Fri, 29 Sep 2017 10:41:36 +0200 Subject: [PATCH 48/80] 8182279: Updating SPARC feature/capability detection to support Core C5 Renamed Core Sx to Core Cx (C3, C4, C5, according to name change). Reviewed-by: kvn, dholmes --- src/hotspot/cpu/sparc/vmStructs_sparc.hpp | 8 +++ src/hotspot/cpu/sparc/vm_version_sparc.cpp | 18 +++++- src/hotspot/cpu/sparc/vm_version_sparc.hpp | 61 ++++++++++++++++--- .../vm_version_solaris_sparc.cpp | 55 ++++++++++++++--- src/hotspot/share/jvmci/vmStructs_jvmci.cpp | 8 +++ .../SPARCHotSpotJVMCIBackendFactory.java | 24 ++++++++ .../hotspot/sparc/SPARCHotSpotVMConfig.java | 8 +++ .../src/jdk/vm/ci/sparc/SPARC.java | 8 +++ 8 files changed, 169 insertions(+), 21 deletions(-) diff --git a/src/hotspot/cpu/sparc/vmStructs_sparc.hpp b/src/hotspot/cpu/sparc/vmStructs_sparc.hpp index aa21dbdb2db..d678b4dbfd4 100644 --- a/src/hotspot/cpu/sparc/vmStructs_sparc.hpp +++ b/src/hotspot/cpu/sparc/vmStructs_sparc.hpp @@ -101,6 +101,14 @@ declare_constant(VM_Version::ISA_XMONT) \ declare_constant(VM_Version::ISA_PAUSE_NSEC) \ declare_constant(VM_Version::ISA_VAMASK) \ + declare_constant(VM_Version::ISA_SPARC6) \ + declare_constant(VM_Version::ISA_DICTUNP) \ + declare_constant(VM_Version::ISA_FPCMPSHL) \ + declare_constant(VM_Version::ISA_RLE) \ + declare_constant(VM_Version::ISA_SHA3) \ + declare_constant(VM_Version::ISA_VIS3C) \ + declare_constant(VM_Version::ISA_SPARC5B) \ + declare_constant(VM_Version::ISA_MME) \ declare_constant(VM_Version::CPU_FAST_IDIV) \ declare_constant(VM_Version::CPU_FAST_RDPC) \ declare_constant(VM_Version::CPU_FAST_BIS) \ diff --git a/src/hotspot/cpu/sparc/vm_version_sparc.cpp b/src/hotspot/cpu/sparc/vm_version_sparc.cpp index 6e1480f459e..b5ef619c35e 100644 --- a/src/hotspot/cpu/sparc/vm_version_sparc.cpp +++ b/src/hotspot/cpu/sparc/vm_version_sparc.cpp @@ -103,7 +103,7 @@ void VM_Version::initialize() { FLAG_SET_DEFAULT(AllocatePrefetchInstr, 1); } else if (has_sparc5()) { - // Use prefetch instruction to avoid partial RAW issue on Core S4 processors, + // Use prefetch instruction to avoid partial RAW issue on Core C4 processors, // also use prefetch style 3. FLAG_SET_DEFAULT(AllocatePrefetchInstr, 0); if (FLAG_IS_DEFAULT(AllocatePrefetchStyle)) { @@ -128,7 +128,7 @@ void VM_Version::initialize() { // We increase the number of prefetched cache lines, to use just a bit more // aggressive approach, when the L2-cache line size is small (32 bytes), or - // when running on newer processor implementations, such as the Core S4. + // when running on newer processor implementations, such as the Core C4. bool inc_prefetch = cache_line_size > 0 && (cache_line_size < 64 || has_sparc5()); if (inc_prefetch) { @@ -218,7 +218,9 @@ void VM_Version::initialize() { char buf[512]; jio_snprintf(buf, sizeof(buf), - "%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s", + "%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s" + "%s%s%s%s%s%s%s%s%s" "%s%s%s%s%s%s%s%s%s" + "%s%s%s%s%s%s%s", (has_v9() ? "v9" : ""), (has_popc() ? ", popc" : ""), (has_vis1() ? ", vis1" : ""), @@ -251,6 +253,16 @@ void VM_Version::initialize() { (has_pause_nsec() ? ", pause_nsec" : ""), (has_vamask() ? ", vamask" : ""), + (has_sparc6() ? ", sparc6" : ""), + (has_dictunp() ? ", dictunp" : ""), + (has_fpcmpshl() ? ", fpcmpshl" : ""), + (has_rle() ? ", rle" : ""), + (has_sha3() ? ", sha3" : ""), + (has_athena_plus2()? ", athena_plus2" : ""), + (has_vis3c() ? ", vis3c" : ""), + (has_sparc5b() ? ", sparc5b" : ""), + (has_mme() ? ", mme" : ""), + (has_fast_idiv() ? ", *idiv" : ""), (has_fast_rdpc() ? ", *rdpc" : ""), (has_fast_bis() ? ", *bis" : ""), diff --git a/src/hotspot/cpu/sparc/vm_version_sparc.hpp b/src/hotspot/cpu/sparc/vm_version_sparc.hpp index 58e8283d6ee..04ff200f439 100644 --- a/src/hotspot/cpu/sparc/vm_version_sparc.hpp +++ b/src/hotspot/cpu/sparc/vm_version_sparc.hpp @@ -67,6 +67,16 @@ protected: ISA_PAUSE_NSEC, ISA_VAMASK, + ISA_SPARC6, + ISA_DICTUNP, + ISA_FPCMPSHL, + ISA_RLE, + ISA_SHA3, + ISA_FJATHPLUS2, + ISA_VIS3C, + ISA_SPARC5B, + ISA_MME, + // Synthesised properties: CPU_FAST_IDIV, @@ -79,7 +89,7 @@ protected: }; private: - enum { ISA_last_feature = ISA_VAMASK, + enum { ISA_last_feature = ISA_MME, CPU_last_feature = CPU_BLK_ZEROING }; enum { @@ -119,6 +129,16 @@ private: ISA_pause_nsec_msk = UINT64_C(1) << ISA_PAUSE_NSEC, ISA_vamask_msk = UINT64_C(1) << ISA_VAMASK, + ISA_sparc6_msk = UINT64_C(1) << ISA_SPARC6, + ISA_dictunp_msk = UINT64_C(1) << ISA_DICTUNP, + ISA_fpcmpshl_msk = UINT64_C(1) << ISA_FPCMPSHL, + ISA_rle_msk = UINT64_C(1) << ISA_RLE, + ISA_sha3_msk = UINT64_C(1) << ISA_SHA3, + ISA_fjathplus2_msk = UINT64_C(1) << ISA_FJATHPLUS2, + ISA_vis3c_msk = UINT64_C(1) << ISA_VIS3C, + ISA_sparc5b_msk = UINT64_C(1) << ISA_SPARC5B, + ISA_mme_msk = UINT64_C(1) << ISA_MME, + CPU_fast_idiv_msk = UINT64_C(1) << CPU_FAST_IDIV, CPU_fast_rdpc_msk = UINT64_C(1) << CPU_FAST_RDPC, CPU_fast_bis_msk = UINT64_C(1) << CPU_FAST_BIS, @@ -153,40 +173,51 @@ private: * UltraSPARC T2+: (Victoria Falls, etc.) * SPARC-V9, VIS, VIS2, ASI_BIS, POPC (Crypto/hash in SPU) * - * UltraSPARC T3: (Rainbow Falls/S2) + * UltraSPARC T3: (Rainbow Falls/C2) * SPARC-V9, VIS, VIS2, ASI_BIS, POPC (Crypto/hash in SPU) * - * Oracle SPARC T4/T5/M5: (Core S3) + * Oracle SPARC T4/T5/M5: (Core C3) * SPARC-V9, VIS, VIS2, VIS3, ASI_BIS, HPC, POPC, FMAF, IMA, PAUSE, CBCOND, * AES, DES, Kasumi, Camellia, MD5, SHA1, SHA256, SHA512, CRC32C, MONT, MPMUL * - * Oracle SPARC M7: (Core S4) + * Oracle SPARC M7: (Core C4) * SPARC-V9, VIS, VIS2, VIS3, ASI_BIS, HPC, POPC, FMAF, IMA, PAUSE, CBCOND, * AES, DES, Camellia, MD5, SHA1, SHA256, SHA512, CRC32C, MONT, MPMUL, VIS3b, * ADI, SPARC5, MWAIT, XMPMUL, XMONT, PAUSE_NSEC, VAMASK * + * Oracle SPARC M8: (Core C5) + * SPARC-V9, VIS, VIS2, VIS3, ASI_BIS, HPC, POPC, FMAF, IMA, PAUSE, CBCOND, + * AES, DES, Camellia, MD5, SHA1, SHA256, SHA512, CRC32C, MONT, MPMUL, VIS3b, + * ADI, SPARC5, MWAIT, XMPMUL, XMONT, PAUSE_NSEC, VAMASK, SPARC6, FPCMPSHL, + * DICTUNP, RLE, SHA3, MME + * + * NOTE: Oracle Number support ignored. */ enum { niagara1_msk = ISA_v9_msk | ISA_vis1_msk | ISA_blk_init_msk, niagara2_msk = niagara1_msk | ISA_popc_msk, - core_S2_msk = niagara2_msk | ISA_vis2_msk, + core_C2_msk = niagara2_msk | ISA_vis2_msk, - core_S3_msk = core_S2_msk | ISA_fmaf_msk | ISA_vis3_msk | ISA_hpc_msk | + core_C3_msk = core_C2_msk | ISA_fmaf_msk | ISA_vis3_msk | ISA_hpc_msk | ISA_ima_msk | ISA_aes_msk | ISA_des_msk | ISA_kasumi_msk | ISA_camellia_msk | ISA_md5_msk | ISA_sha1_msk | ISA_sha256_msk | ISA_sha512_msk | ISA_mpmul_msk | ISA_mont_msk | ISA_pause_msk | ISA_cbcond_msk | ISA_crc32c_msk, - core_S4_msk = core_S3_msk - ISA_kasumi_msk | + core_C4_msk = core_C3_msk - ISA_kasumi_msk | ISA_vis3b_msk | ISA_adi_msk | ISA_sparc5_msk | ISA_mwait_msk | ISA_xmpmul_msk | ISA_xmont_msk | ISA_pause_nsec_msk | ISA_vamask_msk, + core_C5_msk = core_C4_msk | ISA_sparc6_msk | ISA_dictunp_msk | + ISA_fpcmpshl_msk | ISA_rle_msk | ISA_sha3_msk | ISA_mme_msk, + ultra_sparc_t1_msk = niagara1_msk, ultra_sparc_t2_msk = niagara2_msk, - ultra_sparc_t3_msk = core_S2_msk, - ultra_sparc_m5_msk = core_S3_msk, // NOTE: First out-of-order pipeline. - ultra_sparc_m7_msk = core_S4_msk + ultra_sparc_t3_msk = core_C2_msk, + ultra_sparc_m5_msk = core_C3_msk, // NOTE: First out-of-order pipeline. + ultra_sparc_m7_msk = core_C4_msk, + ultra_sparc_m8_msk = core_C5_msk }; static uint _L2_data_cache_line_size; @@ -247,6 +278,16 @@ public: static bool has_pause_nsec() { return (_features & ISA_pause_nsec_msk) != 0; } static bool has_vamask() { return (_features & ISA_vamask_msk) != 0; } + static bool has_sparc6() { return (_features & ISA_sparc6_msk) != 0; } + static bool has_dictunp() { return (_features & ISA_dictunp_msk) != 0; } + static bool has_fpcmpshl() { return (_features & ISA_fpcmpshl_msk) != 0; } + static bool has_rle() { return (_features & ISA_rle_msk) != 0; } + static bool has_sha3() { return (_features & ISA_sha3_msk) != 0; } + static bool has_athena_plus2() { return (_features & ISA_fjathplus2_msk) != 0; } + static bool has_vis3c() { return (_features & ISA_vis3c_msk) != 0; } + static bool has_sparc5b() { return (_features & ISA_sparc5b_msk) != 0; } + static bool has_mme() { return (_features & ISA_mme_msk) != 0; } + static bool has_fast_idiv() { return (_features & CPU_fast_idiv_msk) != 0; } static bool has_fast_rdpc() { return (_features & CPU_fast_rdpc_msk) != 0; } static bool has_fast_bis() { return (_features & CPU_fast_bis_msk) != 0; } diff --git a/src/hotspot/os_cpu/solaris_sparc/vm_version_solaris_sparc.cpp b/src/hotspot/os_cpu/solaris_sparc/vm_version_solaris_sparc.cpp index da767cbf642..7cbf60ee92a 100644 --- a/src/hotspot/os_cpu/solaris_sparc/vm_version_solaris_sparc.cpp +++ b/src/hotspot/os_cpu/solaris_sparc/vm_version_solaris_sparc.cpp @@ -380,7 +380,7 @@ void VM_Version::platform_features() { if (av & AV_SPARC_CRC32C) features |= ISA_crc32c_msk; #ifndef AV2_SPARC_FJATHPLUS -#define AV2_SPARC_FJATHPLUS 0x00000001 // Fujitsu Athena+ +#define AV2_SPARC_FJATHPLUS 0x00000001 // Fujitsu Athena+ insns #endif #ifndef AV2_SPARC_VIS3B #define AV2_SPARC_VIS3B 0x00000002 // VIS3 present on multiple chips @@ -405,6 +405,34 @@ void VM_Version::platform_features() { #endif #ifndef AV2_SPARC_VAMASK #define AV2_SPARC_VAMASK 0x00000100 // Virtual Address masking +#endif + +#ifndef AV2_SPARC_SPARC6 +#define AV2_SPARC_SPARC6 0x00000200 // REVB*, FPSLL*, RDENTROPY, LDM* and STM* +#endif +#ifndef AV2_SPARC_DICTUNP +#define AV2_SPARC_DICTUNP 0x00002000 // Dictionary unpack instruction +#endif +#ifndef AV2_SPARC_FPCMPSHL +#define AV2_SPARC_FPCMPSHL 0x00004000 // Partition compare with shifted result +#endif +#ifndef AV2_SPARC_RLE +#define AV2_SPARC_RLE 0x00008000 // Run-length encoded burst and length +#endif +#ifndef AV2_SPARC_SHA3 +#define AV2_SPARC_SHA3 0x00010000 // SHA3 instructions +#endif +#ifndef AV2_SPARC_FJATHPLUS2 +#define AV2_SPARC_FJATHPLUS2 0x00020000 // Fujitsu Athena++ insns +#endif +#ifndef AV2_SPARC_VIS3C +#define AV2_SPARC_VIS3C 0x00040000 // Subset of VIS3 insns provided by Athena++ +#endif +#ifndef AV2_SPARC_SPARC5B +#define AV2_SPARC_SPARC5B 0x00080000 // subset of SPARC5 insns (fpadd8, fpsub8) +#endif +#ifndef AV2_SPARC_MME +#define AV2_SPARC_MME 0x00100000 // Misaligned Mitigation Enable #endif if (avn > 1) { @@ -419,19 +447,30 @@ void VM_Version::platform_features() { if (av2 & AV2_SPARC_XMONT) features |= ISA_xmont_msk; if (av2 & AV2_SPARC_PAUSE_NSEC) features |= ISA_pause_nsec_msk; if (av2 & AV2_SPARC_VAMASK) features |= ISA_vamask_msk; + + if (av2 & AV2_SPARC_SPARC6) features |= ISA_sparc6_msk; + if (av2 & AV2_SPARC_DICTUNP) features |= ISA_dictunp_msk; + if (av2 & AV2_SPARC_FPCMPSHL) features |= ISA_fpcmpshl_msk; + if (av2 & AV2_SPARC_RLE) features |= ISA_rle_msk; + if (av2 & AV2_SPARC_SHA3) features |= ISA_sha3_msk; + if (av2 & AV2_SPARC_FJATHPLUS2) features |= ISA_fjathplus2_msk; + if (av2 & AV2_SPARC_VIS3C) features |= ISA_vis3c_msk; + if (av2 & AV2_SPARC_SPARC5B) features |= ISA_sparc5b_msk; + if (av2 & AV2_SPARC_MME) features |= ISA_mme_msk; } _features = features; // ISA feature set completed, update state. Sysinfo machine(SI_MACHINE); - bool is_sun4v = machine.match("sun4v"); // All Oracle SPARC + Fujitsu Athena+ + bool is_sun4v = machine.match("sun4v"); // All Oracle SPARC + Fujitsu Athena+/++ bool is_sun4u = machine.match("sun4u"); // All other Fujitsu - // Handle Athena+ conservatively (simply because we are lacking info.). + // Handle Athena+/++ conservatively (simply because we are lacking info.). - bool do_sun4v = is_sun4v && !has_athena_plus(); - bool do_sun4u = is_sun4u || has_athena_plus(); + bool an_athena = has_athena_plus() || has_athena_plus2(); + bool do_sun4v = is_sun4v && !an_athena; + bool do_sun4u = is_sun4u || an_athena; uint64_t synthetic = 0; @@ -441,16 +480,16 @@ void VM_Version::platform_features() { // Fast IDIV, BIS and LD available on Niagara Plus. if (has_vis2()) { synthetic |= (CPU_fast_idiv_msk | CPU_fast_ld_msk); - // ...on Core S4 however, we prefer not to use BIS. + // ...on Core C4 however, we prefer not to use BIS. if (!has_sparc5()) { synthetic |= CPU_fast_bis_msk; } } - // Niagara Core S3 supports fast RDPC and block zeroing. + // SPARC Core C3 supports fast RDPC and block zeroing. if (has_ima()) { synthetic |= (CPU_fast_rdpc_msk | CPU_blk_zeroing_msk); } - // Niagara Core S3 and S4 have slow CMOVE. + // SPARC Core C3 and C4 have slow CMOVE. if (!has_ima()) { synthetic |= CPU_fast_cmove_msk; } diff --git a/src/hotspot/share/jvmci/vmStructs_jvmci.cpp b/src/hotspot/share/jvmci/vmStructs_jvmci.cpp index a048fd22218..2d14d680529 100644 --- a/src/hotspot/share/jvmci/vmStructs_jvmci.cpp +++ b/src/hotspot/share/jvmci/vmStructs_jvmci.cpp @@ -761,6 +761,14 @@ declare_constant(VM_Version::ISA_XMONT) \ declare_constant(VM_Version::ISA_PAUSE_NSEC) \ declare_constant(VM_Version::ISA_VAMASK) \ + declare_constant(VM_Version::ISA_SPARC6) \ + declare_constant(VM_Version::ISA_DICTUNP) \ + declare_constant(VM_Version::ISA_FPCMPSHL) \ + declare_constant(VM_Version::ISA_RLE) \ + declare_constant(VM_Version::ISA_SHA3) \ + declare_constant(VM_Version::ISA_VIS3C) \ + declare_constant(VM_Version::ISA_SPARC5B) \ + declare_constant(VM_Version::ISA_MME) \ declare_constant(VM_Version::CPU_FAST_IDIV) \ declare_constant(VM_Version::CPU_FAST_RDPC) \ declare_constant(VM_Version::CPU_FAST_BIS) \ diff --git a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotJVMCIBackendFactory.java b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotJVMCIBackendFactory.java index 7006517548f..8331dc15903 100644 --- a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotJVMCIBackendFactory.java +++ b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotJVMCIBackendFactory.java @@ -79,9 +79,15 @@ public class SPARCHotSpotJVMCIBackendFactory implements HotSpotJVMCIBackendFacto if ((config.vmVersionFeatures & 1L << config.sparc_DES) != 0) { features.add(CPUFeature.DES); } + if ((config.vmVersionFeatures & 1L << config.sparc_DICTUNP) != 0) { + features.add(CPUFeature.DICTUNP); + } if ((config.vmVersionFeatures & 1L << config.sparc_FMAF) != 0) { features.add(CPUFeature.FMAF); } + if ((config.vmVersionFeatures & 1L << config.sparc_FPCMPSHL) != 0) { + features.add(CPUFeature.FPCMPSHL); + } if ((config.vmVersionFeatures & 1L << config.sparc_HPC) != 0) { features.add(CPUFeature.HPC); } @@ -94,6 +100,9 @@ public class SPARCHotSpotJVMCIBackendFactory implements HotSpotJVMCIBackendFacto if ((config.vmVersionFeatures & 1L << config.sparc_MD5) != 0) { features.add(CPUFeature.MD5); } + if ((config.vmVersionFeatures & 1L << config.sparc_MME) != 0) { + features.add(CPUFeature.MME); + } if ((config.vmVersionFeatures & 1L << config.sparc_MONT) != 0) { features.add(CPUFeature.MONT); } @@ -112,18 +121,30 @@ public class SPARCHotSpotJVMCIBackendFactory implements HotSpotJVMCIBackendFacto if ((config.vmVersionFeatures & 1L << config.sparc_POPC) != 0) { features.add(CPUFeature.POPC); } + if ((config.vmVersionFeatures & 1L << config.sparc_RLE) != 0) { + features.add(CPUFeature.RLE); + } if ((config.vmVersionFeatures & 1L << config.sparc_SHA1) != 0) { features.add(CPUFeature.SHA1); } if ((config.vmVersionFeatures & 1L << config.sparc_SHA256) != 0) { features.add(CPUFeature.SHA256); } + if ((config.vmVersionFeatures & 1L << config.sparc_SHA3) != 0) { + features.add(CPUFeature.SHA3); + } if ((config.vmVersionFeatures & 1L << config.sparc_SHA512) != 0) { features.add(CPUFeature.SHA512); } if ((config.vmVersionFeatures & 1L << config.sparc_SPARC5) != 0) { features.add(CPUFeature.SPARC5); } + if ((config.vmVersionFeatures & 1L << config.sparc_SPARC5B) != 0) { + features.add(CPUFeature.SPARC5B); + } + if ((config.vmVersionFeatures & 1L << config.sparc_SPARC6) != 0) { + features.add(CPUFeature.SPARC6); + } if ((config.vmVersionFeatures & 1L << config.sparc_V9) != 0) { features.add(CPUFeature.V9); } @@ -142,6 +163,9 @@ public class SPARCHotSpotJVMCIBackendFactory implements HotSpotJVMCIBackendFacto if ((config.vmVersionFeatures & 1L << config.sparc_VIS3B) != 0) { features.add(CPUFeature.VIS3B); } + if ((config.vmVersionFeatures & 1L << config.sparc_VIS3C) != 0) { + features.add(CPUFeature.VIS3C); + } if ((config.vmVersionFeatures & 1L << config.sparc_XMONT) != 0) { features.add(CPUFeature.XMONT); } diff --git a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotVMConfig.java b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotVMConfig.java index a5ae1d85eef..e1b441cadb8 100644 --- a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotVMConfig.java +++ b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.hotspot.sparc/src/jdk/vm/ci/hotspot/sparc/SPARCHotSpotVMConfig.java @@ -55,27 +55,35 @@ class SPARCHotSpotVMConfig extends HotSpotVMConfigAccess { final int sparc_CBCOND = getConstant("VM_Version::ISA_CBCOND", Integer.class); final int sparc_CRC32C = getConstant("VM_Version::ISA_CRC32C", Integer.class); final int sparc_DES = getConstant("VM_Version::ISA_DES", Integer.class); + final int sparc_DICTUNP = getConstant("VM_Version::ISA_DICTUNP", Integer.class); final int sparc_FMAF = getConstant("VM_Version::ISA_FMAF", Integer.class); + final int sparc_FPCMPSHL = getConstant("VM_Version::ISA_FPCMPSHL", Integer.class); final int sparc_HPC = getConstant("VM_Version::ISA_HPC", Integer.class); final int sparc_IMA = getConstant("VM_Version::ISA_IMA", Integer.class); final int sparc_KASUMI = getConstant("VM_Version::ISA_KASUMI", Integer.class); final int sparc_MD5 = getConstant("VM_Version::ISA_MD5", Integer.class); + final int sparc_MME = getConstant("VM_Version::ISA_MME", Integer.class); final int sparc_MONT = getConstant("VM_Version::ISA_MONT", Integer.class); final int sparc_MPMUL = getConstant("VM_Version::ISA_MPMUL", Integer.class); final int sparc_MWAIT = getConstant("VM_Version::ISA_MWAIT", Integer.class); final int sparc_PAUSE = getConstant("VM_Version::ISA_PAUSE", Integer.class); final int sparc_PAUSE_NSEC = getConstant("VM_Version::ISA_PAUSE_NSEC", Integer.class); final int sparc_POPC = getConstant("VM_Version::ISA_POPC", Integer.class); + final int sparc_RLE = getConstant("VM_Version::ISA_RLE", Integer.class); final int sparc_SHA1 = getConstant("VM_Version::ISA_SHA1", Integer.class); final int sparc_SHA256 = getConstant("VM_Version::ISA_SHA256", Integer.class); + final int sparc_SHA3 = getConstant("VM_Version::ISA_SHA3", Integer.class); final int sparc_SHA512 = getConstant("VM_Version::ISA_SHA512", Integer.class); final int sparc_SPARC5 = getConstant("VM_Version::ISA_SPARC5", Integer.class); + final int sparc_SPARC5B = getConstant("VM_Version::ISA_SPARC5B", Integer.class); + final int sparc_SPARC6 = getConstant("VM_Version::ISA_SPARC6", Integer.class); final int sparc_V9 = getConstant("VM_Version::ISA_V9", Integer.class); final int sparc_VAMASK = getConstant("VM_Version::ISA_VAMASK", Integer.class); final int sparc_VIS1 = getConstant("VM_Version::ISA_VIS1", Integer.class); final int sparc_VIS2 = getConstant("VM_Version::ISA_VIS2", Integer.class); final int sparc_VIS3 = getConstant("VM_Version::ISA_VIS3", Integer.class); final int sparc_VIS3B = getConstant("VM_Version::ISA_VIS3B", Integer.class); + final int sparc_VIS3C = getConstant("VM_Version::ISA_VIS3C", Integer.class); final int sparc_XMONT = getConstant("VM_Version::ISA_XMONT", Integer.class); final int sparc_XMPMUL = getConstant("VM_Version::ISA_XMPMUL", Integer.class); diff --git a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.sparc/src/jdk/vm/ci/sparc/SPARC.java b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.sparc/src/jdk/vm/ci/sparc/SPARC.java index ee40d426346..29dd0fb4d36 100644 --- a/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.sparc/src/jdk/vm/ci/sparc/SPARC.java +++ b/src/jdk.internal.vm.ci/share/classes/jdk.vm.ci.sparc/src/jdk/vm/ci/sparc/SPARC.java @@ -344,27 +344,35 @@ public class SPARC extends Architecture { CBCOND, CRC32C, DES, + DICTUNP, FMAF, + FPCMPSHL, HPC, IMA, KASUMI, MD5, + MME, MONT, MPMUL, MWAIT, PAUSE, PAUSE_NSEC, POPC, + RLE, SHA1, SHA256, + SHA3, SHA512, SPARC5, + SPARC5B, + SPARC6, V9, VAMASK, VIS1, VIS2, VIS3, VIS3B, + VIS3C, XMONT, XMPMUL, // Synthesised CPU properties: From e31bc5637a298f1dafa5bbb33ca7b8a4927287b6 Mon Sep 17 00:00:00 2001 From: Patric Hedlin Date: Fri, 29 Sep 2017 10:44:58 +0200 Subject: [PATCH 49/80] 8188031: Complement fused mac operations on SPARC Adding a few (FMAf) matcher patterns to the SPARC back-end Reviewed-by: rbackman, kvn --- src/hotspot/cpu/sparc/assembler_sparc.hpp | 6 +- .../cpu/sparc/assembler_sparc.inline.hpp | 13 ++ src/hotspot/cpu/sparc/sparc.ad | 128 +++++++++++++++++- 3 files changed, 143 insertions(+), 4 deletions(-) diff --git a/src/hotspot/cpu/sparc/assembler_sparc.hpp b/src/hotspot/cpu/sparc/assembler_sparc.hpp index c3f1ddddbfe..f8f5b11c9a6 100644 --- a/src/hotspot/cpu/sparc/assembler_sparc.hpp +++ b/src/hotspot/cpu/sparc/assembler_sparc.hpp @@ -645,7 +645,7 @@ class Assembler : public AbstractAssembler { static void fmaf_only() { assert(VM_Version::has_fmaf(), "This instruction only works on SPARC with FMAf"); } // MPMUL instruction supported only on certain processors - static void mpmul_only() { assert( VM_Version::has_mpmul(), "This instruction only works on SPARC with MPMUL"); } + static void mpmul_only() { assert(VM_Version::has_mpmul(), "This instruction only works on SPARC with MPMUL"); } // instruction only in VIS1 static void vis1_only() { assert(VM_Version::has_vis1(), "This instruction only works on SPARC with VIS1"); } @@ -946,6 +946,10 @@ class Assembler : public AbstractAssembler { // fmaf instructions. inline void fmadd(FloatRegisterImpl::Width w, FloatRegister s1, FloatRegister s2, FloatRegister s3, FloatRegister d); + inline void fmsub(FloatRegisterImpl::Width w, FloatRegister s1, FloatRegister s2, FloatRegister s3, FloatRegister d); + + inline void fnmadd(FloatRegisterImpl::Width w, FloatRegister s1, FloatRegister s2, FloatRegister s3, FloatRegister d); + inline void fnmsub(FloatRegisterImpl::Width w, FloatRegister s1, FloatRegister s2, FloatRegister s3, FloatRegister d); // pp 165 diff --git a/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp b/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp index 7a87f0c3387..b9a918e5e0b 100644 --- a/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp +++ b/src/hotspot/cpu/sparc/assembler_sparc.inline.hpp @@ -359,6 +359,19 @@ inline void Assembler::fmadd(FloatRegisterImpl::Width w, FloatRegister s1, Float fmaf_only(); emit_int32(op(arith_op) | fd(d, w) | op3(stpartialf_op3) | fs1(s1, w) | fs3(s3, w) | op5(w) | fs2(s2, w)); } +inline void Assembler::fmsub(FloatRegisterImpl::Width w, FloatRegister s1, FloatRegister s2, FloatRegister s3, FloatRegister d) { + fmaf_only(); + emit_int32(op(arith_op) | fd(d, w) | op3(stpartialf_op3) | fs1(s1, w) | fs3(s3, w) | op5(0x4 + w) | fs2(s2, w)); +} + +inline void Assembler::fnmadd(FloatRegisterImpl::Width w, FloatRegister s1, FloatRegister s2, FloatRegister s3, FloatRegister d) { + fmaf_only(); + emit_int32(op(arith_op) | fd(d, w) | op3(stpartialf_op3) | fs1(s1, w) | fs3(s3, w) | op5(0xc + w) | fs2(s2, w)); +} +inline void Assembler::fnmsub(FloatRegisterImpl::Width w, FloatRegister s1, FloatRegister s2, FloatRegister s3, FloatRegister d) { + fmaf_only(); + emit_int32(op(arith_op) | fd(d, w) | op3(stpartialf_op3) | fs1(s1, w) | fs3(s3, w) | op5(0x8 + w) | fs2(s2, w)); +} inline void Assembler::flush(Register s1, Register s2) { emit_int32(op(arith_op) | op3(flush_op3) | rs1(s1) | rs2(s2)); diff --git a/src/hotspot/cpu/sparc/sparc.ad b/src/hotspot/cpu/sparc/sparc.ad index 07f62bac5aa..c582cd5a6a8 100644 --- a/src/hotspot/cpu/sparc/sparc.ad +++ b/src/hotspot/cpu/sparc/sparc.ad @@ -2628,7 +2628,6 @@ enc_class fsqrtd (dflt_reg dst, dflt_reg src) %{ %} - enc_class fmadds (sflt_reg dst, sflt_reg a, sflt_reg b, sflt_reg c) %{ MacroAssembler _masm(&cbuf); @@ -2651,7 +2650,71 @@ enc_class fmaddd (dflt_reg dst, dflt_reg a, dflt_reg b, dflt_reg c) %{ __ fmadd(FloatRegisterImpl::D, Fra, Frb, Frc, Frd); %} +enc_class fmsubs (sflt_reg dst, sflt_reg a, sflt_reg b, sflt_reg c) %{ + MacroAssembler _masm(&cbuf); + FloatRegister Frd = reg_to_SingleFloatRegister_object($dst$$reg); + FloatRegister Fra = reg_to_SingleFloatRegister_object($a$$reg); + FloatRegister Frb = reg_to_SingleFloatRegister_object($b$$reg); + FloatRegister Frc = reg_to_SingleFloatRegister_object($c$$reg); + + __ fmsub(FloatRegisterImpl::S, Fra, Frb, Frc, Frd); +%} + +enc_class fmsubd (dflt_reg dst, dflt_reg a, dflt_reg b, dflt_reg c) %{ + MacroAssembler _masm(&cbuf); + + FloatRegister Frd = reg_to_DoubleFloatRegister_object($dst$$reg); + FloatRegister Fra = reg_to_DoubleFloatRegister_object($a$$reg); + FloatRegister Frb = reg_to_DoubleFloatRegister_object($b$$reg); + FloatRegister Frc = reg_to_DoubleFloatRegister_object($c$$reg); + + __ fmsub(FloatRegisterImpl::D, Fra, Frb, Frc, Frd); +%} + +enc_class fnmadds (sflt_reg dst, sflt_reg a, sflt_reg b, sflt_reg c) %{ + MacroAssembler _masm(&cbuf); + + FloatRegister Frd = reg_to_SingleFloatRegister_object($dst$$reg); + FloatRegister Fra = reg_to_SingleFloatRegister_object($a$$reg); + FloatRegister Frb = reg_to_SingleFloatRegister_object($b$$reg); + FloatRegister Frc = reg_to_SingleFloatRegister_object($c$$reg); + + __ fnmadd(FloatRegisterImpl::S, Fra, Frb, Frc, Frd); +%} + +enc_class fnmaddd (dflt_reg dst, dflt_reg a, dflt_reg b, dflt_reg c) %{ + MacroAssembler _masm(&cbuf); + + FloatRegister Frd = reg_to_DoubleFloatRegister_object($dst$$reg); + FloatRegister Fra = reg_to_DoubleFloatRegister_object($a$$reg); + FloatRegister Frb = reg_to_DoubleFloatRegister_object($b$$reg); + FloatRegister Frc = reg_to_DoubleFloatRegister_object($c$$reg); + + __ fnmadd(FloatRegisterImpl::D, Fra, Frb, Frc, Frd); +%} + +enc_class fnmsubs (sflt_reg dst, sflt_reg a, sflt_reg b, sflt_reg c) %{ + MacroAssembler _masm(&cbuf); + + FloatRegister Frd = reg_to_SingleFloatRegister_object($dst$$reg); + FloatRegister Fra = reg_to_SingleFloatRegister_object($a$$reg); + FloatRegister Frb = reg_to_SingleFloatRegister_object($b$$reg); + FloatRegister Frc = reg_to_SingleFloatRegister_object($c$$reg); + + __ fnmsub(FloatRegisterImpl::S, Fra, Frb, Frc, Frd); +%} + +enc_class fnmsubd (dflt_reg dst, dflt_reg a, dflt_reg b, dflt_reg c) %{ + MacroAssembler _masm(&cbuf); + + FloatRegister Frd = reg_to_DoubleFloatRegister_object($dst$$reg); + FloatRegister Fra = reg_to_DoubleFloatRegister_object($a$$reg); + FloatRegister Frb = reg_to_DoubleFloatRegister_object($b$$reg); + FloatRegister Frc = reg_to_DoubleFloatRegister_object($c$$reg); + + __ fnmsub(FloatRegisterImpl::D, Fra, Frb, Frc, Frd); +%} enc_class fmovs (dflt_reg dst, dflt_reg src) %{ @@ -7597,7 +7660,7 @@ instruct sqrtD_reg_reg(regD dst, regD src) %{ ins_pipe(fdivD_reg_reg); %} -// Single precision fused floating-point multiply-add (d = a * b + c). +// Single/Double precision fused floating-point multiply-add (d = a * b + c). instruct fmaF_regx4(regF dst, regF a, regF b, regF c) %{ predicate(UseFMA); match(Set dst (FmaF c (Binary a b))); @@ -7606,7 +7669,6 @@ instruct fmaF_regx4(regF dst, regF a, regF b, regF c) %{ ins_pipe(fmaF_regx4); %} -// Double precision fused floating-point multiply-add (d = a * b + c). instruct fmaD_regx4(regD dst, regD a, regD b, regD c) %{ predicate(UseFMA); match(Set dst (FmaD c (Binary a b))); @@ -7615,6 +7677,66 @@ instruct fmaD_regx4(regD dst, regD a, regD b, regD c) %{ ins_pipe(fmaD_regx4); %} +// Additional patterns matching complement versions that we can map directly to +// variants of the fused multiply-add instructions. + +// Single/Double precision fused floating-point multiply-sub (d = a * b - c) +instruct fmsubF_regx4(regF dst, regF a, regF b, regF c) %{ + predicate(UseFMA); + match(Set dst (FmaF (NegF c) (Binary a b))); + format %{ "fmsubs $a,$b,$c,$dst\t# $dst = $a * $b - $c" %} + ins_encode(fmsubs(dst, a, b, c)); + ins_pipe(fmaF_regx4); +%} + +instruct fmsubD_regx4(regD dst, regD a, regD b, regD c) %{ + predicate(UseFMA); + match(Set dst (FmaD (NegD c) (Binary a b))); + format %{ "fmsubd $a,$b,$c,$dst\t# $dst = $a * $b - $c" %} + ins_encode(fmsubd(dst, a, b, c)); + ins_pipe(fmaD_regx4); +%} + +// Single/Double precision fused floating-point neg. multiply-add, +// d = -1 * a * b - c = -(a * b + c) +instruct fnmaddF_regx4(regF dst, regF a, regF b, regF c) %{ + predicate(UseFMA); + match(Set dst (FmaF (NegF c) (Binary (NegF a) b))); + match(Set dst (FmaF (NegF c) (Binary a (NegF b)))); + format %{ "fnmadds $a,$b,$c,$dst\t# $dst = -($a * $b + $c)" %} + ins_encode(fnmadds(dst, a, b, c)); + ins_pipe(fmaF_regx4); +%} + +instruct fnmaddD_regx4(regD dst, regD a, regD b, regD c) %{ + predicate(UseFMA); + match(Set dst (FmaD (NegD c) (Binary (NegD a) b))); + match(Set dst (FmaD (NegD c) (Binary a (NegD b)))); + format %{ "fnmaddd $a,$b,$c,$dst\t# $dst = -($a * $b + $c)" %} + ins_encode(fnmaddd(dst, a, b, c)); + ins_pipe(fmaD_regx4); +%} + +// Single/Double precision fused floating-point neg. multiply-sub, +// d = -1 * a * b + c = -(a * b - c) +instruct fnmsubF_regx4(regF dst, regF a, regF b, regF c) %{ + predicate(UseFMA); + match(Set dst (FmaF c (Binary (NegF a) b))); + match(Set dst (FmaF c (Binary a (NegF b)))); + format %{ "fnmsubs $a,$b,$c,$dst\t# $dst = -($a * $b - $c)" %} + ins_encode(fnmsubs(dst, a, b, c)); + ins_pipe(fmaF_regx4); +%} + +instruct fnmsubD_regx4(regD dst, regD a, regD b, regD c) %{ + predicate(UseFMA); + match(Set dst (FmaD c (Binary (NegD a) b))); + match(Set dst (FmaD c (Binary a (NegD b)))); + format %{ "fnmsubd $a,$b,$c,$dst\t# $dst = -($a * $b - $c)" %} + ins_encode(fnmsubd(dst, a, b, c)); + ins_pipe(fmaD_regx4); +%} + //----------Logical Instructions----------------------------------------------- // And Instructions // Register And From 858db7244e9f92d35ce9e2128ca1cf59c3e27af7 Mon Sep 17 00:00:00 2001 From: Yasumasa Suenaga Date: Fri, 29 Sep 2017 21:00:18 +0900 Subject: [PATCH 50/80] 8187402: UnknownOopException is occurred on Stack Memory window in HSDB Reviewed-by: sspitsyn, jgeorge --- src/hotspot/share/runtime/vmStructs.cpp | 8 ++++++-- .../share/classes/sun/jvm/hotspot/code/VMRegImpl.java | 8 +++++++- .../share/classes/sun/jvm/hotspot/runtime/Frame.java | 4 ++-- .../share/classes/sun/jvm/hotspot/runtime/VMReg.java | 6 +++++- 4 files changed, 20 insertions(+), 6 deletions(-) diff --git a/src/hotspot/share/runtime/vmStructs.cpp b/src/hotspot/share/runtime/vmStructs.cpp index d9dd0d15b50..93e9abf209b 100644 --- a/src/hotspot/share/runtime/vmStructs.cpp +++ b/src/hotspot/share/runtime/vmStructs.cpp @@ -2726,8 +2726,12 @@ typedef RehashableHashtable RehashableSymbolHashtable; /* JVMCI */ \ /****************/ \ \ - declare_preprocessor_constant("INCLUDE_JVMCI", INCLUDE_JVMCI) - + declare_preprocessor_constant("INCLUDE_JVMCI", INCLUDE_JVMCI) \ + \ + /****************/ \ + /* VMRegImpl */ \ + /****************/ \ + declare_constant(VMRegImpl::stack_slot_size) //-------------------------------------------------------------------------------- // VM_LONG_CONSTANTS diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/VMRegImpl.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/VMRegImpl.java index 8159437621a..19ae300108e 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/VMRegImpl.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/code/VMRegImpl.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2006, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2006, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -37,6 +37,7 @@ public class VMRegImpl { private static int stack0Val; private static Address stack0Addr; private static AddressField regNameField; + private static int stackSlotSize; static { VM.registerVMInitializedObserver(new Observer() { @@ -53,6 +54,7 @@ public class VMRegImpl { stack0Val = (int) stack0Addr.hashCode(); stack0 = new VMReg(stack0Val); regNameField = type.getAddressField("regName[0]"); + stackSlotSize = db.lookupIntConstant("VMRegImpl::stack_slot_size"); } public static VMReg getStack0() { @@ -67,4 +69,8 @@ public class VMRegImpl { long addrSize = VM.getVM().getAddressSize(); return CStringUtilities.getString(regName.getAddressAt(index * addrSize)); } + + public static int getStackSlotSize() { + return stackSlotSize; + } } diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/Frame.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/Frame.java index ab536d20f5d..d9de87767fd 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/Frame.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/Frame.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2000, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -430,7 +430,7 @@ public abstract class Frame implements Cloneable { // If it is passed in a register, it got spilled in the stub frame. return regMap.getLocation(reg); } else { - long spOffset = VM.getVM().getAddressSize() * reg.minus(stack0); + long spOffset = reg.reg2Stack() * VM.getVM().getVMRegImplInfo().getStackSlotSize(); return getUnextendedSP().addOffsetTo(spOffset); } } diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/VMReg.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/VMReg.java index 15c049f8425..f3bdca35f23 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/VMReg.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/VMReg.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2000, 2003, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -84,4 +84,8 @@ public class VMReg { public boolean greaterThanOrEqual(VMReg arg) { return value >= arg.value; } public int minus(VMReg arg) { return value - arg.value; } + + public int reg2Stack() { + return value - VM.getVM().getVMRegImplInfo().getStack0().getValue(); + } } From 6213838f11cfa6640bb987ea3b0d8009c5f5796c Mon Sep 17 00:00:00 2001 From: Calvin Cheung Date: Fri, 29 Sep 2017 10:11:01 -0700 Subject: [PATCH 51/80] 8138600: eliminate the need of ModuleLoaderMap.dat for CDS Removed the code which generates the ModuleLoaderMap.dat and the code which references it Reviewed-by: mchung, jiangli --- make/gensrc/GensrcModuleLoaderMap.gmk | 11 -- .../tools/module/GenModuleLoaderMap.java | 18 +-- src/hotspot/share/classfile/classLoader.cpp | 108 ------------------ src/hotspot/share/classfile/classLoader.hpp | 11 -- .../vm/cds/resources/ModuleLoaderMap.dat | 4 - 5 files changed, 5 insertions(+), 147 deletions(-) delete mode 100644 src/java.base/share/classes/jdk/internal/vm/cds/resources/ModuleLoaderMap.dat diff --git a/make/gensrc/GensrcModuleLoaderMap.gmk b/make/gensrc/GensrcModuleLoaderMap.gmk index 5d4adeeccba..86d4446496a 100644 --- a/make/gensrc/GensrcModuleLoaderMap.gmk +++ b/make/gensrc/GensrcModuleLoaderMap.gmk @@ -54,15 +54,4 @@ $(SUPPORT_OUTPUTDIR)/gensrc/java.base/jdk/internal/module/ModuleLoaderMap.java: GENSRC_JAVA_BASE += $(SUPPORT_OUTPUTDIR)/gensrc/java.base/jdk/internal/module/ModuleLoaderMap.java -$(SUPPORT_OUTPUTDIR)/gensrc/java.base/jdk/internal/vm/cds/resources/ModuleLoaderMap.dat: \ - $(TOPDIR)/src/java.base/share/classes/jdk/internal/vm/cds/resources/ModuleLoaderMap.dat \ - $(VARDEPS_FILE) $(BUILD_TOOLS_JDK) - $(MKDIR) -p $(@D) - $(RM) $@ $@.tmp - $(TOOL_GENCLASSLOADERMAP) -boot $(BOOT_MODULES_LIST) \ - -platform $(PLATFORM_MODULES_LIST) -o $@.tmp $< - $(MV) $@.tmp $@ - -GENSRC_JAVA_BASE += $(SUPPORT_OUTPUTDIR)/gensrc/java.base/jdk/internal/vm/cds/resources/ModuleLoaderMap.dat - ################################################################################ diff --git a/make/jdk/src/classes/build/tools/module/GenModuleLoaderMap.java b/make/jdk/src/classes/build/tools/module/GenModuleLoaderMap.java index 6719277fac1..c6c90e0fb59 100644 --- a/make/jdk/src/classes/build/tools/module/GenModuleLoaderMap.java +++ b/make/jdk/src/classes/build/tools/module/GenModuleLoaderMap.java @@ -77,30 +77,22 @@ public class GenModuleLoaderMap { throw new IllegalArgumentException(source + " not exist"); } - boolean needsQuotes = outfile.toString().contains(".java.tmp"); - try (BufferedWriter bw = Files.newBufferedWriter(outfile, StandardCharsets.UTF_8); PrintWriter writer = new PrintWriter(bw)) { for (String line : Files.readAllLines(source)) { if (line.contains("@@BOOT_MODULE_NAMES@@")) { - line = patch(line, "@@BOOT_MODULE_NAMES@@", bootModules, needsQuotes); + line = patch(line, "@@BOOT_MODULE_NAMES@@", bootModules); } else if (line.contains("@@PLATFORM_MODULE_NAMES@@")) { - line = patch(line, "@@PLATFORM_MODULE_NAMES@@", platformModules, needsQuotes); + line = patch(line, "@@PLATFORM_MODULE_NAMES@@", platformModules); } writer.println(line); } } } - private static String patch(String s, String tag, Stream stream, boolean needsQuotes) { - String mns = null; - if (needsQuotes) { - mns = stream.sorted() - .collect(Collectors.joining("\",\n \"")); - } else { - mns = stream.sorted() - .collect(Collectors.joining("\n")); - } + private static String patch(String s, String tag, Stream stream) { + String mns = stream.sorted() + .collect(Collectors.joining("\",\n \"")); return s.replace(tag, mns); } diff --git a/src/hotspot/share/classfile/classLoader.cpp b/src/hotspot/share/classfile/classLoader.cpp index 8592616311f..d0873c3e010 100644 --- a/src/hotspot/share/classfile/classLoader.cpp +++ b/src/hotspot/share/classfile/classLoader.cpp @@ -802,7 +802,6 @@ void ClassLoader::setup_search_path(const char *class_path, bool bootstrap_searc if (DumpSharedSpaces) { JImageFile *jimage = _jrt_entry->jimage(); assert(jimage != NULL, "No java runtime image file present"); - ClassLoader::initialize_module_loader_map(jimage); } #endif } @@ -1144,61 +1143,6 @@ int ClassLoader::crc32(int crc, const char* buf, int len) { return (*Crc32)(crc, (const jbyte*)buf, len); } -#if INCLUDE_CDS -void ClassLoader::initialize_module_loader_map(JImageFile* jimage) { - if (!DumpSharedSpaces) { - return; // only needed for CDS dump time - } - - ResourceMark rm; - jlong size; - JImageLocationRef location = (*JImageFindResource)(jimage, JAVA_BASE_NAME, get_jimage_version_string(), MODULE_LOADER_MAP, &size); - if (location == 0) { - vm_exit_during_initialization( - "Cannot find ModuleLoaderMap location from modules jimage.", NULL); - } - char* buffer = NEW_RESOURCE_ARRAY(char, size + 1); - buffer[size] = '\0'; - jlong read = (*JImageGetResource)(jimage, location, buffer, size); - if (read != size) { - vm_exit_during_initialization( - "Cannot find ModuleLoaderMap resource from modules jimage.", NULL); - } - char* char_buf = (char*)buffer; - int buflen = (int)strlen(char_buf); - char* begin_ptr = char_buf; - char* end_ptr = strchr(begin_ptr, '\n'); - bool process_boot_modules = false; - _boot_modules_array = new (ResourceObj::C_HEAP, mtModule) - GrowableArray(INITIAL_BOOT_MODULES_ARRAY_SIZE, true); - _platform_modules_array = new (ResourceObj::C_HEAP, mtModule) - GrowableArray(INITIAL_PLATFORM_MODULES_ARRAY_SIZE, true); - while (end_ptr != NULL && (end_ptr - char_buf) < buflen) { - // Allocate a buffer from the C heap to be appended to the _boot_modules_array - // or the _platform_modules_array. - char* temp_name = NEW_C_HEAP_ARRAY(char, (size_t)(end_ptr - begin_ptr + 1), mtInternal); - strncpy(temp_name, begin_ptr, end_ptr - begin_ptr); - temp_name[end_ptr - begin_ptr] = '\0'; - if (strncmp(temp_name, "BOOT", 4) == 0) { - process_boot_modules = true; - FREE_C_HEAP_ARRAY(char, temp_name); - } else if (strncmp(temp_name, "PLATFORM", 8) == 0) { - process_boot_modules = false; - FREE_C_HEAP_ARRAY(char, temp_name); - } else { - // module name - if (process_boot_modules) { - _boot_modules_array->append(temp_name); - } else { - _platform_modules_array->append(temp_name); - } - } - begin_ptr = ++end_ptr; - end_ptr = strchr(begin_ptr, '\n'); - } -} -#endif - // Function add_package extracts the package from the fully qualified class name // and checks if the package is in the boot loader's package entry table. If so, // then it sets the classpath_index in the package entry record. @@ -1290,58 +1234,6 @@ objArrayOop ClassLoader::get_system_packages(TRAPS) { return result(); } -#if INCLUDE_CDS -s2 ClassLoader::module_to_classloader(const char* module_name) { - - assert(DumpSharedSpaces, "dump time only"); - assert(_boot_modules_array != NULL, "_boot_modules_array is NULL"); - assert(_platform_modules_array != NULL, "_platform_modules_array is NULL"); - - int array_size = _boot_modules_array->length(); - for (int i = 0; i < array_size; i++) { - if (strcmp(module_name, _boot_modules_array->at(i)) == 0) { - return BOOT_LOADER; - } - } - - array_size = _platform_modules_array->length(); - for (int i = 0; i < array_size; i++) { - if (strcmp(module_name, _platform_modules_array->at(i)) == 0) { - return PLATFORM_LOADER; - } - } - - return APP_LOADER; -} - -s2 ClassLoader::classloader_type(Symbol* class_name, ClassPathEntry* e, int classpath_index, TRAPS) { - assert(DumpSharedSpaces, "Only used for CDS dump time"); - - // obtain the classloader type based on the class name. - // First obtain the package name based on the class name. Then obtain - // the classloader type based on the package name from the jimage using - // a jimage API. If the classloader type cannot be found from the - // jimage, it is determined by the class path entry. - jshort loader_type = ClassLoader::APP_LOADER; - if (e->is_jrt()) { - ResourceMark rm; - TempNewSymbol pkg_name = InstanceKlass::package_from_name(class_name, CHECK_0); - if (pkg_name != NULL) { - const char* pkg_name_C_string = (const char*)(pkg_name->as_C_string()); - ClassPathImageEntry* cpie = (ClassPathImageEntry*)e; - JImageFile* jimage = cpie->jimage(); - char* module_name = (char*)(*JImagePackageToModule)(jimage, pkg_name_C_string); - if (module_name != NULL) { - loader_type = ClassLoader::module_to_classloader(module_name); - } - } - } else if (ClassLoaderExt::is_boot_classpath(classpath_index)) { - loader_type = ClassLoader::BOOT_LOADER; - } - return loader_type; -} -#endif - // caller needs ResourceMark const char* ClassLoader::file_name_for_class_name(const char* class_name, int class_name_len) { diff --git a/src/hotspot/share/classfile/classLoader.hpp b/src/hotspot/share/classfile/classLoader.hpp index c3f363c0326..382da36079b 100644 --- a/src/hotspot/share/classfile/classLoader.hpp +++ b/src/hotspot/share/classfile/classLoader.hpp @@ -37,13 +37,6 @@ // Name of boot "modules" image #define MODULES_IMAGE_NAME "modules" -// Name of the resource containing mapping from module names to defining class loader type -#define MODULE_LOADER_MAP "jdk/internal/vm/cds/resources/ModuleLoaderMap.dat" - -// Initial sizes of the following arrays are based on the generated ModuleLoaderMap.dat -#define INITIAL_BOOT_MODULES_ARRAY_SIZE 30 -#define INITIAL_PLATFORM_MODULES_ARRAY_SIZE 15 - // Class path entry (directory or zip file) class JImageFile; @@ -439,10 +432,6 @@ class ClassLoader: AllStatic { static bool check_shared_paths_misc_info(void* info, int size); static void exit_with_path_failure(const char* error, const char* message); - static s2 module_to_classloader(const char* module_name); - static void initialize_module_loader_map(JImageFile* jimage); - static s2 classloader_type(Symbol* class_name, ClassPathEntry* e, - int classpath_index, TRAPS); static void record_shared_class_loader_type(InstanceKlass* ik, const ClassFileStream* stream); #endif static JImageLocationRef jimage_find_resource(JImageFile* jf, const char* module_name, diff --git a/src/java.base/share/classes/jdk/internal/vm/cds/resources/ModuleLoaderMap.dat b/src/java.base/share/classes/jdk/internal/vm/cds/resources/ModuleLoaderMap.dat deleted file mode 100644 index a634d5b03d4..00000000000 --- a/src/java.base/share/classes/jdk/internal/vm/cds/resources/ModuleLoaderMap.dat +++ /dev/null @@ -1,4 +0,0 @@ -BOOT -@@BOOT_MODULE_NAMES@@ -PLATFORM -@@PLATFORM_MODULE_NAMES@@ From 96d081745567752fdfd2a143713b6e8f82dec1f5 Mon Sep 17 00:00:00 2001 From: Ujwal Vangapally Date: Thu, 5 Oct 2017 01:31:53 -0700 Subject: [PATCH 52/80] 8185003: JMX: Add a version of ThreadMXBean.dumpAllThreads with a maxDepth argument Added two new API's to limit the stack trace depth Reviewed-by: mchung, dfuchs, rriggs, egahlin --- src/hotspot/share/services/jmm.h | 8 +- src/hotspot/share/services/management.cpp | 9 +- src/hotspot/share/services/threadService.cpp | 8 +- .../java/lang/management/ThreadMXBean.java | 215 +++++++++++++----- .../classes/sun/management/ThreadImpl.java | 32 ++- .../share/native/include/jmm.h | 8 +- .../share/native/libmanagement/ThreadImpl.c | 8 +- .../share/native/libmanagement/management.c | 4 +- .../native/libmanagement_ext/management_ext.c | 4 +- .../MaxDepthForThreadInfoTest.java | 101 ++++++++ 10 files changed, 317 insertions(+), 80 deletions(-) create mode 100644 test/jdk/java/lang/management/ThreadMXBean/MaxDepthForThreadInfoTest.java diff --git a/src/hotspot/share/services/jmm.h b/src/hotspot/share/services/jmm.h index b6497cd8982..df232f6feec 100644 --- a/src/hotspot/share/services/jmm.h +++ b/src/hotspot/share/services/jmm.h @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2014, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -50,7 +50,8 @@ enum { JMM_VERSION_1_2 = 0x20010200, // JDK 7 JMM_VERSION_1_2_1 = 0x20010201, // JDK 7 GA JMM_VERSION_1_2_2 = 0x20010202, - JMM_VERSION = 0x20010203 + JMM_VERSION_2 = 0x20020000, // JDK 10 + JMM_VERSION = 0x20020000 }; typedef struct { @@ -315,7 +316,8 @@ typedef struct jmmInterface_1_ { jobjectArray (JNICALL *DumpThreads) (JNIEnv *env, jlongArray ids, jboolean lockedMonitors, - jboolean lockedSynchronizers); + jboolean lockedSynchronizers, + jint maxDepth); void (JNICALL *SetGCNotificationEnabled) (JNIEnv *env, jobject mgr, jboolean enabled); diff --git a/src/hotspot/share/services/management.cpp b/src/hotspot/share/services/management.cpp index 12d88b7419f..bc50816d83d 100644 --- a/src/hotspot/share/services/management.cpp +++ b/src/hotspot/share/services/management.cpp @@ -1160,7 +1160,8 @@ JVM_END // locked_monitors - if true, dump locked object monitors // locked_synchronizers - if true, dump locked JSR-166 synchronizers // -JVM_ENTRY(jobjectArray, jmm_DumpThreads(JNIEnv *env, jlongArray thread_ids, jboolean locked_monitors, jboolean locked_synchronizers)) +JVM_ENTRY(jobjectArray, jmm_DumpThreads(JNIEnv *env, jlongArray thread_ids, jboolean locked_monitors, + jboolean locked_synchronizers, jint maxDepth)) ResourceMark rm(THREAD); // make sure the AbstractOwnableSynchronizer klass is loaded before taking thread snapshots @@ -1181,14 +1182,14 @@ JVM_ENTRY(jobjectArray, jmm_DumpThreads(JNIEnv *env, jlongArray thread_ids, jboo do_thread_dump(&dump_result, ids_ah, num_threads, - -1, /* entire stack */ + maxDepth, /* stack depth */ (locked_monitors ? true : false), /* with locked monitors */ (locked_synchronizers ? true : false), /* with locked synchronizers */ CHECK_NULL); } else { // obtain thread dump of all threads VM_ThreadDump op(&dump_result, - -1, /* entire stack */ + maxDepth, /* stack depth */ (locked_monitors ? true : false), /* with locked monitors */ (locked_synchronizers ? true : false) /* with locked synchronizers */); VMThread::execute(&op); @@ -2237,7 +2238,7 @@ const struct jmmInterface_1_ jmm_interface = { void* Management::get_jmm_interface(int version) { #if INCLUDE_MANAGEMENT - if (version == JMM_VERSION_1_0) { + if (version == JMM_VERSION) { return (void*) &jmm_interface; } #endif // INCLUDE_MANAGEMENT diff --git a/src/hotspot/share/services/threadService.cpp b/src/hotspot/share/services/threadService.cpp index 1100cb07971..da25120bb37 100644 --- a/src/hotspot/share/services/threadService.cpp +++ b/src/hotspot/share/services/threadService.cpp @@ -562,6 +562,10 @@ void ThreadStackTrace::dump_stack_at_safepoint(int maxDepth) { vframe* start_vf = _thread->last_java_vframe(®_map); int count = 0; for (vframe* f = start_vf; f; f = f->sender() ) { + if (maxDepth >= 0 && count == maxDepth) { + // Skip frames if more than maxDepth + break; + } if (f->is_java_frame()) { javaVFrame* jvf = javaVFrame::cast(f); add_stack_frame(jvf); @@ -569,10 +573,6 @@ void ThreadStackTrace::dump_stack_at_safepoint(int maxDepth) { } else { // Ignore non-Java frames } - if (maxDepth > 0 && count == maxDepth) { - // Skip frames if more than maxDepth - break; - } } } diff --git a/src/java.management/share/classes/java/lang/management/ThreadMXBean.java b/src/java.management/share/classes/java/lang/management/ThreadMXBean.java index 48fafa5f248..f8b48736821 100644 --- a/src/java.management/share/classes/java/lang/management/ThreadMXBean.java +++ b/src/java.management/share/classes/java/lang/management/ThreadMXBean.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2013, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -687,52 +687,13 @@ public interface ThreadMXBean extends PlatformManagedObject { /** * Returns the thread info for each thread - * whose ID is in the input array {@code ids}, with stack trace - * and synchronization information. - * - *

- * This method obtains a snapshot of the thread information - * for each thread including: - *

    - *
  • the entire stack trace,
  • - *
  • the object monitors currently locked by the thread - * if {@code lockedMonitors} is {@code true}, and
  • - *
  • the - * ownable synchronizers currently locked by the thread - * if {@code lockedSynchronizers} is {@code true}.
  • - *
- *

- * This method returns an array of the {@code ThreadInfo} objects, - * each is the thread information about the thread with the same index - * as in the {@code ids} array. - * If a thread of the given ID is not alive or does not exist, - * {@code null} will be set in the corresponding element - * in the returned array. A thread is alive if - * it has been started and has not yet died. - *

- * If a thread does not lock any object monitor or {@code lockedMonitors} - * is {@code false}, the returned {@code ThreadInfo} object will have an - * empty {@code MonitorInfo} array. Similarly, if a thread does not - * lock any synchronizer or {@code lockedSynchronizers} is {@code false}, - * the returned {@code ThreadInfo} object - * will have an empty {@code LockInfo} array. - * - *

- * When both {@code lockedMonitors} and {@code lockedSynchronizers} - * parameters are {@code false}, it is equivalent to calling: - *

-     *     {@link #getThreadInfo(long[], int)  getThreadInfo(ids, Integer.MAX_VALUE)}
-     * 
- * - *

- * This method is designed for troubleshooting use, but not for - * synchronization control. It might be an expensive operation. - * - *

- * MBeanServer access:
- * The mapped type of {@code ThreadInfo} is - * {@code CompositeData} with attributes as specified in the - * {@link ThreadInfo#from ThreadInfo.from} method. + * whose ID is in the input array {@code ids}, + * with stack trace and synchronization information. + * This is equivalent to calling: + *

+ * {@link #getThreadInfo(long[], boolean, boolean, int) + * getThreadInfo(ids, lockedMonitors, lockedSynchronizers, Integer.MAX_VALUE)} + *
* * @param ids an array of thread IDs. * @param lockedMonitors if {@code true}, retrieves all locked monitors. @@ -763,18 +724,110 @@ public interface ThreadMXBean extends PlatformManagedObject { * * @since 1.6 */ - public ThreadInfo[] getThreadInfo(long[] ids, boolean lockedMonitors, boolean lockedSynchronizers); + public ThreadInfo[] getThreadInfo(long[] ids, boolean lockedMonitors, + boolean lockedSynchronizers); + + /** + * Returns the thread info for each thread whose ID + * is in the input array {@code ids}, + * with stack trace of the specified maximum number of elements + * and synchronization information. + * If {@code maxDepth == 0}, no stack trace of the thread + * will be dumped. + * + *

+ * This method obtains a snapshot of the thread information + * for each thread including: + *

    + *
  • stack trace of the specified maximum number of elements,
  • + *
  • the object monitors currently locked by the thread + * if {@code lockedMonitors} is {@code true}, and
  • + *
  • the + * ownable synchronizers currently locked by the thread + * if {@code lockedSynchronizers} is {@code true}.
  • + *
+ *

+ * This method returns an array of the {@code ThreadInfo} objects, + * each is the thread information about the thread with the same index + * as in the {@code ids} array. + * If a thread of the given ID is not alive or does not exist, + * {@code null} will be set in the corresponding element + * in the returned array. A thread is alive if + * it has been started and has not yet died. + *

+ * If a thread does not lock any object monitor or {@code lockedMonitors} + * is {@code false}, the returned {@code ThreadInfo} object will have an + * empty {@code MonitorInfo} array. Similarly, if a thread does not + * lock any synchronizer or {@code lockedSynchronizers} is {@code false}, + * the returned {@code ThreadInfo} object + * will have an empty {@code LockInfo} array. + * + *

+ * When both {@code lockedMonitors} and {@code lockedSynchronizers} + * parameters are {@code false}, it is equivalent to calling: + *

+     *     {@link #getThreadInfo(long[], int)  getThreadInfo(ids, maxDepth)}
+     * 
+ * + *

+ * This method is designed for troubleshooting use, but not for + * synchronization control. It might be an expensive operation. + * + *

+ * MBeanServer access:
+ * The mapped type of {@code ThreadInfo} is + * {@code CompositeData} with attributes as specified in the + * {@link ThreadInfo#from ThreadInfo.from} method. + * + * @implSpec The default implementation throws + * {@code UnsupportedOperationException}. + * + * @param ids an array of thread IDs. + * @param lockedMonitors if {@code true}, retrieves all locked monitors. + * @param lockedSynchronizers if {@code true}, retrieves all locked + * ownable synchronizers. + * @param maxDepth indicates the maximum number of + * {@link StackTraceElement} to be retrieved from the stack trace. + * + * @return an array of the {@link ThreadInfo} objects, each containing + * information about a thread whose ID is in the corresponding + * element of the input array of IDs. + * + * @throws IllegalArgumentException if {@code maxDepth} is negative. + * @throws java.lang.SecurityException if a security manager + * exists and the caller does not have + * ManagementPermission("monitor"). + * @throws java.lang.UnsupportedOperationException + *

    + *
  • if {@code lockedMonitors} is {@code true} but + * the Java virtual machine does not support monitoring + * of {@linkplain #isObjectMonitorUsageSupported + * object monitor usage}; or
  • + *
  • if {@code lockedSynchronizers} is {@code true} but + * the Java virtual machine does not support monitoring + * of {@linkplain #isSynchronizerUsageSupported + * ownable synchronizer usage}.
  • + *
+ * + * @see #isObjectMonitorUsageSupported + * @see #isSynchronizerUsageSupported + * + * @since 10 + */ + + public default ThreadInfo[] getThreadInfo(long[] ids, boolean lockedMonitors, + boolean lockedSynchronizers, int maxDepth) { + throw new UnsupportedOperationException(); + } /** * Returns the thread info for all live threads with stack trace * and synchronization information. - * Some threads included in the returned array - * may have been terminated when this method returns. - * - *

- * This method returns an array of {@link ThreadInfo} objects - * as specified in the {@link #getThreadInfo(long[], boolean, boolean)} - * method. + * This is equivalent to calling: + *

+ * {@link #dumpAllThreads(boolean, boolean, int) + * dumpAllThreads(lockedMonitors, lockedSynchronizers, Integer.MAX_VALUE)} + *
* * @param lockedMonitors if {@code true}, dump all locked monitors. * @param lockedSynchronizers if {@code true}, dump all locked @@ -803,4 +856,56 @@ public interface ThreadMXBean extends PlatformManagedObject { * @since 1.6 */ public ThreadInfo[] dumpAllThreads(boolean lockedMonitors, boolean lockedSynchronizers); + + + /** + * Returns the thread info for all live threads + * with stack trace of the specified maximum number of elements + * and synchronization information. + * if {@code maxDepth == 0}, no stack trace of the thread + * will be dumped. + * Some threads included in the returned array + * may have been terminated when this method returns. + * + *

+ * This method returns an array of {@link ThreadInfo} objects + * as specified in the {@link #getThreadInfo(long[], boolean, boolean, int)} + * method. + * + * @implSpec The default implementation throws + * {@code UnsupportedOperationException}. + * + * @param lockedMonitors if {@code true}, dump all locked monitors. + * @param lockedSynchronizers if {@code true}, dump all locked + * ownable synchronizers. + * @param maxDepth indicates the maximum number of + * {@link StackTraceElement} to be retrieved from the stack trace. + * + * @return an array of {@link ThreadInfo} for all live threads. + * + * @throws IllegalArgumentException if {@code maxDepth} is negative. + * @throws java.lang.SecurityException if a security manager + * exists and the caller does not have + * ManagementPermission("monitor"). + * @throws java.lang.UnsupportedOperationException + *

    + *
  • if {@code lockedMonitors} is {@code true} but + * the Java virtual machine does not support monitoring + * of {@linkplain #isObjectMonitorUsageSupported + * object monitor usage}; or
  • + *
  • if {@code lockedSynchronizers} is {@code true} but + * the Java virtual machine does not support monitoring + * of {@linkplain #isSynchronizerUsageSupported + * ownable synchronizer usage}.
  • + *
+ * + * @see #isObjectMonitorUsageSupported + * @see #isSynchronizerUsageSupported + * + * @since 10 + */ + public default ThreadInfo[] dumpAllThreads(boolean lockedMonitors, + boolean lockedSynchronizers, int maxDepth) { + throw new UnsupportedOperationException(); + } } diff --git a/src/java.management/share/classes/sun/management/ThreadImpl.java b/src/java.management/share/classes/sun/management/ThreadImpl.java index 129ecfcc5da..9e6d8e274bd 100644 --- a/src/java.management/share/classes/sun/management/ThreadImpl.java +++ b/src/java.management/share/classes/sun/management/ThreadImpl.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -463,20 +463,43 @@ public class ThreadImpl implements ThreadMXBean { public ThreadInfo[] getThreadInfo(long[] ids, boolean lockedMonitors, boolean lockedSynchronizers) { + return dumpThreads0(ids, lockedMonitors, lockedSynchronizers, + Integer.MAX_VALUE); + } + + public ThreadInfo[] getThreadInfo(long[] ids, + boolean lockedMonitors, + boolean lockedSynchronizers, + int maxDepth) { + if (maxDepth < 0) { + throw new IllegalArgumentException( + "Invalid maxDepth parameter: " + maxDepth); + } verifyThreadIds(ids); // ids has been verified to be non-null // an empty array of ids should return an empty array of ThreadInfos if (ids.length == 0) return new ThreadInfo[0]; verifyDumpThreads(lockedMonitors, lockedSynchronizers); - return dumpThreads0(ids, lockedMonitors, lockedSynchronizers); + return dumpThreads0(ids, lockedMonitors, lockedSynchronizers, maxDepth); } @Override public ThreadInfo[] dumpAllThreads(boolean lockedMonitors, boolean lockedSynchronizers) { + return dumpAllThreads(lockedMonitors, lockedSynchronizers, + Integer.MAX_VALUE); + } + + public ThreadInfo[] dumpAllThreads(boolean lockedMonitors, + boolean lockedSynchronizers, + int maxDepth) { + if (maxDepth < 0) { + throw new IllegalArgumentException( + "Invalid maxDepth parameter: " + maxDepth); + } verifyDumpThreads(lockedMonitors, lockedSynchronizers); - return dumpThreads0(null, lockedMonitors, lockedSynchronizers); + return dumpThreads0(null, lockedMonitors, lockedSynchronizers, maxDepth); } // VM support where maxDepth == -1 to request entire stack dump @@ -497,7 +520,8 @@ public class ThreadImpl implements ThreadMXBean { private static native void resetPeakThreadCount0(); private static native ThreadInfo[] dumpThreads0(long[] ids, boolean lockedMonitors, - boolean lockedSynchronizers); + boolean lockedSynchronizers, + int maxDepth); // tid == 0 to reset contention times for all threads private static native void resetContentionTimes0(long tid); diff --git a/src/java.management/share/native/include/jmm.h b/src/java.management/share/native/include/jmm.h index 9e21296bc0b..d4adc367fd9 100644 --- a/src/java.management/share/native/include/jmm.h +++ b/src/java.management/share/native/include/jmm.h @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2014, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -50,7 +50,8 @@ enum { JMM_VERSION_1_2 = 0x20010200, // JDK 7 JMM_VERSION_1_2_1 = 0x20010201, // JDK 7 GA JMM_VERSION_1_2_2 = 0x20010202, - JMM_VERSION = 0x20010203 + JMM_VERSION_2 = 0x20020000, // JDK 10 + JMM_VERSION = 0x20020000 }; typedef struct { @@ -315,7 +316,8 @@ typedef struct jmmInterface_1_ { jobjectArray (JNICALL *DumpThreads) (JNIEnv *env, jlongArray ids, jboolean lockedMonitors, - jboolean lockedSynchronizers); + jboolean lockedSynchronizers, + jint maxDepth); void (JNICALL *SetGCNotificationEnabled) (JNIEnv *env, jobject mgr, jboolean enabled); diff --git a/src/java.management/share/native/libmanagement/ThreadImpl.c b/src/java.management/share/native/libmanagement/ThreadImpl.c index 9e1baadf15c..1dd0b001cfc 100644 --- a/src/java.management/share/native/libmanagement/ThreadImpl.c +++ b/src/java.management/share/native/libmanagement/ThreadImpl.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2011, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -135,7 +135,9 @@ Java_sun_management_ThreadImpl_resetContentionTimes0 JNIEXPORT jobjectArray JNICALL Java_sun_management_ThreadImpl_dumpThreads0 - (JNIEnv *env, jclass cls, jlongArray ids, jboolean lockedMonitors, jboolean lockedSynchronizers) + (JNIEnv *env, jclass cls, jlongArray ids, jboolean lockedMonitors, + jboolean lockedSynchronizers, jint maxDepth) { - return jmm_interface->DumpThreads(env, ids, lockedMonitors, lockedSynchronizers); + return jmm_interface->DumpThreads(env, ids, lockedMonitors, + lockedSynchronizers, maxDepth); } diff --git a/src/java.management/share/native/libmanagement/management.c b/src/java.management/share/native/libmanagement/management.c index d909416719e..281e3d0ffac 100644 --- a/src/java.management/share/native/libmanagement/management.c +++ b/src/java.management/share/native/libmanagement/management.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -44,7 +44,7 @@ JNIEXPORT jint JNICALL return JNI_ERR; } - jmm_interface = (JmmInterface*) JVM_GetManagement(JMM_VERSION_1_0); + jmm_interface = (JmmInterface*) JVM_GetManagement(JMM_VERSION); if (jmm_interface == NULL) { JNU_ThrowInternalError(env, "Unsupported Management version"); return JNI_ERR; diff --git a/src/jdk.management/share/native/libmanagement_ext/management_ext.c b/src/jdk.management/share/native/libmanagement_ext/management_ext.c index dbb9f027137..02285521042 100644 --- a/src/jdk.management/share/native/libmanagement_ext/management_ext.c +++ b/src/jdk.management/share/native/libmanagement_ext/management_ext.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2015, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -44,7 +44,7 @@ JNIEXPORT jint JNICALL return JNI_ERR; } - jmm_interface = (JmmInterface*) JVM_GetManagement(JMM_VERSION_1_0); + jmm_interface = (JmmInterface*) JVM_GetManagement(JMM_VERSION); if (jmm_interface == NULL) { JNU_ThrowInternalError(env, "Unsupported Management version"); return JNI_ERR; diff --git a/test/jdk/java/lang/management/ThreadMXBean/MaxDepthForThreadInfoTest.java b/test/jdk/java/lang/management/ThreadMXBean/MaxDepthForThreadInfoTest.java new file mode 100644 index 00000000000..67a8a53913b --- /dev/null +++ b/test/jdk/java/lang/management/ThreadMXBean/MaxDepthForThreadInfoTest.java @@ -0,0 +1,101 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @bug 8185003 + * @build ThreadDump + * @run main MaxDepthForThreadInfoTest + * @summary verifies the functionality of ThreadMXBean.dumpAllThreads + * and ThreadMXBean.getThreadInfo with maxDepth argument + */ + +import java.lang.management.ManagementFactory; +import java.lang.management.ThreadInfo; +import java.lang.management.ThreadMXBean; + + + +public class MaxDepthForThreadInfoTest { + + + public static void main(String[] Args) { + + ThreadMXBean tmxb = ManagementFactory.getThreadMXBean(); + + long[] threadIds = tmxb.getAllThreadIds(); + + ThreadInfo[] tinfos = tmxb.getThreadInfo(threadIds, true, true, 0); + for (ThreadInfo ti : tinfos) { + if (ti.getStackTrace().length > 0) { + ThreadDump.printThreadInfo(ti); + throw new RuntimeException("more than requested " + + "number of frames dumped"); + } + } + + tinfos = tmxb.getThreadInfo(threadIds, true, true, 3); + for (ThreadInfo ti : tinfos) { + if (ti.getStackTrace().length > 3) { + ThreadDump.printThreadInfo(ti); + throw new RuntimeException("more than requested " + + "number of frames dumped"); + } + } + + try { + tmxb.getThreadInfo(threadIds, true, true, -1); + throw new RuntimeException("Didn't throw IllegalArgumentException " + + "for negative maxdepth value"); + } catch (IllegalArgumentException e) { + System.out.println("Throwed IllegalArgumentException as expected"); + } + + tinfos = tmxb.dumpAllThreads(true, true, 0); + for (ThreadInfo ti : tinfos) { + if (ti.getStackTrace().length > 0) { + ThreadDump.printThreadInfo(ti); + throw new RuntimeException("more than requested " + + "number of frames dumped"); + } + } + tinfos = tmxb.dumpAllThreads(true, true, 2); + for (ThreadInfo ti : tinfos) { + if (ti.getStackTrace().length > 2) { + ThreadDump.printThreadInfo(ti); + throw new RuntimeException("more than requested " + + "number of frames dumped"); + } + } + + try { + tmxb.dumpAllThreads(true, true, -1); + throw new RuntimeException("Didn't throw IllegalArgumentException " + + "for negative maxdepth value"); + } catch (IllegalArgumentException e) { + System.out.println("Throwed IllegalArgumentException as expected"); + } + + System.out.println("Test passed"); + } +} From b6bc02e70f139ad3ab98a75a78b30e5af63f1984 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Erik=20=C3=96sterlund?= Date: Thu, 5 Oct 2017 10:55:34 +0200 Subject: [PATCH 53/80] 8188224: Generalize Atomic::load/store to use templates Reviewed-by: dholmes, coleenp --- src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp | 16 -- src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp | 39 +--- .../os_cpu/bsd_zero/atomic_bsd_zero.hpp | 35 +-- .../linux_aarch64/atomic_linux_aarch64.hpp | 18 -- .../os_cpu/linux_arm/atomic_linux_arm.hpp | 47 ++-- .../os_cpu/linux_ppc/atomic_linux_ppc.hpp | 16 -- .../os_cpu/linux_s390/atomic_linux_s390.hpp | 16 -- .../os_cpu/linux_sparc/atomic_linux_sparc.hpp | 16 -- .../os_cpu/linux_x86/atomic_linux_x86.hpp | 38 +-- .../os_cpu/linux_zero/atomic_linux_zero.hpp | 29 +-- .../solaris_sparc/atomic_solaris_sparc.hpp | 16 -- .../os_cpu/solaris_x86/atomic_solaris_x86.hpp | 18 -- .../os_cpu/windows_x86/atomic_windows_x86.hpp | 41 +--- src/hotspot/share/runtime/atomic.hpp | 219 ++++++++++++++++-- 14 files changed, 279 insertions(+), 285 deletions(-) diff --git a/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp b/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp index 5ef5ce7f1bf..c1c9132d672 100644 --- a/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp +++ b/src/hotspot/os_cpu/aix_ppc/atomic_aix_ppc.hpp @@ -34,22 +34,6 @@ // Implementation of class atomic -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - // // machine barrier instructions: // diff --git a/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp b/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp index 4720e67e405..458dcf242c8 100644 --- a/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp +++ b/src/hotspot/os_cpu/bsd_x86/atomic_bsd_x86.hpp @@ -27,19 +27,6 @@ // Implementation of class atomic -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - - template struct Atomic::PlatformAdd : Atomic::FetchAndAdd > @@ -102,9 +89,6 @@ inline T Atomic::PlatformCmpxchg<4>::operator()(T exchange_value, } #ifdef AMD64 -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } - template<> template inline D Atomic::PlatformAdd<8>::fetch_and_add(I add_value, D volatile* dest) const { @@ -144,8 +128,6 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, return exchange_value; } -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - #else // !AMD64 extern "C" { @@ -164,18 +146,21 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, return cmpxchg_using_helper(_Atomic_cmpxchg_long, exchange_value, dest, compare_value); } -inline jlong Atomic::load(const volatile jlong* src) { +template<> +template +inline T Atomic::PlatformLoad<8>::operator()(T const volatile* src) const { + STATIC_ASSERT(8 == sizeof(T)); volatile jlong dest; - _Atomic_move_long(src, &dest); - return dest; + _Atomic_move_long(reinterpret_cast(src), reinterpret_cast(&dest)); + return PrimitiveConversions::cast(dest); } -inline void Atomic::store(jlong store_value, jlong* dest) { - _Atomic_move_long((volatile jlong*)&store_value, (volatile jlong*)dest); -} - -inline void Atomic::store(jlong store_value, volatile jlong* dest) { - _Atomic_move_long((volatile jlong*)&store_value, dest); +template<> +template +inline void Atomic::PlatformStore<8>::operator()(T store_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + _Atomic_move_long(reinterpret_cast(&store_value), reinterpret_cast(dest)); } #endif // AMD64 diff --git a/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp b/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp index 7b76258649d..0daea3c6c4b 100644 --- a/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp +++ b/src/hotspot/os_cpu/bsd_zero/atomic_bsd_zero.hpp @@ -159,20 +159,6 @@ static inline int arm_lock_test_and_set(int newval, volatile int *ptr) { } #endif // ARM -inline void Atomic::store(jint store_value, volatile jint* dest) { -#if !defined(ARM) && !defined(M68K) - __sync_synchronize(); -#endif - *dest = store_value; -} - -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { -#if !defined(ARM) && !defined(M68K) - __sync_synchronize(); -#endif - *dest = store_value; -} - template struct Atomic::PlatformAdd : Atomic::AddAndFetch > @@ -275,18 +261,21 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, return __sync_val_compare_and_swap(dest, compare_value, exchange_value); } -inline jlong Atomic::load(const volatile jlong* src) { +template<> +template +inline T Atomic::PlatformLoad<8>::operator()(T const volatile* src) const { + STATIC_ASSERT(8 == sizeof(T)); volatile jlong dest; - os::atomic_copy64(src, &dest); - return dest; + os::atomic_copy64(reinterpret_cast(src), reinterpret_cast(&dest)); + return PrimitiveConversions::cast(dest); } -inline void Atomic::store(jlong store_value, jlong* dest) { - os::atomic_copy64((volatile jlong*)&store_value, (volatile jlong*)dest); -} - -inline void Atomic::store(jlong store_value, volatile jlong* dest) { - os::atomic_copy64((volatile jlong*)&store_value, dest); +template<> +template +inline void Atomic::PlatformStore<8>::operator()(T store_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + os::atomic_copy64(reinterpret_cast(&store_value), reinterpret_cast(dest)); } #endif // OS_CPU_BSD_ZERO_VM_ATOMIC_BSD_ZERO_HPP diff --git a/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp b/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp index 88ba2654cc4..e4076609924 100644 --- a/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp +++ b/src/hotspot/os_cpu/linux_aarch64/atomic_linux_aarch64.hpp @@ -34,19 +34,6 @@ #define READ_MEM_BARRIER __atomic_thread_fence(__ATOMIC_ACQUIRE); #define WRITE_MEM_BARRIER __atomic_thread_fence(__ATOMIC_RELEASE); -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - - template struct Atomic::PlatformAdd : Atomic::AddAndFetch > @@ -84,9 +71,4 @@ inline T Atomic::PlatformCmpxchg::operator()(T exchange_value, } } -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } - -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - #endif // OS_CPU_LINUX_AARCH64_VM_ATOMIC_LINUX_AARCH64_HPP diff --git a/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp b/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp index 930d79289c0..d5c6ecd9f8d 100644 --- a/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp +++ b/src/hotspot/os_cpu/linux_arm/atomic_linux_arm.hpp @@ -44,39 +44,24 @@ * kernel source or kernel_user_helpers.txt in Linux Doc. */ -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } +#ifndef AARCH64 +template<> +template +inline T Atomic::PlatformLoad<8>::operator()(T const volatile* src) const { + STATIC_ASSERT(8 == sizeof(T)); + return PrimitiveConversions::cast( + (*os::atomic_load_long_func)(reinterpret_cast(src))); +} -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - -inline jlong Atomic::load (const volatile jlong* src) { - assert(((intx)src & (sizeof(jlong)-1)) == 0, "Atomic load jlong mis-aligned"); -#ifdef AARCH64 - return *src; -#else - return (*os::atomic_load_long_func)(src); +template<> +template +inline void Atomic::PlatformStore<8>::operator()(T store_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + (*os::atomic_store_long_func)( + PrimitiveConversions::cast(store_value), reinterpret_cast(dest)); +} #endif -} - -inline void Atomic::store (jlong value, volatile jlong* dest) { - assert(((intx)dest & (sizeof(jlong)-1)) == 0, "Atomic store jlong mis-aligned"); -#ifdef AARCH64 - *dest = value; -#else - (*os::atomic_store_long_func)(value, dest); -#endif -} - -inline void Atomic::store (jlong value, jlong* dest) { - store(value, (volatile jlong*)dest); -} // As per atomic.hpp all read-modify-write operations have to provide two-way // barriers semantics. For AARCH64 we are using load-acquire-with-reservation and diff --git a/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp b/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp index 0056e306644..48680690591 100644 --- a/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp +++ b/src/hotspot/os_cpu/linux_ppc/atomic_linux_ppc.hpp @@ -32,22 +32,6 @@ // Implementation of class atomic -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - // // machine barrier instructions: // diff --git a/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp b/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp index 1f5db81b853..5821bb018c3 100644 --- a/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp +++ b/src/hotspot/os_cpu/linux_s390/atomic_linux_s390.hpp @@ -53,20 +53,6 @@ // is an integer multiple of the data length. Furthermore, all stores are ordered: // a store which occurs conceptually before another store becomes visible to other CPUs // before the other store becomes visible. -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - //------------ // Atomic::add @@ -335,6 +321,4 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T xchg_val, return old; } -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - #endif // OS_CPU_LINUX_S390_VM_ATOMIC_LINUX_S390_INLINE_HPP diff --git a/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp b/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp index c671af04417..46a1268347a 100644 --- a/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp +++ b/src/hotspot/os_cpu/linux_sparc/atomic_linux_sparc.hpp @@ -27,22 +27,6 @@ // Implementation of class atomic -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - template struct Atomic::PlatformAdd : Atomic::AddAndFetch > diff --git a/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp b/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp index cbe5c3ede8a..be5649dc401 100644 --- a/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp +++ b/src/hotspot/os_cpu/linux_x86/atomic_linux_x86.hpp @@ -27,19 +27,6 @@ // Implementation of class atomic -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - - template struct Atomic::PlatformAdd : Atomic::FetchAndAdd > @@ -102,8 +89,6 @@ inline T Atomic::PlatformCmpxchg<4>::operator()(T exchange_value, } #ifdef AMD64 -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } template<> template @@ -144,8 +129,6 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, return exchange_value; } -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - #else // !AMD64 extern "C" { @@ -164,18 +147,21 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, return cmpxchg_using_helper(_Atomic_cmpxchg_long, exchange_value, dest, compare_value); } -inline jlong Atomic::load(const volatile jlong* src) { +template<> +template +inline T Atomic::PlatformLoad<8>::operator()(T const volatile* src) const { + STATIC_ASSERT(8 == sizeof(T)); volatile jlong dest; - _Atomic_move_long(src, &dest); - return dest; + _Atomic_move_long(reinterpret_cast(src), reinterpret_cast(&dest)); + return PrimitiveConversions::cast(dest); } -inline void Atomic::store(jlong store_value, jlong* dest) { - _Atomic_move_long((volatile jlong*)&store_value, (volatile jlong*)dest); -} - -inline void Atomic::store(jlong store_value, volatile jlong* dest) { - _Atomic_move_long((volatile jlong*)&store_value, dest); +template<> +template +inline void Atomic::PlatformStore<8>::operator()(T store_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + _Atomic_move_long(reinterpret_cast(&store_value), reinterpret_cast(dest)); } #endif // AMD64 diff --git a/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp b/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp index 68d9575acae..0713b6de460 100644 --- a/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp +++ b/src/hotspot/os_cpu/linux_zero/atomic_linux_zero.hpp @@ -159,14 +159,6 @@ static inline int arm_lock_test_and_set(int newval, volatile int *ptr) { } #endif // ARM -inline void Atomic::store(jint store_value, volatile jint* dest) { - *dest = store_value; -} - -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { - *dest = store_value; -} - template struct Atomic::PlatformAdd : Atomic::AddAndFetch > @@ -269,18 +261,21 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, return __sync_val_compare_and_swap(dest, compare_value, exchange_value); } -inline jlong Atomic::load(const volatile jlong* src) { +template<> +template +inline T Atomic::PlatformLoad<8>::operator()(T const volatile* src) const { + STATIC_ASSERT(8 == sizeof(T)); volatile jlong dest; - os::atomic_copy64(src, &dest); - return dest; + os::atomic_copy64(reinterpret_cast(src), reinterpret_cast(&dest)); + return PrimitiveConversions::cast(dest); } -inline void Atomic::store(jlong store_value, jlong* dest) { - os::atomic_copy64((volatile jlong*)&store_value, (volatile jlong*)dest); -} - -inline void Atomic::store(jlong store_value, volatile jlong* dest) { - os::atomic_copy64((volatile jlong*)&store_value, dest); +template<> +template +inline void Atomic::PlatformStore<8>::operator()(T store_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + os::atomic_copy64(reinterpret_cast(&store_value), reinterpret_cast(dest)); } #endif // OS_CPU_LINUX_ZERO_VM_ATOMIC_LINUX_ZERO_HPP diff --git a/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp b/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp index b76aed3da85..a8e00217da5 100644 --- a/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp +++ b/src/hotspot/os_cpu/solaris_sparc/atomic_solaris_sparc.hpp @@ -27,22 +27,6 @@ // Implementation of class atomic -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - -inline void Atomic::store(jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store(jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - // Implement ADD using a CAS loop. template struct Atomic::PlatformAdd VALUE_OBJ_CLASS_SPEC { diff --git a/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp b/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp index fdf6f47cdf0..4acd7df025d 100644 --- a/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp +++ b/src/hotspot/os_cpu/solaris_x86/atomic_solaris_x86.hpp @@ -25,20 +25,6 @@ #ifndef OS_CPU_SOLARIS_X86_VM_ATOMIC_SOLARIS_X86_HPP #define OS_CPU_SOLARIS_X86_VM_ATOMIC_SOLARIS_X86_HPP -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } - - -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - // For Sun Studio - implementation is in solaris_x86_64.il. extern "C" { @@ -151,8 +137,4 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, PrimitiveConversions::cast(compare_value))); } -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - #endif // OS_CPU_SOLARIS_X86_VM_ATOMIC_SOLARIS_X86_HPP diff --git a/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp b/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp index 15635f2d6ed..e9f7b761e35 100644 --- a/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp +++ b/src/hotspot/os_cpu/windows_x86/atomic_windows_x86.hpp @@ -42,21 +42,6 @@ #pragma warning(disable: 4035) // Disables warnings reporting missing return statement -inline void Atomic::store (jbyte store_value, jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, jint* dest) { *dest = store_value; } - -inline void Atomic::store_ptr(intptr_t store_value, intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, void* dest) { *(void**)dest = store_value; } - -inline void Atomic::store (jbyte store_value, volatile jbyte* dest) { *dest = store_value; } -inline void Atomic::store (jshort store_value, volatile jshort* dest) { *dest = store_value; } -inline void Atomic::store (jint store_value, volatile jint* dest) { *dest = store_value; } - - -inline void Atomic::store_ptr(intptr_t store_value, volatile intptr_t* dest) { *dest = store_value; } -inline void Atomic::store_ptr(void* store_value, volatile void* dest) { *(void* volatile *)dest = store_value; } - template struct Atomic::PlatformAdd : Atomic::AddAndFetch > @@ -66,9 +51,6 @@ struct Atomic::PlatformAdd }; #ifdef AMD64 -inline void Atomic::store (jlong store_value, jlong* dest) { *dest = store_value; } -inline void Atomic::store (jlong store_value, volatile jlong* dest) { *dest = store_value; } - template<> template inline D Atomic::PlatformAdd<4>::add_and_fetch(I add_value, D volatile* dest) const { @@ -112,8 +94,6 @@ DEFINE_STUB_CMPXCHG(8, jlong, os::atomic_cmpxchg_long_func) #undef DEFINE_STUB_CMPXCHG -inline jlong Atomic::load(const volatile jlong* src) { return *src; } - #else // !AMD64 template<> @@ -200,9 +180,12 @@ inline T Atomic::PlatformCmpxchg<8>::operator()(T exchange_value, } } -inline jlong Atomic::load(const volatile jlong* src) { - volatile jlong dest; - volatile jlong* pdest = &dest; +template<> +template +inline T Atomic::PlatformLoad<8>::operator()(T const volatile* src) const { + STATIC_ASSERT(8 == sizeof(T)); + volatile T dest; + volatile T* pdest = &dest; __asm { mov eax, src fild qword ptr [eax] @@ -212,8 +195,12 @@ inline jlong Atomic::load(const volatile jlong* src) { return dest; } -inline void Atomic::store(jlong store_value, volatile jlong* dest) { - volatile jlong* src = &store_value; +template<> +template +inline void Atomic::PlatformStore<8>::operator()(T store_value, + T volatile* dest) const { + STATIC_ASSERT(8 == sizeof(T)); + volatile T* src = &store_value; __asm { mov eax, src fild qword ptr [eax] @@ -222,10 +209,6 @@ inline void Atomic::store(jlong store_value, volatile jlong* dest) { } } -inline void Atomic::store(jlong store_value, jlong* dest) { - Atomic::store(store_value, (volatile jlong*)dest); -} - #endif // AMD64 #pragma warning(default: 4035) // Enables warnings reporting missing return statement diff --git a/src/hotspot/share/runtime/atomic.hpp b/src/hotspot/share/runtime/atomic.hpp index e6f94f6f169..69376db06ad 100644 --- a/src/hotspot/share/runtime/atomic.hpp +++ b/src/hotspot/share/runtime/atomic.hpp @@ -64,24 +64,25 @@ class Atomic : AllStatic { // we can prove that a weaker form is sufficiently safe. // Atomically store to a location - inline static void store (jbyte store_value, jbyte* dest); - inline static void store (jshort store_value, jshort* dest); - inline static void store (jint store_value, jint* dest); - // See comment above about using jlong atomics on 32-bit platforms - inline static void store (jlong store_value, jlong* dest); - inline static void store_ptr(intptr_t store_value, intptr_t* dest); - inline static void store_ptr(void* store_value, void* dest); + // The type T must be either a pointer type convertible to or equal + // to D, an integral/enum type equal to D, or a type equal to D that + // is primitive convertible using PrimitiveConversions. + template + inline static void store(T store_value, volatile D* dest); - inline static void store (jbyte store_value, volatile jbyte* dest); - inline static void store (jshort store_value, volatile jshort* dest); - inline static void store (jint store_value, volatile jint* dest); - // See comment above about using jlong atomics on 32-bit platforms - inline static void store (jlong store_value, volatile jlong* dest); - inline static void store_ptr(intptr_t store_value, volatile intptr_t* dest); - inline static void store_ptr(void* store_value, volatile void* dest); + inline static void store_ptr(intptr_t store_value, volatile intptr_t* dest) { + Atomic::store(store_value, dest); + } - // See comment above about using jlong atomics on 32-bit platforms - inline static jlong load(const volatile jlong* src); + inline static void store_ptr(void* store_value, volatile void* dest) { + Atomic::store(store_value, reinterpret_cast(dest)); + } + + // Atomically load from a location + // The type T must be either a pointer type, an integral/enum type, + // or a type that is primitive convertible using PrimitiveConversions. + template + inline static T load(const volatile T* dest); // Atomically add to a location. Returns updated value. add*() provide: // add-value-to-dest @@ -174,6 +175,57 @@ private: // that is needed here. template struct IsPointerConvertible; + // Dispatch handler for store. Provides type-based validity + // checking and limited conversions around calls to the platform- + // specific implementation layer provided by PlatformOp. + template + struct StoreImpl; + + // Platform-specific implementation of store. Support for sizes + // of 1, 2, 4, and (if different) pointer size bytes are required. + // The class is a function object that must be default constructable, + // with these requirements: + // + // either: + // - dest is of type D*, an integral, enum or pointer type. + // - new_value are of type T, an integral, enum or pointer type D or + // pointer type convertible to D. + // or: + // - T and D are the same and are primitive convertible using PrimitiveConversions + // and either way: + // - platform_store is an object of type PlatformStore. + // + // Then + // platform_store(new_value, dest) + // must be a valid expression. + // + // The default implementation is a volatile store. If a platform + // requires more for e.g. 64 bit stores, a specialization is required + template struct PlatformStore; + + // Dispatch handler for load. Provides type-based validity + // checking and limited conversions around calls to the platform- + // specific implementation layer provided by PlatformOp. + template + struct LoadImpl; + + // Platform-specific implementation of load. Support for sizes of + // 1, 2, 4 bytes and (if different) pointer size bytes are required. + // The class is a function object that must be default + // constructable, with these requirements: + // + // - dest is of type T*, an integral, enum or pointer type, or + // T is convertible to a primitive type using PrimitiveConversions + // - platform_load is an object of type PlatformLoad. + // + // Then + // platform_load(src) + // must be a valid expression, returning a result convertible to T. + // + // The default implementation is a volatile load. If a platform + // requires more for e.g. 64 bit loads, a specialization is required + template struct PlatformLoad; + // Dispatch handler for add. Provides type-based validity checking // and limited conversions around calls to the platform-specific // implementation layer provided by PlatformAdd. @@ -344,6 +396,131 @@ struct Atomic::IsPointerConvertible : AllStatic { static const bool value = (sizeof(yes) == sizeof(test(test_value))); }; +// Handle load for pointer, integral and enum types. +template +struct Atomic::LoadImpl< + T, + PlatformOp, + typename EnableIf::value || IsRegisteredEnum::value || IsPointer::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + T operator()(T const volatile* dest) const { + // Forward to the platform handler for the size of T. + return PlatformOp()(dest); + } +}; + +// Handle load for types that have a translator. +// +// All the involved types must be identical. +// +// This translates the original call into a call on the decayed +// arguments, and returns the recovered result of that translated +// call. +template +struct Atomic::LoadImpl< + T, + PlatformOp, + typename EnableIf::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + T operator()(T const volatile* dest) const { + typedef PrimitiveConversions::Translate Translator; + typedef typename Translator::Decayed Decayed; + STATIC_ASSERT(sizeof(T) == sizeof(Decayed)); + Decayed result = PlatformOp()(reinterpret_cast(dest)); + return Translator::recover(result); + } +}; + +// Default implementation of atomic load if a specific platform +// does not provide a specialization for a certain size class. +// For increased safety, the default implementation only allows +// load types that are pointer sized or smaller. If a platform still +// supports wide atomics, then it has to use specialization +// of Atomic::PlatformLoad for that wider size class. +template +struct Atomic::PlatformLoad VALUE_OBJ_CLASS_SPEC { + template + T operator()(T const volatile* dest) const { + STATIC_ASSERT(sizeof(T) <= sizeof(void*)); // wide atomics need specialization + return *dest; + } +}; + +// Handle store for integral and enum types. +// +// All the involved types must be identical. +template +struct Atomic::StoreImpl< + T, T, + PlatformOp, + typename EnableIf::value || IsRegisteredEnum::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + void operator()(T new_value, T volatile* dest) const { + // Forward to the platform handler for the size of T. + PlatformOp()(new_value, dest); + } +}; + +// Handle store for pointer types. +// +// The new_value must be implicitly convertible to the +// destination's type; it must be type-correct to store the +// new_value in the destination. +template +struct Atomic::StoreImpl< + T*, D*, + PlatformOp, + typename EnableIf::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + void operator()(T* new_value, D* volatile* dest) const { + // Allow derived to base conversion, and adding cv-qualifiers. + D* value = new_value; + PlatformOp()(value, dest); + } +}; + +// Handle store for types that have a translator. +// +// All the involved types must be identical. +// +// This translates the original call into a call on the decayed +// arguments. +template +struct Atomic::StoreImpl< + T, T, + PlatformOp, + typename EnableIf::value>::type> + VALUE_OBJ_CLASS_SPEC +{ + void operator()(T new_value, T volatile* dest) const { + typedef PrimitiveConversions::Translate Translator; + typedef typename Translator::Decayed Decayed; + STATIC_ASSERT(sizeof(T) == sizeof(Decayed)); + PlatformOp()(Translator::decay(new_value), + reinterpret_cast(dest)); + } +}; + +// Default implementation of atomic store if a specific platform +// does not provide a specialization for a certain size class. +// For increased safety, the default implementation only allows +// storing types that are pointer sized or smaller. If a platform still +// supports wide atomics, then it has to use specialization +// of Atomic::PlatformStore for that wider size class. +template +struct Atomic::PlatformStore VALUE_OBJ_CLASS_SPEC { + template + void operator()(T new_value, + T volatile* dest) const { + STATIC_ASSERT(sizeof(T) <= sizeof(void*)); // wide atomics need specialization + (void)const_cast(*dest = new_value); + } +}; + // Define FetchAndAdd and AddAndFetch helper classes before including // platform file, which may use these as base classes, requiring they // be complete. @@ -424,6 +601,16 @@ struct Atomic::PlatformXchg VALUE_OBJ_CLASS_SPEC { #error size_t is not WORD_SIZE, interesting platform, but missing implementation here #endif +template +inline T Atomic::load(const volatile T* dest) { + return LoadImpl >()(dest); +} + +template +inline void Atomic::store(T store_value, volatile D* dest) { + StoreImpl >()(store_value, dest); +} + template inline D Atomic::add(I add_value, D volatile* dest) { return AddImpl()(add_value, dest); From 36dec9793d9eb67ea25197a2c07149b8f23859d3 Mon Sep 17 00:00:00 2001 From: Michihiro Horie Date: Thu, 5 Oct 2017 12:56:42 +0200 Subject: [PATCH 54/80] 8188802: PPC64: Failure on assert(lrgmask.is_aligned_sets(RegMask::SlotsPerVecX)) Reviewed-by: mdoerr --- src/hotspot/cpu/ppc/globals_ppc.hpp | 3 +++ src/hotspot/cpu/ppc/ppc.ad | 33 +++++++++++------------ src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp | 6 +---- src/hotspot/cpu/ppc/vm_version_ppc.cpp | 15 ++++++++--- 4 files changed, 30 insertions(+), 27 deletions(-) diff --git a/src/hotspot/cpu/ppc/globals_ppc.hpp b/src/hotspot/cpu/ppc/globals_ppc.hpp index 56232e2ae30..b6d04455c84 100644 --- a/src/hotspot/cpu/ppc/globals_ppc.hpp +++ b/src/hotspot/cpu/ppc/globals_ppc.hpp @@ -103,6 +103,9 @@ define_pd_global(intx, InitArrayShortSize, 9*BytesPerLong); "CPU Version: x for PowerX. Currently recognizes Power5 to " \ "Power8. Default is 0. Newer CPUs will be recognized as Power8.") \ \ + product(bool, SuperwordUseVSX, false, \ + "Use Power8 VSX instructions for superword optimization.") \ + \ /* Reoptimize code-sequences of calls at runtime, e.g. replace an */ \ /* indirect call by a direct call. */ \ product(bool, ReoptimizeCallSequences, true, \ diff --git a/src/hotspot/cpu/ppc/ppc.ad b/src/hotspot/cpu/ppc/ppc.ad index 477aedf496f..789c91f2005 100644 --- a/src/hotspot/cpu/ppc/ppc.ad +++ b/src/hotspot/cpu/ppc/ppc.ad @@ -452,17 +452,6 @@ alloc_class chunk2 ( ); alloc_class chunk3 ( - // special registers - // These registers are not allocated, but used for nodes generated by postalloc expand. - SR_XER, - SR_LR, - SR_CTR, - SR_VRSAVE, - SR_SPEFSCR, - SR_PPR -); - -alloc_class chunk4 ( VSR0, VSR1, VSR2, @@ -529,6 +518,17 @@ alloc_class chunk4 ( VSR63 ); +alloc_class chunk4 ( + // special registers + // These registers are not allocated, but used for nodes generated by postalloc expand. + SR_XER, + SR_LR, + SR_CTR, + SR_VRSAVE, + SR_SPEFSCR, + SR_PPR +); + //-------Architecture Description Register Classes----------------------- // Several register classes are automatically defined based upon @@ -1675,7 +1675,7 @@ static enum RC rc_class(OptoReg::Name reg) { if (reg < 64+64) return rc_float; // Between float regs & stack are the flags regs. - assert(OptoReg::is_stack(reg), "blow up if spilling flags"); + assert(OptoReg::is_stack(reg) || reg < 64+64+64, "blow up if spilling flags"); return rc_stack; } @@ -2221,7 +2221,7 @@ const bool Matcher::convL2FSupported(void) { // Vector width in bytes. const int Matcher::vector_width_in_bytes(BasicType bt) { - if (VM_Version::has_vsx()) { + if (SuperwordUseVSX) { assert(MaxVectorSize == 16, ""); return 16; } else { @@ -2232,7 +2232,7 @@ const int Matcher::vector_width_in_bytes(BasicType bt) { // Vector ideal reg. const uint Matcher::vector_ideal_reg(int size) { - if (VM_Version::has_vsx()) { + if (SuperwordUseVSX) { assert(MaxVectorSize == 16 && size == 16, ""); return Op_VecX; } else { @@ -2258,10 +2258,7 @@ const int Matcher::min_vector_size(const BasicType bt) { // PPC doesn't support misaligned vectors store/load. const bool Matcher::misaligned_vectors_ok() { - if (VM_Version::has_vsx()) - return !AlignVector; // can be changed by flag - else - return false; + return !AlignVector; // can be changed by flag } // PPC AES support not yet implemented diff --git a/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp b/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp index f68058e237e..4b879905afa 100644 --- a/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp +++ b/src/hotspot/cpu/ppc/sharedRuntime_ppc.cpp @@ -480,11 +480,7 @@ void RegisterSaver::restore_result_registers(MacroAssembler* masm, int frame_siz // Is vector's size (in bytes) bigger than a size saved by default? bool SharedRuntime::is_wide_vector(int size) { // Note, MaxVectorSize == 8/16 on PPC64. - if (VM_Version::has_vsx()) { - assert(size <= 16, "%d bytes vectors are not supported", size); - } else { - assert(size <= 8, "%d bytes vectors are not supported", size); - } + assert(size <= (SuperwordUseVSX ? 16 : 8), "%d bytes vectors are not supported", size); return size > 8; } diff --git a/src/hotspot/cpu/ppc/vm_version_ppc.cpp b/src/hotspot/cpu/ppc/vm_version_ppc.cpp index 0bb6aeab787..6791e0e9040 100644 --- a/src/hotspot/cpu/ppc/vm_version_ppc.cpp +++ b/src/hotspot/cpu/ppc/vm_version_ppc.cpp @@ -107,10 +107,17 @@ void VM_Version::initialize() { // TODO: PPC port PdScheduling::power6SectorSize = 0x20; } - if (VM_Version::has_vsx()) - MaxVectorSize = 16; - else - MaxVectorSize = 8; + if (PowerArchitecturePPC64 >= 8) { + if (FLAG_IS_DEFAULT(SuperwordUseVSX)) { + FLAG_SET_ERGO(bool, SuperwordUseVSX, true); + } + } else { + if (SuperwordUseVSX) { + warning("SuperwordUseVSX specified, but needs at least Power8."); + FLAG_SET_DEFAULT(SuperwordUseVSX, false); + } + } + MaxVectorSize = SuperwordUseVSX ? 16 : 8; #endif // Create and print feature-string. From 0c224245ce1d474bdedc9fc3572feddf80788f60 Mon Sep 17 00:00:00 2001 From: Vladimir Kozlov Date: Fri, 6 Oct 2017 10:39:09 -0700 Subject: [PATCH 55/80] 8188775: Module jdk.internal.vm.compiler.management has not been granted accessClassInPackage.org.graalvm.compiler.hotspot Add missed changes in default.policy for new module Reviewed-by: mchung --- src/java.base/share/lib/security/default.policy | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/java.base/share/lib/security/default.policy b/src/java.base/share/lib/security/default.policy index a68dfa1cdeb..c5d6fd9bf9b 100644 --- a/src/java.base/share/lib/security/default.policy +++ b/src/java.base/share/lib/security/default.policy @@ -154,6 +154,10 @@ grant codeBase "jrt:/jdk.internal.vm.compiler" { permission java.security.AllPermission; }; +grant codeBase "jrt:/jdk.internal.vm.compiler.management" { + permission java.security.AllPermission; +}; + grant codeBase "jrt:/jdk.jsobject" { permission java.security.AllPermission; }; From fd85805dc03405cd1f0abfb19000f9dd73404906 Mon Sep 17 00:00:00 2001 From: Coleen Phillimore Date: Fri, 6 Oct 2017 14:30:04 -0400 Subject: [PATCH 56/80] 8178870: instrumentation.retransformClasses cause coredump Don't double-free cached class bytes on redefinition loading failure. Reviewed-by: sspitsyn, jiangli --- make/test/JtregNativeHotspot.gmk | 2 + .../share/prims/jvmtiRedefineClasses.cpp | 11 +- .../RedefineTests/RedefineDoubleDelete.java | 88 ++++++++++ .../RedefineTests/libRedefineDoubleDelete.c | 164 ++++++++++++++++++ 4 files changed, 262 insertions(+), 3 deletions(-) create mode 100644 test/hotspot/jtreg/runtime/RedefineTests/RedefineDoubleDelete.java create mode 100644 test/hotspot/jtreg/runtime/RedefineTests/libRedefineDoubleDelete.c diff --git a/make/test/JtregNativeHotspot.gmk b/make/test/JtregNativeHotspot.gmk index 8079292213c..ff676ada67d 100644 --- a/make/test/JtregNativeHotspot.gmk +++ b/make/test/JtregNativeHotspot.gmk @@ -59,6 +59,7 @@ BUILD_HOTSPOT_JTREG_NATIVE_SRC += \ $(TOPDIR)/test/hotspot/jtreg/runtime/SameObject \ $(TOPDIR)/test/hotspot/jtreg/runtime/BoolReturn \ $(TOPDIR)/test/hotspot/jtreg/runtime/noClassDefFoundMsg \ + $(TOPDIR)/test/hotspot/jtreg/runtime/RedefineTests \ $(TOPDIR)/test/hotspot/jtreg/compiler/floatingpoint/ \ $(TOPDIR)/test/hotspot/jtreg/compiler/calls \ $(TOPDIR)/test/hotspot/jtreg/serviceability/jvmti/GetOwnedMonitorInfo \ @@ -103,6 +104,7 @@ ifeq ($(TOOLCHAIN_TYPE), solstudio) BUILD_HOTSPOT_JTREG_LIBRARIES_LIBS_libMAAClassLoadPrepare := -lc BUILD_HOTSPOT_JTREG_LIBRARIES_LIBS_libMAAThreadStart := -lc BUILD_HOTSPOT_JTREG_LIBRARIES_LIBS_libAllowedFunctions := -lc + BUILD_HOTSPOT_JTREG_LIBRARIES_LIBS_libRedefineDoubleDelete := -lc endif ifeq ($(OPENJDK_TARGET_OS), linux) diff --git a/src/hotspot/share/prims/jvmtiRedefineClasses.cpp b/src/hotspot/share/prims/jvmtiRedefineClasses.cpp index 336ac07b644..c73842e0500 100644 --- a/src/hotspot/share/prims/jvmtiRedefineClasses.cpp +++ b/src/hotspot/share/prims/jvmtiRedefineClasses.cpp @@ -158,6 +158,11 @@ bool VM_RedefineClasses::doit_prologue() { ClassLoaderData* cld = _scratch_classes[i]->class_loader_data(); // Free the memory for this class at class unloading time. Not before // because CMS might think this is still live. + InstanceKlass* ik = get_ik(_class_defs[i].klass); + if (ik->get_cached_class_file() == _scratch_classes[i]->get_cached_class_file()) { + // Don't double-free cached_class_file copied from the original class if error. + _scratch_classes[i]->set_cached_class_file(NULL); + } cld->add_to_deallocate_list(InstanceKlass::cast(_scratch_classes[i])); } } @@ -3946,12 +3951,12 @@ void VM_RedefineClasses::redefine_single_class(jclass the_jclass, // with them was cached on the scratch class, move to the_class. // Note: we still want to do this if nothing needed caching since it // should get cleared in the_class too. - if (the_class->get_cached_class_file_bytes() == 0) { + if (the_class->get_cached_class_file() == 0) { // the_class doesn't have a cache yet so copy it the_class->set_cached_class_file(scratch_class->get_cached_class_file()); } - else if (scratch_class->get_cached_class_file_bytes() != - the_class->get_cached_class_file_bytes()) { + else if (scratch_class->get_cached_class_file() != + the_class->get_cached_class_file()) { // The same class can be present twice in the scratch classes list or there // are multiple concurrent RetransformClasses calls on different threads. // In such cases we have to deallocate scratch_class cached_class_file. diff --git a/test/hotspot/jtreg/runtime/RedefineTests/RedefineDoubleDelete.java b/test/hotspot/jtreg/runtime/RedefineTests/RedefineDoubleDelete.java new file mode 100644 index 00000000000..a158771d63b --- /dev/null +++ b/test/hotspot/jtreg/runtime/RedefineTests/RedefineDoubleDelete.java @@ -0,0 +1,88 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +/* + * @test + * @bug 8178870 + * @summary Redefine class with CFLH twice to test deleting the cached_class_file + * @library /test/lib + * @modules java.base/jdk.internal.misc + * @modules java.compiler + * java.instrument + * jdk.jartool/sun.tools.jar + * @run main RedefineClassHelper + * @run main/othervm/native -Xlog:redefine+class+load+exceptions -agentlib:RedefineDoubleDelete -javaagent:redefineagent.jar RedefineDoubleDelete + */ + +public class RedefineDoubleDelete { + + // Class gets a redefinition error because it adds a data member + public static String newB = + "class RedefineDoubleDelete$B {" + + " int count1 = 0;" + + "}"; + + public static String newerB = + "class RedefineDoubleDelete$B { " + + " int faa() { System.out.println(\"baa\"); return 2; }" + + "}"; + + // The ClassFileLoadHook for this class turns foo into faa and prints out faa. + static class B { + int faa() { System.out.println("foo"); return 1; } + } + + public static void main(String args[]) throws Exception { + + B b = new B(); + int val = b.faa(); + if (val != 1) { + throw new RuntimeException("return value wrong " + val); + } + + // Redefine B twice to get cached_class_file in both B scratch classes + try { + RedefineClassHelper.redefineClass(B.class, newB); + } catch (java.lang.UnsupportedOperationException e) { + // this is expected + } + try { + RedefineClassHelper.redefineClass(B.class, newB); + } catch (java.lang.UnsupportedOperationException e) { + // this is expected + } + + // Do a full GC. + System.gc(); + + // Redefine with a compatible class + RedefineClassHelper.redefineClass(B.class, newerB); + val = b.faa(); + if (val != 2) { + throw new RuntimeException("return value wrong " + val); + } + + // Do another full GC to clean things up. + System.gc(); + } +} diff --git a/test/hotspot/jtreg/runtime/RedefineTests/libRedefineDoubleDelete.c b/test/hotspot/jtreg/runtime/RedefineTests/libRedefineDoubleDelete.c new file mode 100644 index 00000000000..b5d0dc0afe6 --- /dev/null +++ b/test/hotspot/jtreg/runtime/RedefineTests/libRedefineDoubleDelete.c @@ -0,0 +1,164 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +#include +#include +#include "jvmti.h" + +#ifdef __cplusplus +extern "C" { +#endif + +#ifndef JNI_ENV_ARG + +#ifdef __cplusplus +#define JNI_ENV_ARG(x, y) y +#define JNI_ENV_PTR(x) x +#else +#define JNI_ENV_ARG(x,y) x, y +#define JNI_ENV_PTR(x) (*x) +#endif + +#endif + +#define TranslateError(err) "JVMTI error" + +static jvmtiEnv *jvmti = NULL; + +static jint Agent_Initialize(JavaVM *jvm, char *options, void *reserved); + +JNIEXPORT +jint JNICALL Agent_OnLoad(JavaVM *jvm, char *options, void *reserved) { + return Agent_Initialize(jvm, options, reserved); +} + +JNIEXPORT +jint JNICALL Agent_OnAttach(JavaVM *jvm, char *options, void *reserved) { + return Agent_Initialize(jvm, options, reserved); +} + +JNIEXPORT +jint JNICALL JNI_OnLoad(JavaVM *jvm, void *reserved) { + return JNI_VERSION_9; +} + + +static jint newClassDataLen = 0; +static unsigned char* newClassData = NULL; + +static jint +getBytecodes(jvmtiEnv *jvmti_env, + jint class_data_len, const unsigned char* class_data) { + int i; + jint res; + + newClassDataLen = class_data_len; + res = (*jvmti_env)->Allocate(jvmti_env, newClassDataLen, &newClassData); + if (res != JNI_OK) { + printf(" Unable to allocate bytes\n"); + return JNI_ERR; + } + for (i = 0; i < newClassDataLen; i++) { + newClassData[i] = class_data[i]; + // Rewrite oo in class to aa + if (i > 0 && class_data[i] == 'o' && class_data[i-1] == 'o') { + newClassData[i] = newClassData[i-1] = 'a'; + } + } + printf(" ... copied bytecode: %d bytes\n", (int)newClassDataLen); + return JNI_OK; +} + + +static void JNICALL +Callback_ClassFileLoadHook(jvmtiEnv *jvmti_env, JNIEnv *env, + jclass class_being_redefined, + jobject loader, const char* name, jobject protection_domain, + jint class_data_len, const unsigned char* class_data, + jint *new_class_data_len, unsigned char** new_class_data) { + if (name != NULL && strcmp(name, "RedefineDoubleDelete$B") == 0) { + if (newClassData == NULL) { + jint res = getBytecodes(jvmti_env, class_data_len, class_data); + if (res == JNI_ERR) { + printf(">>> ClassFileLoadHook event: class name %s FAILED\n", name); + return; + } + // Only change for first CFLH event. + *new_class_data_len = newClassDataLen; + *new_class_data = newClassData; + } + printf(">>> ClassFileLoadHook event: class name %s\n", name); + } +} + +static +jint Agent_Initialize(JavaVM *jvm, char *options, void *reserved) { + jint res, size; + jvmtiCapabilities caps; + jvmtiEventCallbacks callbacks; + jvmtiError err; + + res = JNI_ENV_PTR(jvm)->GetEnv(JNI_ENV_ARG(jvm, (void **) &jvmti), + JVMTI_VERSION_9); + if (res != JNI_OK || jvmti == NULL) { + printf(" Error: wrong result of a valid call to GetEnv!\n"); + return JNI_ERR; + } + + printf("Enabling following capabilities: can_generate_all_class_hook_events, " + "can_retransform_classes, can_redefine_classes"); + memset(&caps, 0, sizeof(caps)); + caps.can_generate_all_class_hook_events = 1; + caps.can_retransform_classes = 1; + caps.can_redefine_classes = 1; + printf("\n"); + + err = (*jvmti)->AddCapabilities(jvmti, &caps); + if (err != JVMTI_ERROR_NONE) { + printf(" Error in AddCapabilites: %s (%d)\n", TranslateError(err), err); + return JNI_ERR; + } + + size = (jint)sizeof(callbacks); + + memset(&callbacks, 0, sizeof(callbacks)); + callbacks.ClassFileLoadHook = Callback_ClassFileLoadHook; + + err = (*jvmti)->SetEventCallbacks(jvmti, &callbacks, size); + if (err != JVMTI_ERROR_NONE) { + printf(" Error in SetEventCallbacks: %s (%d)\n", TranslateError(err), err); + return JNI_ERR; + } + + err = (*jvmti)->SetEventNotificationMode(jvmti, JVMTI_ENABLE, JVMTI_EVENT_CLASS_FILE_LOAD_HOOK, NULL); + if (err != JVMTI_ERROR_NONE) { + printf(" Error in SetEventNotificationMode: %s (%d)\n", TranslateError(err), err); + return JNI_ERR; + } + + return JNI_OK; +} + +#ifdef __cplusplus +} +#endif From e24a5bc2ff4af559f21b5b17a826b47d4d5a5cba Mon Sep 17 00:00:00 2001 From: Vladimir Kozlov Date: Fri, 6 Oct 2017 13:00:18 -0700 Subject: [PATCH 57/80] 8188776: jdk.internal.vm.ci can't export package to upgradeable modules Added missing exception in JdkQualifiedExportTest.java test Reviewed-by: mchung --- test/jdk/jdk/modules/etc/JdkQualifiedExportTest.java | 1 + 1 file changed, 1 insertion(+) diff --git a/test/jdk/jdk/modules/etc/JdkQualifiedExportTest.java b/test/jdk/jdk/modules/etc/JdkQualifiedExportTest.java index dcc6579f618..626602bf5ae 100644 --- a/test/jdk/jdk/modules/etc/JdkQualifiedExportTest.java +++ b/test/jdk/jdk/modules/etc/JdkQualifiedExportTest.java @@ -70,6 +70,7 @@ public class JdkQualifiedExportTest { static Set KNOWN_EXCEPTIONS = Set.of("jdk.internal.vm.ci/jdk.vm.ci.services", + "jdk.internal.vm.ci/jdk.vm.ci.runtime", "jdk.jsobject/jdk.internal.netscape.javascript.spi"); static void checkExports(ModuleDescriptor md) { From 3ccd60110d752e4d0bb2ab7fdd396494aa5318ed Mon Sep 17 00:00:00 2001 From: Jiangli Zhou Date: Fri, 6 Oct 2017 19:33:27 -0400 Subject: [PATCH 58/80] 8174986: CDS archived java heap region may not compatible with AOT Always uses LogKlassAlignmentInBytes for narrow_klass_shift when CDS is enabled. Reviewed-by: iklam, ccheung --- src/hotspot/share/memory/filemap.cpp | 12 ++++ src/hotspot/share/memory/filemap.hpp | 12 ++-- src/hotspot/share/memory/metaspace.cpp | 57 +++++++------------ src/hotspot/share/memory/metaspace.hpp | 6 +- src/hotspot/share/memory/metaspaceShared.cpp | 58 +++++++++++++++----- src/hotspot/share/memory/metaspaceShared.hpp | 3 +- 6 files changed, 89 insertions(+), 59 deletions(-) diff --git a/src/hotspot/share/memory/filemap.cpp b/src/hotspot/share/memory/filemap.cpp index e45401f01d8..e4127d05b4e 100644 --- a/src/hotspot/share/memory/filemap.cpp +++ b/src/hotspot/share/memory/filemap.cpp @@ -182,6 +182,7 @@ void FileMapInfo::FileMapHeader::populate(FileMapInfo* mapinfo, size_t alignment _obj_alignment = ObjectAlignmentInBytes; _compact_strings = CompactStrings; _narrow_oop_mode = Universe::narrow_oop_mode(); + _narrow_oop_base = Universe::narrow_oop_base(); _narrow_oop_shift = Universe::narrow_oop_shift(); _max_heap_size = MaxHeapSize; _narrow_klass_base = Universe::narrow_klass_base(); @@ -687,8 +688,14 @@ static int num_open_archive_heap_ranges = 0; // open archive objects. void FileMapInfo::map_heap_regions() { if (MetaspaceShared::is_heap_object_archiving_allowed()) { + log_info(cds)("Archived narrow_oop_mode = %d, narrow_oop_base = " PTR_FORMAT ", narrow_oop_shift = %d", + narrow_oop_mode(), p2i(narrow_oop_base()), narrow_oop_shift()); + log_info(cds)("Archived narrow_klass_base = " PTR_FORMAT ", narrow_klass_shift = %d", + p2i(narrow_klass_base()), narrow_klass_shift()); + // Check that all the narrow oop and klass encodings match the archive if (narrow_oop_mode() != Universe::narrow_oop_mode() || + narrow_oop_base() != Universe::narrow_oop_base() || narrow_oop_shift() != Universe::narrow_oop_shift() || narrow_klass_base() != Universe::narrow_klass_base() || narrow_klass_shift() != Universe::narrow_klass_shift()) { @@ -697,6 +704,11 @@ void FileMapInfo::map_heap_regions() { "The current CompressedOops/CompressedClassPointers encoding differs from " "that archived due to heap size change. The archive was dumped using max heap " "size " UINTX_FORMAT "M.", max_heap_size()/M); + log_info(cds)("Current narrow_oop_mode = %d, narrow_oop_base = " PTR_FORMAT ", narrow_oop_shift = %d", + Universe::narrow_oop_mode(), p2i(Universe::narrow_oop_base()), + Universe::narrow_oop_shift()); + log_info(cds)("Current narrow_klass_base = " PTR_FORMAT ", narrow_klass_shift = %d", + p2i(Universe::narrow_klass_base()), Universe::narrow_klass_shift()); } } else { // First, map string regions as closed archive heap regions. diff --git a/src/hotspot/share/memory/filemap.hpp b/src/hotspot/share/memory/filemap.hpp index f636e64b1b7..781e34e370c 100644 --- a/src/hotspot/share/memory/filemap.hpp +++ b/src/hotspot/share/memory/filemap.hpp @@ -112,6 +112,7 @@ public: int _version; // (from enum, above.) size_t _alignment; // how shared archive should be aligned int _obj_alignment; // value of ObjectAlignmentInBytes + address _narrow_oop_base; // compressed oop encoding base int _narrow_oop_shift; // compressed oop encoding shift bool _compact_strings; // value of CompactStrings uintx _max_heap_size; // java max heap size during dumping @@ -203,12 +204,13 @@ public: int version() { return _header->_version; } size_t alignment() { return _header->_alignment; } Universe::NARROW_OOP_MODE narrow_oop_mode() { return _header->_narrow_oop_mode; } - int narrow_oop_shift() { return _header->_narrow_oop_shift; } - uintx max_heap_size() { return _header->_max_heap_size; } - address narrow_klass_base() const { return _header->_narrow_klass_base; } + address narrow_oop_base() const { return _header->_narrow_oop_base; } + int narrow_oop_shift() const { return _header->_narrow_oop_shift; } + uintx max_heap_size() const { return _header->_max_heap_size; } + address narrow_klass_base() const { return _header->_narrow_klass_base; } int narrow_klass_shift() const { return _header->_narrow_klass_shift; } - struct FileMapHeader* header() { return _header; } - char* misc_data_patching_start() { return _header->_misc_data_patching_start; } + struct FileMapHeader* header() { return _header; } + char* misc_data_patching_start() { return _header->_misc_data_patching_start; } void set_misc_data_patching_start(char* p) { _header->_misc_data_patching_start = p; } char* read_only_tables_start() { return _header->_read_only_tables_start; } void set_read_only_tables_start(char* p) { _header->_read_only_tables_start = p; } diff --git a/src/hotspot/share/memory/metaspace.cpp b/src/hotspot/share/memory/metaspace.cpp index c4c306aae84..8dd4c4fec4e 100644 --- a/src/hotspot/share/memory/metaspace.cpp +++ b/src/hotspot/share/memory/metaspace.cpp @@ -3103,10 +3103,16 @@ void Metaspace::set_narrow_klass_base_and_shift(address metaspace_base, address Universe::set_narrow_klass_base(lower_base); - if ((uint64_t)(higher_address - lower_base) <= UnscaledClassSpaceMax) { + // CDS uses LogKlassAlignmentInBytes for narrow_klass_shift. See + // MetaspaceShared::initialize_dumptime_shared_and_meta_spaces() for + // how dump time narrow_klass_shift is set. Although, CDS can work + // with zero-shift mode also, to be consistent with AOT it uses + // LogKlassAlignmentInBytes for klass shift so archived java heap objects + // can be used at same time as AOT code. + if (!UseSharedSpaces + && (uint64_t)(higher_address - lower_base) <= UnscaledClassSpaceMax) { Universe::set_narrow_klass_shift(0); } else { - assert(!UseSharedSpaces, "Cannot shift with UseSharedSpaces"); Universe::set_narrow_klass_shift(LogKlassAlignmentInBytes); } AOTLoader::set_narrow_klass_shift(); @@ -3325,50 +3331,25 @@ void Metaspace::global_initialize() { #if INCLUDE_CDS if (DumpSharedSpaces) { - MetaspaceShared::initialize_shared_rs(); + MetaspaceShared::initialize_dumptime_shared_and_meta_spaces(); } else if (UseSharedSpaces) { - // If using shared space, open the file that contains the shared space - // and map in the memory before initializing the rest of metaspace (so - // the addresses don't conflict) - address cds_address = NULL; - FileMapInfo* mapinfo = new FileMapInfo(); - - // Open the shared archive file, read and validate the header. If - // initialization fails, shared spaces [UseSharedSpaces] are - // disabled and the file is closed. - // Map in spaces now also - if (mapinfo->initialize() && MetaspaceShared::map_shared_spaces(mapinfo)) { - size_t cds_total = MetaspaceShared::core_spaces_size(); - cds_address = (address)mapinfo->header()->region_addr(0); -#ifdef _LP64 - if (using_class_space()) { - char* cds_end = (char*)(cds_address + cds_total); - cds_end = (char *)align_up(cds_end, _reserve_alignment); - // If UseCompressedClassPointers is set then allocate the metaspace area - // above the heap and above the CDS area (if it exists). - allocate_metaspace_compressed_klass_ptrs(cds_end, cds_address); - // map_heap_regions() compares the current narrow oop and klass encodings - // with the archived ones, so it must be done after all encodings are determined. - mapinfo->map_heap_regions(); - } -#endif // _LP64 - } else { - assert(!mapinfo->is_open() && !UseSharedSpaces, - "archive file not closed or shared spaces not disabled."); - } + // If any of the archived space fails to map, UseSharedSpaces + // is reset to false. Fall through to the + // (!DumpSharedSpaces && !UseSharedSpaces) case to set up class + // metaspace. + MetaspaceShared::initialize_runtime_shared_and_meta_spaces(); } -#endif // INCLUDE_CDS + if (!DumpSharedSpaces && !UseSharedSpaces) +#endif // INCLUDE_CDS + { #ifdef _LP64 - if (!UseSharedSpaces && using_class_space()) { - if (DumpSharedSpaces) { - // Already initialized inside MetaspaceShared::initialize_shared_rs() - } else { + if (using_class_space()) { char* base = (char*)align_up(Universe::heap()->reserved_region().end(), _reserve_alignment); allocate_metaspace_compressed_klass_ptrs(base, 0); } - } #endif // _LP64 + } // Initialize these before initializing the VirtualSpaceList _first_chunk_word_size = InitialBootClassLoaderMetaspaceSize / BytesPerWord; diff --git a/src/hotspot/share/memory/metaspace.hpp b/src/hotspot/share/memory/metaspace.hpp index 81ad7288676..bda5190c314 100644 --- a/src/hotspot/share/memory/metaspace.hpp +++ b/src/hotspot/share/memory/metaspace.hpp @@ -179,6 +179,10 @@ class Metaspace : public CHeapObj { assert(DumpSharedSpaces, "sanity"); DEBUG_ONLY(_frozen = true;) } +#ifdef _LP64 + static void allocate_metaspace_compressed_klass_ptrs(char* requested_addr, address cds_base); +#endif + private: #ifdef _LP64 @@ -187,8 +191,6 @@ class Metaspace : public CHeapObj { // Returns true if can use CDS with metaspace allocated as specified address. static bool can_use_cds_with_metaspace_addr(char* metaspace_base, address cds_base); - static void allocate_metaspace_compressed_klass_ptrs(char* requested_addr, address cds_base); - static void initialize_class_space(ReservedSpace rs); #endif size_t class_chunk_size(size_t word_size); diff --git a/src/hotspot/share/memory/metaspaceShared.cpp b/src/hotspot/share/memory/metaspaceShared.cpp index 1b7df68e3bb..d7bc3548820 100644 --- a/src/hotspot/share/memory/metaspaceShared.cpp +++ b/src/hotspot/share/memory/metaspaceShared.cpp @@ -214,7 +214,42 @@ char* MetaspaceShared::read_only_space_alloc(size_t num_bytes) { return _ro_region.allocate(num_bytes); } -void MetaspaceShared::initialize_shared_rs() { +void MetaspaceShared::initialize_runtime_shared_and_meta_spaces() { + assert(UseSharedSpaces, "Must be called when UseSharedSpaces is enabled"); + + // If using shared space, open the file that contains the shared space + // and map in the memory before initializing the rest of metaspace (so + // the addresses don't conflict) + address cds_address = NULL; + FileMapInfo* mapinfo = new FileMapInfo(); + + // Open the shared archive file, read and validate the header. If + // initialization fails, shared spaces [UseSharedSpaces] are + // disabled and the file is closed. + // Map in spaces now also + if (mapinfo->initialize() && map_shared_spaces(mapinfo)) { + size_t cds_total = core_spaces_size(); + cds_address = (address)mapinfo->header()->region_addr(0); +#ifdef _LP64 + if (Metaspace::using_class_space()) { + char* cds_end = (char*)(cds_address + cds_total); + cds_end = (char *)align_up(cds_end, Metaspace::reserve_alignment()); + // If UseCompressedClassPointers is set then allocate the metaspace area + // above the heap and above the CDS area (if it exists). + Metaspace::allocate_metaspace_compressed_klass_ptrs(cds_end, cds_address); + // map_heap_regions() compares the current narrow oop and klass encodings + // with the archived ones, so it must be done after all encodings are determined. + mapinfo->map_heap_regions(); + } +#endif // _LP64 + } else { + assert(!mapinfo->is_open() && !UseSharedSpaces, + "archive file not closed or shared spaces not disabled."); + } +} + +void MetaspaceShared::initialize_dumptime_shared_and_meta_spaces() { + assert(DumpSharedSpaces, "should be called for dump time only"); const size_t reserve_alignment = Metaspace::reserve_alignment(); bool large_pages = false; // No large pages when dumping the CDS archive. char* shared_base = (char*)align_up((char*)SharedBaseAddress, reserve_alignment); @@ -223,12 +258,12 @@ void MetaspaceShared::initialize_shared_rs() { // On 64-bit VM, the heap and class space layout will be the same as if // you're running in -Xshare:on mode: // - // +-- SharedBaseAddress (default = 0x800000000) - // v - // +-..---------+----+ ... +----+----+----+----+----+---------------+ - // | Heap | ST | | MC | RW | RO | MD | OD | class space | - // +-..---------+----+ ... +----+----+----+----+----+---------------+ - // |<--MaxHeapSize->| |<-- UnscaledClassSpaceMax = 4GB ------->| + // +-- SharedBaseAddress (default = 0x800000000) + // v + // +-..---------+---------+ ... +----+----+----+----+----+---------------+ + // | Heap | Archive | | MC | RW | RO | MD | OD | class space | + // +-..---------+---------+ ... +----+----+----+----+----+---------------+ + // |<-- MaxHeapSize -->| |<-- UnscaledClassSpaceMax = 4GB ------->| // const uint64_t UnscaledClassSpaceMax = (uint64_t(max_juint) + 1); const size_t cds_total = align_down(UnscaledClassSpaceMax, reserve_alignment); @@ -268,12 +303,9 @@ void MetaspaceShared::initialize_shared_rs() { // Set up compress class pointers. Universe::set_narrow_klass_base((address)_shared_rs.base()); - if (UseAOT || cds_total > UnscaledClassSpaceMax) { - // AOT forces narrow_klass_shift=LogKlassAlignmentInBytes - Universe::set_narrow_klass_shift(LogKlassAlignmentInBytes); - } else { - Universe::set_narrow_klass_shift(0); - } + // Set narrow_klass_shift to be LogKlassAlignmentInBytes. This is consistent + // with AOT. + Universe::set_narrow_klass_shift(LogKlassAlignmentInBytes); Metaspace::initialize_class_space(tmp_class_space); tty->print_cr("narrow_klass_base = " PTR_FORMAT ", narrow_klass_shift = %d", diff --git a/src/hotspot/share/memory/metaspaceShared.hpp b/src/hotspot/share/memory/metaspaceShared.hpp index d93dea2809d..972b15261e4 100644 --- a/src/hotspot/share/memory/metaspaceShared.hpp +++ b/src/hotspot/share/memory/metaspaceShared.hpp @@ -146,7 +146,8 @@ class MetaspaceShared : AllStatic { static size_t core_spaces_size() { return _core_spaces_size; } - static void initialize_shared_rs() NOT_CDS_RETURN; + static void initialize_dumptime_shared_and_meta_spaces() NOT_CDS_RETURN; + static void initialize_runtime_shared_and_meta_spaces() NOT_CDS_RETURN; // Delta of this object from the bottom of the archive. static uintx object_delta(void* obj) { From 0d8679e1786761786f79cdc5f7a56e7b194178a7 Mon Sep 17 00:00:00 2001 From: Zhengyu Gu Date: Fri, 6 Oct 2017 22:40:31 -0400 Subject: [PATCH 59/80] 8187685: NMT: Tracking compiler memory usage of thread's resource area Bias compiler thread's resource area to mtCompiler Reviewed-by: kvn, coleenp --- src/hotspot/share/memory/resourceArea.cpp | 11 ++++++++++- src/hotspot/share/memory/resourceArea.hpp | 6 +++++- src/hotspot/share/runtime/thread.cpp | 3 +++ 3 files changed, 18 insertions(+), 2 deletions(-) diff --git a/src/hotspot/share/memory/resourceArea.cpp b/src/hotspot/share/memory/resourceArea.cpp index 767e45ec148..3995e6335db 100644 --- a/src/hotspot/share/memory/resourceArea.cpp +++ b/src/hotspot/share/memory/resourceArea.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 1997, 2010, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -27,6 +27,15 @@ #include "memory/resourceArea.hpp" #include "runtime/mutexLocker.hpp" #include "runtime/thread.inline.hpp" +#include "services/memTracker.hpp" + +void ResourceArea::bias_to(MEMFLAGS new_flags) { + if (new_flags != _flags) { + MemTracker::record_arena_free(_flags); + MemTracker::record_new_arena(new_flags); + _flags = new_flags; + } +} //------------------------------ResourceMark----------------------------------- debug_only(int ResourceArea::_warned;) // to suppress multiple warnings diff --git a/src/hotspot/share/memory/resourceArea.hpp b/src/hotspot/share/memory/resourceArea.hpp index 72dcddf0f0d..5fc13ac9243 100644 --- a/src/hotspot/share/memory/resourceArea.hpp +++ b/src/hotspot/share/memory/resourceArea.hpp @@ -70,7 +70,11 @@ public: return (char*)Amalloc(size, alloc_failmode); } - debug_only(int nesting() const { return _nesting; }); + // Bias this resource area to specific memory type + // (by default, ResourceArea is tagged as mtThread, per-thread general purpose storage) + void bias_to(MEMFLAGS flags); + + debug_only(int nesting() const { return _nesting; }) }; diff --git a/src/hotspot/share/runtime/thread.cpp b/src/hotspot/share/runtime/thread.cpp index b1e7da21c7f..9663e183340 100644 --- a/src/hotspot/share/runtime/thread.cpp +++ b/src/hotspot/share/runtime/thread.cpp @@ -3263,6 +3263,9 @@ CompilerThread::CompilerThread(CompileQueue* queue, _buffer_blob = NULL; _compiler = NULL; + // Compiler uses resource area for compilation, let's bias it to mtCompiler + resource_area()->bias_to(mtCompiler); + #ifndef PRODUCT _ideal_graph_printer = NULL; #endif From b1a725dff0d77e52b7c600adb2d38385319db7d3 Mon Sep 17 00:00:00 2001 From: Yasumasa Suenaga Date: Sat, 7 Oct 2017 22:42:35 +0900 Subject: [PATCH 60/80] 8187401: Java Stack cannot be shown on HSDB Reviewed-by: sspitsyn, jgeorge --- .../sun/jvm/hotspot/runtime/BasicType.java | 48 +++++++++++++------ .../hotspot/runtime/StackValueCollection.java | 11 ++++- .../ui/classbrowser/HTMLGenerator.java | 14 ++++-- 3 files changed, 53 insertions(+), 20 deletions(-) diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/BasicType.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/BasicType.java index 825541c0ea3..8331b5d34ca 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/BasicType.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/BasicType.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2000, 2004, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -28,20 +28,23 @@ package sun.jvm.hotspot.runtime; VM. */ public class BasicType { - public static final int tBoolean = 4; - public static final int tChar = 5; - public static final int tFloat = 6; - public static final int tDouble = 7; - public static final int tByte = 8; - public static final int tShort = 9; - public static final int tInt = 10; - public static final int tLong = 11; - public static final int tObject = 12; - public static final int tArray = 13; - public static final int tVoid = 14; - public static final int tAddress = 15; - public static final int tConflict = 16; - public static final int tIllegal = 99; + public static final int tBoolean = 4; + public static final int tChar = 5; + public static final int tFloat = 6; + public static final int tDouble = 7; + public static final int tByte = 8; + public static final int tShort = 9; + public static final int tInt = 10; + public static final int tLong = 11; + public static final int tObject = 12; + public static final int tArray = 13; + public static final int tVoid = 14; + public static final int tAddress = 15; + public static final int tNarrowOop = 16; + public static final int tMetadata = 17; + public static final int tNarrowKlass = 18; + public static final int tConflict = 19; + public static final int tIllegal = 99; public static final BasicType T_BOOLEAN = new BasicType(tBoolean); public static final BasicType T_CHAR = new BasicType(tChar); @@ -55,6 +58,9 @@ public class BasicType { public static final BasicType T_ARRAY = new BasicType(tArray); public static final BasicType T_VOID = new BasicType(tVoid); public static final BasicType T_ADDRESS = new BasicType(tAddress); + public static final BasicType T_NARROWOOP = new BasicType(tNarrowOop); + public static final BasicType T_METADATA = new BasicType(tMetadata); + public static final BasicType T_NARROWKLASS = new BasicType(tNarrowKlass); public static final BasicType T_CONFLICT = new BasicType(tConflict); public static final BasicType T_ILLEGAL = new BasicType(tIllegal); @@ -106,6 +112,18 @@ public class BasicType { return tAddress; } + public static int getTNarrowOop() { + return tNarrowOop; + } + + public static int getTMetadata() { + return tMetadata; + } + + public static int getTNarrowKlass() { + return tNarrowKlass; + } + /** For stack value type with conflicting contents */ public static int getTConflict() { return tConflict; diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/StackValueCollection.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/StackValueCollection.java index 2da587843ac..39b12e2489a 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/StackValueCollection.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/runtime/StackValueCollection.java @@ -27,6 +27,7 @@ package sun.jvm.hotspot.runtime; import java.util.*; import sun.jvm.hotspot.debugger.*; +import sun.jvm.hotspot.types.*; public class StackValueCollection { private List list; @@ -48,7 +49,15 @@ public class StackValueCollection { public int intAt(int slot) { return (int) get(slot).getInteger(); } public long longAt(int slot) { return VM.getVM().buildLongFromIntsPD((int) get(slot).getInteger(), (int) get(slot+1).getInteger()); } - public OopHandle oopHandleAt(int slot) { return get(slot).getObject(); } + + public OopHandle oopHandleAt(int slot) { + StackValue sv = get(slot); + if (sv.getType() == BasicType.getTConflict()) { + throw new WrongTypeException("Conflict type"); + } + return sv.getObject(); + } + public float floatAt(int slot) { return Float.intBitsToFloat(intAt(slot)); } public double doubleAt(int slot) { return Double.longBitsToDouble(longAt(slot)); } } diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/ui/classbrowser/HTMLGenerator.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/ui/classbrowser/HTMLGenerator.java index 17d24d4f145..d2d639214af 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/ui/classbrowser/HTMLGenerator.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/ui/classbrowser/HTMLGenerator.java @@ -34,6 +34,7 @@ import sun.jvm.hotspot.interpreter.*; import sun.jvm.hotspot.oops.*; import sun.jvm.hotspot.runtime.*; import sun.jvm.hotspot.tools.jcore.*; +import sun.jvm.hotspot.types.*; import sun.jvm.hotspot.utilities.*; public class HTMLGenerator implements /* imports */ ClassConstants { @@ -1928,11 +1929,16 @@ public class HTMLGenerator implements /* imports */ ClassConstants { } if (!method.isStatic() && !method.isNative()) { - OopHandle oopHandle = vf.getLocals().oopHandleAt(0); + try { + OopHandle oopHandle = vf.getLocals().oopHandleAt(0); - if (oopHandle != null) { - buf.append(", oop = "); - buf.append(oopHandle.toString()); + if (oopHandle != null) { + buf.append(", oop = "); + buf.append(oopHandle.toString()); + } + } catch (WrongTypeException e) { + // Do nothing. + // It might be caused by JIT'ed inline frame. } } From 72ef94f770313a341ea670ed1433ca80f3a75008 Mon Sep 17 00:00:00 2001 From: Yasumasa Suenaga Date: Sat, 7 Oct 2017 22:45:12 +0900 Subject: [PATCH 61/80] 8187403: [Unknown generation] is shown in Stack Memory on HSDB Reviewed-by: sspitsyn, jgeorge --- src/hotspot/share/gc/g1/heapRegionType.hpp | 2 + src/hotspot/share/gc/g1/vmStructs_g1.hpp | 18 +++- src/hotspot/share/runtime/vmStructs.cpp | 4 +- .../share/classes/sun/jvm/hotspot/HSDB.java | 23 ++++- .../jvm/hotspot/gc/g1/G1CollectedHeap.java | 4 +- .../jvm/hotspot/gc/g1/G1HeapRegionTable.java | 13 ++- .../sun/jvm/hotspot/gc/g1/HeapRegion.java | 42 ++++++++- .../jvm/hotspot/gc/g1/HeapRegionManager.java | 6 +- .../sun/jvm/hotspot/gc/g1/HeapRegionType.java | 92 +++++++++++++++++++ 9 files changed, 195 insertions(+), 9 deletions(-) create mode 100644 src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionType.java diff --git a/src/hotspot/share/gc/g1/heapRegionType.hpp b/src/hotspot/share/gc/g1/heapRegionType.hpp index e0829c00c8c..f6900d2070f 100644 --- a/src/hotspot/share/gc/g1/heapRegionType.hpp +++ b/src/hotspot/share/gc/g1/heapRegionType.hpp @@ -32,6 +32,8 @@ assert(is_valid((tag)), "invalid HR type: %u", (uint) (tag)) class HeapRegionType VALUE_OBJ_CLASS_SPEC { +friend class VMStructs; + private: // We encode the value of the heap region type so the generation can be // determined quickly. The tag is split into two parts: diff --git a/src/hotspot/share/gc/g1/vmStructs_g1.hpp b/src/hotspot/share/gc/g1/vmStructs_g1.hpp index 5026d6ee7ac..19f338dc20c 100644 --- a/src/hotspot/share/gc/g1/vmStructs_g1.hpp +++ b/src/hotspot/share/gc/g1/vmStructs_g1.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2011, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2011, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -35,6 +35,10 @@ static_field(HeapRegion, GrainBytes, size_t) \ static_field(HeapRegion, LogOfHRGrainBytes, int) \ \ + nonstatic_field(HeapRegion, _type, HeapRegionType) \ + \ + nonstatic_field(HeapRegionType, _tag, HeapRegionType::Tag volatile) \ + \ nonstatic_field(G1ContiguousSpace, _top, HeapWord* volatile) \ \ nonstatic_field(G1HeapRegionTable, _base, address) \ @@ -67,9 +71,16 @@ #define VM_INT_CONSTANTS_G1(declare_constant, declare_constant_with_value) \ + declare_constant(HeapRegionType::FreeTag) \ + declare_constant(HeapRegionType::YoungMask) \ + declare_constant(HeapRegionType::HumongousMask) \ + declare_constant(HeapRegionType::PinnedMask) \ + declare_constant(HeapRegionType::OldMask) -#define VM_TYPES_G1(declare_type, declare_toplevel_type) \ +#define VM_TYPES_G1(declare_type, \ + declare_toplevel_type, \ + declare_integer_type) \ \ declare_toplevel_type(G1HeapRegionTable) \ \ @@ -81,9 +92,12 @@ declare_toplevel_type(HeapRegionSetBase) \ declare_toplevel_type(G1MonitoringSupport) \ declare_toplevel_type(PtrQueue) \ + declare_toplevel_type(HeapRegionType) \ \ declare_toplevel_type(G1CollectedHeap*) \ declare_toplevel_type(HeapRegion*) \ declare_toplevel_type(G1MonitoringSupport*) \ + \ + declare_integer_type(HeapRegionType::Tag volatile) #endif // SHARE_VM_GC_G1_VMSTRUCTS_G1_HPP diff --git a/src/hotspot/share/runtime/vmStructs.cpp b/src/hotspot/share/runtime/vmStructs.cpp index 93e9abf209b..47049345b87 100644 --- a/src/hotspot/share/runtime/vmStructs.cpp +++ b/src/hotspot/share/runtime/vmStructs.cpp @@ -3013,7 +3013,8 @@ VMTypeEntry VMStructs::localHotSpotVMTypes[] = { VM_TYPES_PARNEW(GENERATE_VM_TYPE_ENTRY) VM_TYPES_G1(GENERATE_VM_TYPE_ENTRY, - GENERATE_TOPLEVEL_VM_TYPE_ENTRY) + GENERATE_TOPLEVEL_VM_TYPE_ENTRY, + GENERATE_INTEGER_VM_TYPE_ENTRY) #endif // INCLUDE_ALL_GCS #if INCLUDE_TRACE @@ -3211,6 +3212,7 @@ VMStructs::init() { VM_TYPES_PARNEW(CHECK_VM_TYPE_ENTRY) VM_TYPES_G1(CHECK_VM_TYPE_ENTRY, + CHECK_SINGLE_ARG_VM_TYPE_NO_OP, CHECK_SINGLE_ARG_VM_TYPE_NO_OP); #endif // INCLUDE_ALL_GCS diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/HSDB.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/HSDB.java index 4a7094463d7..6d5720b63a6 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/HSDB.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/HSDB.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2000, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -35,6 +35,7 @@ import sun.jvm.hotspot.compiler.*; import sun.jvm.hotspot.debugger.*; import sun.jvm.hotspot.gc.parallel.*; import sun.jvm.hotspot.gc.shared.*; +import sun.jvm.hotspot.gc.g1.*; import sun.jvm.hotspot.interpreter.*; import sun.jvm.hotspot.memory.*; import sun.jvm.hotspot.oops.*; @@ -1078,6 +1079,26 @@ public class HSDB implements ObjectHistogramPanel.Listener, SAListener { } } + } else if (collHeap instanceof G1CollectedHeap) { + G1CollectedHeap heap = (G1CollectedHeap)collHeap; + HeapRegion region = heap.hrm().getByAddress(handle); + + if (region.isFree()) { + anno = "Free "; + bad = false; + } else if (region.isYoung()) { + anno = "Young "; + bad = false; + } else if (region.isHumongous()) { + anno = "Humongous "; + bad = false; + } else if (region.isPinned()) { + anno = "Pinned "; + bad = false; + } else if (region.isOld()) { + anno = "Old "; + bad = false; + } } else if (collHeap instanceof ParallelScavengeHeap) { ParallelScavengeHeap heap = (ParallelScavengeHeap) collHeap; if (heap.youngGen().isIn(handle)) { diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1CollectedHeap.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1CollectedHeap.java index a9e91802bba..24ebfe905d3 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1CollectedHeap.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1CollectedHeap.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2011, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2011, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -87,7 +87,7 @@ public class G1CollectedHeap extends CollectedHeap { return hrm().length(); } - private HeapRegionManager hrm() { + public HeapRegionManager hrm() { Address hrmAddr = addr.addOffsetTo(hrmFieldOffset); return (HeapRegionManager) VMObjectFactory.newObject(HeapRegionManager.class, hrmAddr); diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java index da8abd80223..331a8eb1499 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2013, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2013, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -29,6 +29,7 @@ import java.util.Observable; import java.util.Observer; import sun.jvm.hotspot.debugger.Address; +import sun.jvm.hotspot.debugger.OopHandle; import sun.jvm.hotspot.runtime.VM; import sun.jvm.hotspot.runtime.VMObject; import sun.jvm.hotspot.runtime.VMObjectFactory; @@ -36,6 +37,7 @@ import sun.jvm.hotspot.types.AddressField; import sun.jvm.hotspot.types.CIntegerField; import sun.jvm.hotspot.types.Type; import sun.jvm.hotspot.types.TypeDataBase; +import sun.jvm.hotspot.utilities.Assert; // Mirror class for G1HeapRegionTable. It's essentially an index -> HeapRegion map. @@ -132,4 +134,13 @@ public class G1HeapRegionTable extends VMObject { public G1HeapRegionTable(Address addr) { super(addr); } + + public HeapRegion getByAddress(Address addr) { + if (Assert.ASSERTS_ENABLED) { + Assert.that(addr instanceof OopHandle, "addr should be OopHandle"); + } + + long biasedIndex = addr.asLongValue() >>> shiftBy(); + return new HeapRegion(addr.addOffsetToAsOopHandle(biasedIndex * HeapRegion.getPointerSize())); + } } diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java index 61b2bb1aec5..608bab9fb30 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2011, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2011, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -29,13 +29,16 @@ import java.util.List; import java.util.Observable; import java.util.Observer; import sun.jvm.hotspot.debugger.Address; +import sun.jvm.hotspot.debugger.OopHandle; import sun.jvm.hotspot.gc.shared.CompactibleSpace; import sun.jvm.hotspot.memory.MemRegion; import sun.jvm.hotspot.runtime.VM; +import sun.jvm.hotspot.runtime.VMObjectFactory; import sun.jvm.hotspot.types.AddressField; import sun.jvm.hotspot.types.CIntegerField; import sun.jvm.hotspot.types.Type; import sun.jvm.hotspot.types.TypeDataBase; +import sun.jvm.hotspot.utilities.Assert; // Mirror class for HeapRegion. Currently we don't actually include // any of its fields but only iterate over it. @@ -44,6 +47,10 @@ public class HeapRegion extends CompactibleSpace { // static int GrainBytes; static private CIntegerField grainBytesField; static private AddressField topField; + private static long typeFieldOffset; + private static long pointerSize; + + private HeapRegionType type; static { VM.registerVMInitializedObserver(new Observer() { @@ -58,7 +65,9 @@ public class HeapRegion extends CompactibleSpace { grainBytesField = type.getCIntegerField("GrainBytes"); topField = type.getAddressField("_top"); + typeFieldOffset = type.getField("_type").getOffset(); + pointerSize = db.lookupType("HeapRegion*").getSize(); } static public long grainBytes() { @@ -67,6 +76,13 @@ public class HeapRegion extends CompactibleSpace { public HeapRegion(Address addr) { super(addr); + + if (Assert.ASSERTS_ENABLED) { + Assert.that(addr instanceof OopHandle, "addr should be OopHandle"); + } + + Address typeAddr = addr.addOffsetToAsOopHandle(typeFieldOffset); + type = (HeapRegionType)VMObjectFactory.newObject(HeapRegionType.class, typeAddr); } public Address top() { @@ -89,4 +105,28 @@ public class HeapRegion extends CompactibleSpace { public long free() { return end().minus(top()); } + + public boolean isFree() { + return type.isFree(); + } + + public boolean isYoung() { + return type.isYoung(); + } + + public boolean isHumongous() { + return type.isHumongous(); + } + + public boolean isPinned() { + return type.isPinned(); + } + + public boolean isOld() { + return type.isOld(); + } + + public static long getPointerSize() { + return pointerSize; + } } diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionManager.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionManager.java index b80c60350f4..79f32d857b9 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionManager.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionManager.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2011, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2011, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -85,4 +85,8 @@ public class HeapRegionManager extends VMObject { public HeapRegionManager(Address addr) { super(addr); } + + public HeapRegion getByAddress(Address addr) { + return regions().getByAddress(addr); + } } diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionType.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionType.java new file mode 100644 index 00000000000..cdc706d23bc --- /dev/null +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegionType.java @@ -0,0 +1,92 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + * + */ + +package sun.jvm.hotspot.gc.g1; + +import java.util.Observable; +import java.util.Observer; +import sun.jvm.hotspot.debugger.Address; +import sun.jvm.hotspot.runtime.VM; +import sun.jvm.hotspot.runtime.VMObject; +import sun.jvm.hotspot.types.CIntegerField; +import sun.jvm.hotspot.types.Type; +import sun.jvm.hotspot.types.TypeDataBase; + +// Mirror class for HeapRegionType. Currently we don't actually include +// any of its fields but only iterate over it. + +public class HeapRegionType extends VMObject { + + private static int freeTag; + private static int youngMask; + private static int humongousMask; + private static int pinnedMask; + private static int oldMask; + private static CIntegerField tagField; + private int tag; + + static { + VM.registerVMInitializedObserver(new Observer() { + public void update(Observable o, Object data) { + initialize(VM.getVM().getTypeDataBase()); + } + }); + } + + private static synchronized void initialize(TypeDataBase db) { + Type type = db.lookupType("HeapRegionType"); + + tagField = type.getCIntegerField("_tag"); + + freeTag = db.lookupIntConstant("HeapRegionType::FreeTag"); + youngMask = db.lookupIntConstant("HeapRegionType::YoungMask"); + humongousMask = db.lookupIntConstant("HeapRegionType::HumongousMask"); + pinnedMask = db.lookupIntConstant("HeapRegionType::PinnedMask"); + oldMask = db.lookupIntConstant("HeapRegionType::OldMask"); + } + + public boolean isFree() { + return tagField.getValue(addr) == freeTag; + } + + public boolean isYoung() { + return (tagField.getValue(addr) & youngMask) != 0; + } + + public boolean isHumongous() { + return (tagField.getValue(addr) & humongousMask) != 0; + } + + public boolean isPinned() { + return (tagField.getValue(addr) & pinnedMask) != 0; + } + + public boolean isOld() { + return (tagField.getValue(addr) & oldMask) != 0; + } + + public HeapRegionType(Address addr) { + super(addr); + } +} From 2d8670326d88913a5547268443278ffdcb63995b Mon Sep 17 00:00:00 2001 From: David Holmes Date: Mon, 9 Oct 2017 01:23:13 -0400 Subject: [PATCH 62/80] 8185529: JCK api/java_lang/Object/WaitTests failed with jdk10/hs nightly Reviewed-by: dcubed, ccheung --- src/hotspot/os/posix/os_posix.cpp | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/hotspot/os/posix/os_posix.cpp b/src/hotspot/os/posix/os_posix.cpp index 554238313f8..422f7fcac3c 100644 --- a/src/hotspot/os/posix/os_posix.cpp +++ b/src/hotspot/os/posix/os_posix.cpp @@ -1770,6 +1770,12 @@ int os::PlatformEvent::park(jlong millis) { if (v == 0) { // Do this the hard way by blocking ... struct timespec abst; + // We have to watch for overflow when converting millis to nanos, + // but if millis is that large then we will end up limiting to + // MAX_SECS anyway, so just do that here. + if (millis / MILLIUNITS > MAX_SECS) { + millis = jlong(MAX_SECS) * MILLIUNITS; + } to_abstime(&abst, millis * (NANOUNITS / MILLIUNITS), false); int ret = OS_TIMEOUT; From 75a4bdf2180ac85ae7a021a2289a1e4f35fd24cc Mon Sep 17 00:00:00 2001 From: Lutz Schmidt Date: Mon, 9 Oct 2017 11:43:42 +0200 Subject: [PATCH 63/80] 8187964: [s390][ppc]: Intrinsify Math.multiplyHigh(long, long) Reviewed-by: mdoerr --- src/hotspot/cpu/s390/assembler_s390.hpp | 17 +++++++-- .../cpu/s390/assembler_s390.inline.hpp | 3 ++ src/hotspot/cpu/s390/s390.ad | 38 ++++++++++++++++--- 3 files changed, 49 insertions(+), 9 deletions(-) diff --git a/src/hotspot/cpu/s390/assembler_s390.hpp b/src/hotspot/cpu/s390/assembler_s390.hpp index 7b431307458..a06b43ae3a8 100644 --- a/src/hotspot/cpu/s390/assembler_s390.hpp +++ b/src/hotspot/cpu/s390/assembler_s390.hpp @@ -1437,10 +1437,18 @@ class Assembler : public AbstractAssembler { // unsigned arithmetic calculation instructions // Mask bit#0 is not used by these instructions. // There is no indication of overflow for these instr. - bcondLogZero = 2, - bcondLogNotZero = 5, + bcondLogZero_NoCarry = 8, + bcondLogZero_Carry = 2, + // bcondLogZero_Borrow = 8, // This CC is never generated. + bcondLogZero_NoBorrow = 2, + bcondLogZero = bcondLogZero_Carry | bcondLogZero_NoCarry, + bcondLogNotZero_NoCarry = 4, + bcondLogNotZero_Carry = 1, bcondLogNotZero_Borrow = 4, bcondLogNotZero_NoBorrow = 1, + bcondLogNotZero = bcondLogNotZero_Carry | bcondLogNotZero_NoCarry, + bcondLogCarry = bcondLogZero_Carry | bcondLogNotZero_Carry, + bcondLogBorrow = /* bcondLogZero_Borrow | */ bcondLogNotZero_Borrow, // string search instructions bcondFound = 4, bcondNotFound = 2, @@ -2117,13 +2125,16 @@ class Assembler : public AbstractAssembler { inline void z_alsi( const Address& d, int64_t i2); // add logical *(d) += i2_imm8 ; uint32 -- z10 inline void z_algsi(const Address& d, int64_t i2); // add logical *(d) += i2_imm8 ; uint64 -- z10 - // negate + // sign adjustment inline void z_lcr( Register r1, Register r2 = noreg); // neg r1 = -r2 ; int32 inline void z_lcgr( Register r1, Register r2 = noreg); // neg r1 = -r2 ; int64 inline void z_lcgfr(Register r1, Register r2); // neg r1 = -r2 ; int64 <- int32 inline void z_lnr( Register r1, Register r2 = noreg); // neg r1 = -|r2| ; int32 inline void z_lngr( Register r1, Register r2 = noreg); // neg r1 = -|r2| ; int64 inline void z_lngfr(Register r1, Register r2); // neg r1 = -|r2| ; int64 <- int32 + inline void z_lpr( Register r1, Register r2 = noreg); // r1 = |r2| ; int32 + inline void z_lpgr( Register r1, Register r2 = noreg); // r1 = |r2| ; int64 + inline void z_lpgfr(Register r1, Register r2); // r1 = |r2| ; int64 <- int32 // subtract intstructions // sub registers diff --git a/src/hotspot/cpu/s390/assembler_s390.inline.hpp b/src/hotspot/cpu/s390/assembler_s390.inline.hpp index bfa4646a42a..eaeb9d3ea1e 100644 --- a/src/hotspot/cpu/s390/assembler_s390.inline.hpp +++ b/src/hotspot/cpu/s390/assembler_s390.inline.hpp @@ -309,6 +309,9 @@ inline void Assembler::z_lcgfr(Register r1, Register r2) { emit_32( LCGFR_ZOPC | inline void Assembler::z_lnr( Register r1, Register r2) { emit_16( LNR_ZOPC | regt( r1, 8, 16) | reg((r2 == noreg) ? r1:r2, 12, 16)); } inline void Assembler::z_lngr( Register r1, Register r2) { emit_32( LNGR_ZOPC | regt( r1, 24, 32) | reg((r2 == noreg) ? r1:r2, 28, 32)); } inline void Assembler::z_lngfr(Register r1, Register r2) { emit_32( LNGFR_ZOPC | regt( r1, 24, 32) | reg((r2 == noreg) ? r1:r2, 28, 32)); } +inline void Assembler::z_lpr( Register r1, Register r2) { emit_16( LPR_ZOPC | regt( r1, 8, 16) | reg((r2 == noreg) ? r1:r2, 12, 16)); } +inline void Assembler::z_lpgr( Register r1, Register r2) { emit_32( LPGR_ZOPC | regt( r1, 24, 32) | reg((r2 == noreg) ? r1:r2, 28, 32)); } +inline void Assembler::z_lpgfr(Register r1, Register r2) { emit_32( LPGFR_ZOPC | regt( r1, 24, 32) | reg((r2 == noreg) ? r1:r2, 28, 32)); } inline void Assembler::z_lrvr( Register r1, Register r2) { emit_32( LRVR_ZOPC | regt(r1, 24, 32) | reg(r2, 28, 32)); } inline void Assembler::z_lrvgr(Register r1, Register r2) { emit_32( LRVGR_ZOPC | regt(r1, 24, 32) | reg(r2, 28, 32)); } diff --git a/src/hotspot/cpu/s390/s390.ad b/src/hotspot/cpu/s390/s390.ad index b30437e0faf..15902d9f7aa 100644 --- a/src/hotspot/cpu/s390/s390.ad +++ b/src/hotspot/cpu/s390/s390.ad @@ -3149,7 +3149,7 @@ operand noArg_iRegI() %{ interface(REG_INTER); %} -// Revenregi and roddRegI constitute and even-odd-pair. +// revenRegI and roddRegI constitute and even-odd-pair. operand revenRegI() %{ constraint(ALLOC_IN_RC(z_rarg3_int_reg)); match(iRegI); @@ -3157,7 +3157,7 @@ operand revenRegI() %{ interface(REG_INTER); %} -// Revenregi and roddRegI constitute and even-odd-pair. +// revenRegI and roddRegI constitute and even-odd-pair. operand roddRegI() %{ constraint(ALLOC_IN_RC(z_rarg4_int_reg)); match(iRegI); @@ -3283,7 +3283,7 @@ operand memoryRegP() %{ interface(REG_INTER); %} -// Revenregp and roddRegP constitute and even-odd-pair. +// revenRegP and roddRegP constitute and even-odd-pair. operand revenRegP() %{ constraint(ALLOC_IN_RC(z_rarg3_ptr_reg)); match(iRegP); @@ -3291,7 +3291,7 @@ operand revenRegP() %{ interface(REG_INTER); %} -// Revenregl and roddRegL constitute and even-odd-pair. +// revenRegP and roddRegP constitute and even-odd-pair. operand roddRegP() %{ constraint(ALLOC_IN_RC(z_rarg4_ptr_reg)); match(iRegP); @@ -3380,7 +3380,7 @@ operand iRegL() %{ interface(REG_INTER); %} -// Revenregl and roddRegL constitute and even-odd-pair. +// revenRegL and roddRegL constitute and even-odd-pair. operand revenRegL() %{ constraint(ALLOC_IN_RC(z_rarg3_long_reg)); match(iRegL); @@ -3388,7 +3388,7 @@ operand revenRegL() %{ interface(REG_INTER); %} -// Revenregl and roddRegL constitute and even-odd-pair. +// revenRegL and roddRegL constitute and even-odd-pair. operand roddRegL() %{ constraint(ALLOC_IN_RC(z_rarg4_long_reg)); match(iRegL); @@ -6443,6 +6443,32 @@ instruct mulL_Reg_mem(iRegL dst, memory src)%{ ins_pipe(pipe_class_dummy); %} +instruct mulHiL_reg_reg(revenRegL Rdst, roddRegL Rsrc1, iRegL Rsrc2, iRegL Rtmp1, flagsReg cr)%{ + match(Set Rdst (MulHiL Rsrc1 Rsrc2)); + effect(TEMP_DEF Rdst, USE_KILL Rsrc1, TEMP Rtmp1, KILL cr); + ins_cost(7*DEFAULT_COST); + // TODO: s390 port size(VARIABLE_SIZE); + format %{ "MulHiL $Rdst, $Rsrc1, $Rsrc2\t # Multiply High Long" %} + ins_encode%{ + Register dst = $Rdst$$Register; + Register src1 = $Rsrc1$$Register; + Register src2 = $Rsrc2$$Register; + Register tmp1 = $Rtmp1$$Register; + Register tmp2 = $Rdst$$Register; + // z/Architecture has only unsigned multiply (64 * 64 -> 128). + // implementing mulhs(a,b) = mulhu(a,b) – (a & (b>>63)) – (b & (a>>63)) + __ z_srag(tmp2, src1, 63); // a>>63 + __ z_srag(tmp1, src2, 63); // b>>63 + __ z_ngr(tmp2, src2); // b & (a>>63) + __ z_ngr(tmp1, src1); // a & (b>>63) + __ z_agr(tmp1, tmp2); // ((a & (b>>63)) + (b & (a>>63))) + __ z_mlgr(dst, src2); // tricky: 128-bit product is written to even/odd pair (dst,src1), + // multiplicand is taken from oddReg (src1), multiplier in src2. + __ z_sgr(dst, tmp1); + %} + ins_pipe(pipe_class_dummy); +%} + // DIV // Integer DIVMOD with Register, both quotient and mod results From ccbba3fe489d700018c41f6df26491b5d466be6f Mon Sep 17 00:00:00 2001 From: Lutz Schmidt Date: Mon, 9 Oct 2017 11:51:20 +0200 Subject: [PATCH 64/80] 8188857: [s390]: CPU feature detection incomplete Reviewed-by: mdoerr --- src/hotspot/cpu/s390/vm_version_s390.cpp | 23 ++++++++++++++++++- src/hotspot/cpu/s390/vm_version_s390.hpp | 2 ++ .../os_cpu/linux_s390/os_linux_s390.cpp | 12 +++++++--- 3 files changed, 33 insertions(+), 4 deletions(-) diff --git a/src/hotspot/cpu/s390/vm_version_s390.cpp b/src/hotspot/cpu/s390/vm_version_s390.cpp index 709a9fdf6ed..291577c81c5 100644 --- a/src/hotspot/cpu/s390/vm_version_s390.cpp +++ b/src/hotspot/cpu/s390/vm_version_s390.cpp @@ -706,12 +706,13 @@ void VM_Version::determine_features() { Label getCPUFEATURES; // fcode = -1 (cache) Label getCIPHERFEATURES; // fcode = -2 (cipher) Label getMSGDIGESTFEATURES; // fcode = -3 (SHA) + Label getVECTORFEATURES; // fcode = -4 (OS support for vector instructions) Label checkLongDispFast; Label noLongDisp; Label posDisp, negDisp; Label errRTN; a->z_ltgfr(Z_R0, Z_ARG2); // Buf len to r0 and test. - a->z_brl(getFEATURES); // negative -> Get machine features. + a->z_brl(getFEATURES); // negative -> Get machine features not covered by facility list. a->z_brz(checkLongDispFast); // zero -> Check for high-speed Long Displacement Facility. a->z_aghi(Z_R0, -1); a->z_stfle(0, Z_ARG1); @@ -736,6 +737,8 @@ void VM_Version::determine_features() { a->z_bre(getCIPHERFEATURES); a->z_cghi(Z_R0, -3); // -3: Extract detailed crypto capabilities (msg digest instructions). a->z_bre(getMSGDIGESTFEATURES); + a->z_cghi(Z_R0, -4); // -4: Verify vector instruction availability (OS support). + a->z_bre(getVECTORFEATURES); a->z_xgr(Z_RET, Z_RET); // Not a valid function code. a->z_br(Z_R14); // Return "operation aborted". @@ -766,6 +769,11 @@ void VM_Version::determine_features() { a->z_ecag(Z_RET,Z_R0,0,Z_ARG3); // Extract information as requested by Z_ARG1 contents. a->z_br(Z_R14); + // Use a vector instruction to verify OS support. Will fail with SIGFPE if OS support is missing. + a->bind(getVECTORFEATURES); + a->z_vtm(Z_V0,Z_V0); // non-destructive vector instruction. Will cause SIGFPE if not supported. + a->z_br(Z_R14); + // Check the performance of the Long Displacement Facility, i.e. find out if we are running on z900 or newer. a->bind(checkLongDispFast); a->z_llill(Z_R0, 0xffff); // preset #iterations @@ -962,6 +970,19 @@ void VM_Version::determine_features() { _nfeatures = 0; } + if (has_VectorFacility()) { + // Verify that feature can actually be used. OS support required. + call_getFeatures(buffer, -4, 0); + if (printVerbose) { + ttyLocker ttyl; + if (has_VectorFacility()) { + tty->print_cr(" Vector Facility has been verified to be supported by OS"); + } else { + tty->print_cr(" Vector Facility has been disabled - not supported by OS"); + } + } + } + // Extract Crypto Facility details. if (has_Crypto()) { // Get cipher features. diff --git a/src/hotspot/cpu/s390/vm_version_s390.hpp b/src/hotspot/cpu/s390/vm_version_s390.hpp index 7aa66bffc39..0f5d754707b 100644 --- a/src/hotspot/cpu/s390/vm_version_s390.hpp +++ b/src/hotspot/cpu/s390/vm_version_s390.hpp @@ -473,6 +473,8 @@ class VM_Version: public Abstract_VM_Version { static void set_has_CryptoExt5() { _features[0] |= CryptoExtension5Mask; } static void set_has_VectorFacility() { _features[2] |= VectorFacilityMask; } + static void reset_has_VectorFacility() { _features[2] &= ~VectorFacilityMask; } + // Assembler testing. static void allow_all(); static void revert(); diff --git a/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp b/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp index f7ab305f709..272c3e0f46b 100644 --- a/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp +++ b/src/hotspot/os_cpu/linux_s390/os_linux_s390.cpp @@ -448,11 +448,17 @@ JVM_handle_linux_signal(int sig, } else { // thread->thread_state() != _thread_in_Java - if (sig == SIGILL && VM_Version::is_determine_features_test_running()) { - // SIGILL must be caused by VM_Version::determine_features(). + if ((sig == SIGILL) && VM_Version::is_determine_features_test_running()) { + // SIGILL must be caused by VM_Version::determine_features() + // when attempting to execute a non-existing instruction. //*(int *) (pc-6)=0; // Patch instruction to 0 to indicate that it causes a SIGILL. // Flushing of icache is not necessary. stub = pc; // Continue with next instruction. + } else if ((sig == SIGFPE) && VM_Version::is_determine_features_test_running()) { + // SIGFPE is known to be caused by trying to execute a vector instruction + // when the vector facility is installed, but operating system support is missing. + VM_Version::reset_has_VectorFacility(); + stub = pc; // Continue with next instruction. } else if (thread->thread_state() == _thread_in_vm && sig == SIGBUS && thread->doing_unsafe_access()) { // We don't really need a stub here! Just set the pending exeption and @@ -510,7 +516,7 @@ JVM_handle_linux_signal(int sig, // Note: this should be combined with the trap_pc handling above, // because it handles the same issue. if (sig == SIGILL || sig == SIGFPE) { - pc = (address) info->si_addr; + pc = (address)info->si_addr; } VMError::report_and_die(t, sig, pc, info, ucVoid); From 21ee7f4b2a275cf9f12b0aa17b41ac80f88e5075 Mon Sep 17 00:00:00 2001 From: Martin Doerr Date: Mon, 9 Oct 2017 13:56:59 +0200 Subject: [PATCH 65/80] 8188868: PPC64: Support AES intrinsics on Big Endian Reviewed-by: goetz --- src/hotspot/cpu/ppc/assembler_ppc.hpp | 1 + src/hotspot/cpu/ppc/assembler_ppc.inline.hpp | 8 + src/hotspot/cpu/ppc/stubGenerator_ppc.cpp | 371 ++++++++++--------- src/hotspot/cpu/ppc/stubRoutines_ppc.hpp | 2 +- src/hotspot/cpu/ppc/vm_version_ppc.cpp | 13 - 5 files changed, 201 insertions(+), 194 deletions(-) diff --git a/src/hotspot/cpu/ppc/assembler_ppc.hpp b/src/hotspot/cpu/ppc/assembler_ppc.hpp index 0b56f9bbe58..03be7f4bdcb 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.hpp @@ -2299,6 +2299,7 @@ class Assembler : public AbstractAssembler { // Endianess specific concatenation of 2 loaded vectors. inline void load_perm(VectorRegister perm, Register addr); inline void vec_perm(VectorRegister first_dest, VectorRegister second, VectorRegister perm); + inline void vec_perm(VectorRegister dest, VectorRegister first, VectorRegister second, VectorRegister perm); // RegisterOrConstant versions. // These emitters choose between the versions using two registers and diff --git a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp index da496abd5d7..3931b56093e 100644 --- a/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp +++ b/src/hotspot/cpu/ppc/assembler_ppc.inline.hpp @@ -1057,6 +1057,14 @@ inline void Assembler::vec_perm(VectorRegister first_dest, VectorRegister second #endif } +inline void Assembler::vec_perm(VectorRegister dest, VectorRegister first, VectorRegister second, VectorRegister perm) { +#if defined(VM_LITTLE_ENDIAN) + vperm(dest, second, first, perm); +#else + vperm(dest, first, second, perm); +#endif +} + inline void Assembler::load_const(Register d, void* x, Register tmp) { load_const(d, (long)x, tmp); } diff --git a/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp b/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp index acfae9cfcba..16cb6149f77 100644 --- a/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp +++ b/src/hotspot/cpu/ppc/stubGenerator_ppc.cpp @@ -2667,7 +2667,7 @@ class StubGenerator: public StubCodeGenerator { return start; } - // Arguments for generated stub (little endian only): + // Arguments for generated stub: // R3_ARG1 - source byte array address // R4_ARG2 - destination byte array address // R5_ARG3 - round key array @@ -2686,7 +2686,6 @@ class StubGenerator: public StubCodeGenerator { Register keylen = R8; Register temp = R9; Register keypos = R10; - Register hex = R11; Register fifteen = R12; VectorRegister vRet = VR0; @@ -2706,164 +2705,170 @@ class StubGenerator: public StubCodeGenerator { VectorRegister vTmp3 = VR11; VectorRegister vTmp4 = VR12; - VectorRegister vLow = VR13; - VectorRegister vHigh = VR14; - - __ li (hex, 16); __ li (fifteen, 15); - __ vspltisb (fSplt, 0x0f); // load unaligned from[0-15] to vsRet __ lvx (vRet, from); __ lvx (vTmp1, fifteen, from); __ lvsl (fromPerm, from); +#ifdef VM_LITTLE_ENDIAN + __ vspltisb (fSplt, 0x0f); __ vxor (fromPerm, fromPerm, fSplt); +#endif __ vperm (vRet, vRet, vTmp1, fromPerm); // load keylen (44 or 52 or 60) __ lwz (keylen, arrayOopDesc::length_offset_in_bytes() - arrayOopDesc::base_offset_in_bytes(T_INT), key); // to load keys - __ lvsr (keyPerm, key); - __ vxor (vTmp2, vTmp2, vTmp2); + __ load_perm (keyPerm, key); +#ifdef VM_LITTLE_ENDIAN __ vspltisb (vTmp2, -16); __ vrld (keyPerm, keyPerm, vTmp2); __ vrld (keyPerm, keyPerm, vTmp2); __ vsldoi (keyPerm, keyPerm, keyPerm, 8); +#endif - // load the 1st round key to vKey1 - __ li (keypos, 0); + // load the 1st round key to vTmp1 + __ lvx (vTmp1, key); + __ li (keypos, 16); __ lvx (vKey1, keypos, key); - __ addi (keypos, keypos, 16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey1, vTmp1, vKey1, keyPerm); + __ vec_perm (vTmp1, vKey1, keyPerm); // 1st round - __ vxor (vRet, vRet, vKey1); + __ vxor (vRet, vRet, vTmp1); // load the 2nd round key to vKey1 - __ addi (keypos, keypos, 16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp2, vTmp1, keyPerm); + __ li (keypos, 32); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vKey2, keyPerm); // load the 3rd round key to vKey2 - __ addi (keypos, keypos, 16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp1, vTmp2, keyPerm); + __ li (keypos, 48); + __ lvx (vKey3, keypos, key); + __ vec_perm (vKey2, vKey3, keyPerm); // load the 4th round key to vKey3 - __ addi (keypos, keypos, 16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey3, vTmp2, vTmp1, keyPerm); + __ li (keypos, 64); + __ lvx (vKey4, keypos, key); + __ vec_perm (vKey3, vKey4, keyPerm); // load the 5th round key to vKey4 - __ addi (keypos, keypos, 16); + __ li (keypos, 80); __ lvx (vTmp1, keypos, key); - __ vperm (vKey4, vTmp1, vTmp2, keyPerm); + __ vec_perm (vKey4, vTmp1, keyPerm); // 2nd - 5th rounds - __ vcipher (vRet, vRet, vKey1); - __ vcipher (vRet, vRet, vKey2); - __ vcipher (vRet, vRet, vKey3); - __ vcipher (vRet, vRet, vKey4); + __ vcipher (vRet, vRet, vKey1); + __ vcipher (vRet, vRet, vKey2); + __ vcipher (vRet, vRet, vKey3); + __ vcipher (vRet, vRet, vKey4); // load the 6th round key to vKey1 - __ addi (keypos, keypos, 16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp2, vTmp1, keyPerm); + __ li (keypos, 96); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vTmp1, vKey2, keyPerm); // load the 7th round key to vKey2 - __ addi (keypos, keypos, 16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp1, vTmp2, keyPerm); + __ li (keypos, 112); + __ lvx (vKey3, keypos, key); + __ vec_perm (vKey2, vKey3, keyPerm); // load the 8th round key to vKey3 - __ addi (keypos, keypos, 16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey3, vTmp2, vTmp1, keyPerm); + __ li (keypos, 128); + __ lvx (vKey4, keypos, key); + __ vec_perm (vKey3, vKey4, keyPerm); // load the 9th round key to vKey4 - __ addi (keypos, keypos, 16); + __ li (keypos, 144); __ lvx (vTmp1, keypos, key); - __ vperm (vKey4, vTmp1, vTmp2, keyPerm); + __ vec_perm (vKey4, vTmp1, keyPerm); // 6th - 9th rounds - __ vcipher (vRet, vRet, vKey1); - __ vcipher (vRet, vRet, vKey2); - __ vcipher (vRet, vRet, vKey3); - __ vcipher (vRet, vRet, vKey4); + __ vcipher (vRet, vRet, vKey1); + __ vcipher (vRet, vRet, vKey2); + __ vcipher (vRet, vRet, vKey3); + __ vcipher (vRet, vRet, vKey4); // load the 10th round key to vKey1 - __ addi (keypos, keypos, 16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp2, vTmp1, keyPerm); + __ li (keypos, 160); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vTmp1, vKey2, keyPerm); // load the 11th round key to vKey2 - __ addi (keypos, keypos, 16); + __ li (keypos, 176); __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp1, vTmp2, keyPerm); + __ vec_perm (vKey2, vTmp1, keyPerm); // if all round keys are loaded, skip next 4 rounds __ cmpwi (CCR0, keylen, 44); __ beq (CCR0, L_doLast); // 10th - 11th rounds - __ vcipher (vRet, vRet, vKey1); - __ vcipher (vRet, vRet, vKey2); + __ vcipher (vRet, vRet, vKey1); + __ vcipher (vRet, vRet, vKey2); // load the 12th round key to vKey1 - __ addi (keypos, keypos, 16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp2, vTmp1, keyPerm); + __ li (keypos, 192); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vTmp1, vKey2, keyPerm); // load the 13th round key to vKey2 - __ addi (keypos, keypos, 16); + __ li (keypos, 208); __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp1, vTmp2, keyPerm); + __ vec_perm (vKey2, vTmp1, keyPerm); // if all round keys are loaded, skip next 2 rounds __ cmpwi (CCR0, keylen, 52); __ beq (CCR0, L_doLast); // 12th - 13th rounds - __ vcipher (vRet, vRet, vKey1); - __ vcipher (vRet, vRet, vKey2); + __ vcipher (vRet, vRet, vKey1); + __ vcipher (vRet, vRet, vKey2); // load the 14th round key to vKey1 - __ addi (keypos, keypos, 16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp2, vTmp1, keyPerm); + __ li (keypos, 224); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vTmp1, vKey2, keyPerm); // load the 15th round key to vKey2 - __ addi (keypos, keypos, 16); + __ li (keypos, 240); __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp1, vTmp2, keyPerm); + __ vec_perm (vKey2, vTmp1, keyPerm); __ bind(L_doLast); // last two rounds - __ vcipher (vRet, vRet, vKey1); - __ vcipherlast (vRet, vRet, vKey2); + __ vcipher (vRet, vRet, vKey1); + __ vcipherlast (vRet, vRet, vKey2); - __ neg (temp, to); - __ lvsr (toPerm, temp); - __ vspltisb (vTmp2, -1); - __ vxor (vTmp1, vTmp1, vTmp1); - __ vperm (vTmp2, vTmp2, vTmp1, toPerm); - __ vxor (toPerm, toPerm, fSplt); + // store result (unaligned) +#ifdef VM_LITTLE_ENDIAN + __ lvsl (toPerm, to); +#else + __ lvsr (toPerm, to); +#endif + __ vspltisb (vTmp3, -1); + __ vspltisb (vTmp4, 0); __ lvx (vTmp1, to); - __ vperm (vRet, vRet, vRet, toPerm); - __ vsel (vTmp1, vTmp1, vRet, vTmp2); - __ lvx (vTmp4, fifteen, to); + __ lvx (vTmp2, fifteen, to); +#ifdef VM_LITTLE_ENDIAN + __ vperm (vTmp3, vTmp3, vTmp4, toPerm); // generate select mask + __ vxor (toPerm, toPerm, fSplt); // swap bytes +#else + __ vperm (vTmp3, vTmp4, vTmp3, toPerm); // generate select mask +#endif + __ vperm (vTmp4, vRet, vRet, toPerm); // rotate data + __ vsel (vTmp2, vTmp4, vTmp2, vTmp3); + __ vsel (vTmp1, vTmp1, vTmp4, vTmp3); + __ stvx (vTmp2, fifteen, to); // store this one first (may alias) __ stvx (vTmp1, to); - __ vsel (vRet, vRet, vTmp4, vTmp2); - __ stvx (vRet, fifteen, to); __ blr(); return start; } - // Arguments for generated stub (little endian only): + // Arguments for generated stub: // R3_ARG1 - source byte array address // R4_ARG2 - destination byte array address // R5_ARG3 - K (key) in little endian int array @@ -2885,7 +2890,6 @@ class StubGenerator: public StubCodeGenerator { Register keylen = R8; Register temp = R9; Register keypos = R10; - Register hex = R11; Register fifteen = R12; VectorRegister vRet = VR0; @@ -2906,30 +2910,30 @@ class StubGenerator: public StubCodeGenerator { VectorRegister vTmp3 = VR12; VectorRegister vTmp4 = VR13; - VectorRegister vLow = VR14; - VectorRegister vHigh = VR15; - - __ li (hex, 16); __ li (fifteen, 15); - __ vspltisb (fSplt, 0x0f); // load unaligned from[0-15] to vsRet __ lvx (vRet, from); __ lvx (vTmp1, fifteen, from); __ lvsl (fromPerm, from); +#ifdef VM_LITTLE_ENDIAN + __ vspltisb (fSplt, 0x0f); __ vxor (fromPerm, fromPerm, fSplt); +#endif __ vperm (vRet, vRet, vTmp1, fromPerm); // align [and byte swap in LE] // load keylen (44 or 52 or 60) __ lwz (keylen, arrayOopDesc::length_offset_in_bytes() - arrayOopDesc::base_offset_in_bytes(T_INT), key); // to load keys - __ lvsr (keyPerm, key); + __ load_perm (keyPerm, key); +#ifdef VM_LITTLE_ENDIAN __ vxor (vTmp2, vTmp2, vTmp2); __ vspltisb (vTmp2, -16); __ vrld (keyPerm, keyPerm, vTmp2); __ vrld (keyPerm, keyPerm, vTmp2); __ vsldoi (keyPerm, keyPerm, keyPerm, 8); +#endif __ cmpwi (CCR0, keylen, 44); __ beq (CCR0, L_do44); @@ -2937,32 +2941,32 @@ class StubGenerator: public StubCodeGenerator { __ cmpwi (CCR0, keylen, 52); __ beq (CCR0, L_do52); - // load the 15th round key to vKey11 + // load the 15th round key to vKey1 __ li (keypos, 240); + __ lvx (vKey1, keypos, key); + __ li (keypos, 224); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vKey2, vKey1, keyPerm); + + // load the 14th round key to vKey2 + __ li (keypos, 208); + __ lvx (vKey3, keypos, key); + __ vec_perm (vKey2, vKey3, vKey2, keyPerm); + + // load the 13th round key to vKey3 + __ li (keypos, 192); + __ lvx (vKey4, keypos, key); + __ vec_perm (vKey3, vKey4, vKey3, keyPerm); + + // load the 12th round key to vKey4 + __ li (keypos, 176); + __ lvx (vKey5, keypos, key); + __ vec_perm (vKey4, vKey5, vKey4, keyPerm); + + // load the 11th round key to vKey5 + __ li (keypos, 160); __ lvx (vTmp1, keypos, key); - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp1, vTmp2, keyPerm); - - // load the 14th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp2, vTmp1, keyPerm); - - // load the 13th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey3, vTmp1, vTmp2, keyPerm); - - // load the 12th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey4, vTmp2, vTmp1, keyPerm); - - // load the 11th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey5, vTmp1, vTmp2, keyPerm); + __ vec_perm (vKey5, vTmp1, vKey5, keyPerm); // 1st - 5th rounds __ vxor (vRet, vRet, vKey1); @@ -2975,22 +2979,22 @@ class StubGenerator: public StubCodeGenerator { __ bind (L_do52); - // load the 13th round key to vKey11 + // load the 13th round key to vKey1 __ li (keypos, 208); - __ lvx (vTmp1, keypos, key); - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp1, vTmp2, keyPerm); + __ lvx (vKey1, keypos, key); + __ li (keypos, 192); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vKey2, vKey1, keyPerm); - // load the 12th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp2, vTmp1, keyPerm); + // load the 12th round key to vKey2 + __ li (keypos, 176); + __ lvx (vKey3, keypos, key); + __ vec_perm (vKey2, vKey3, vKey2, keyPerm); - // load the 11th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey3, vTmp1, vTmp2, keyPerm); + // load the 11th round key to vKey3 + __ li (keypos, 160); + __ lvx (vTmp1, keypos, key); + __ vec_perm (vKey3, vTmp1, vKey3, keyPerm); // 1st - 3rd rounds __ vxor (vRet, vRet, vKey1); @@ -3001,42 +3005,42 @@ class StubGenerator: public StubCodeGenerator { __ bind (L_do44); - // load the 11th round key to vKey11 + // load the 11th round key to vKey1 __ li (keypos, 176); + __ lvx (vKey1, keypos, key); + __ li (keypos, 160); __ lvx (vTmp1, keypos, key); - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp1, vTmp2, keyPerm); + __ vec_perm (vKey1, vTmp1, vKey1, keyPerm); // 1st round __ vxor (vRet, vRet, vKey1); __ bind (L_doLast); - // load the 10th round key to vKey10 - __ addi (keypos, keypos, -16); + // load the 10th round key to vKey1 + __ li (keypos, 144); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vKey2, vTmp1, keyPerm); + + // load the 9th round key to vKey2 + __ li (keypos, 128); + __ lvx (vKey3, keypos, key); + __ vec_perm (vKey2, vKey3, vKey2, keyPerm); + + // load the 8th round key to vKey3 + __ li (keypos, 112); + __ lvx (vKey4, keypos, key); + __ vec_perm (vKey3, vKey4, vKey3, keyPerm); + + // load the 7th round key to vKey4 + __ li (keypos, 96); + __ lvx (vKey5, keypos, key); + __ vec_perm (vKey4, vKey5, vKey4, keyPerm); + + // load the 6th round key to vKey5 + __ li (keypos, 80); __ lvx (vTmp1, keypos, key); - __ vperm (vKey1, vTmp2, vTmp1, keyPerm); - - // load the 9th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey2, vTmp1, vTmp2, keyPerm); - - // load the 8th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey3, vTmp2, vTmp1, keyPerm); - - // load the 7th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey4, vTmp1, vTmp2, keyPerm); - - // load the 6th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey5, vTmp2, vTmp1, keyPerm); + __ vec_perm (vKey5, vTmp1, vKey5, keyPerm); // last 10th - 6th rounds __ vncipher (vRet, vRet, vKey1); @@ -3045,30 +3049,29 @@ class StubGenerator: public StubCodeGenerator { __ vncipher (vRet, vRet, vKey4); __ vncipher (vRet, vRet, vKey5); - // load the 5th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey1, vTmp1, vTmp2, keyPerm); + // load the 5th round key to vKey1 + __ li (keypos, 64); + __ lvx (vKey2, keypos, key); + __ vec_perm (vKey1, vKey2, vTmp1, keyPerm); - // load the 4th round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey2, vTmp2, vTmp1, keyPerm); + // load the 4th round key to vKey2 + __ li (keypos, 48); + __ lvx (vKey3, keypos, key); + __ vec_perm (vKey2, vKey3, vKey2, keyPerm); - // load the 3rd round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey3, vTmp1, vTmp2, keyPerm); + // load the 3rd round key to vKey3 + __ li (keypos, 32); + __ lvx (vKey4, keypos, key); + __ vec_perm (vKey3, vKey4, vKey3, keyPerm); - // load the 2nd round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp1, keypos, key); - __ vperm (vKey4, vTmp2, vTmp1, keyPerm); + // load the 2nd round key to vKey4 + __ li (keypos, 16); + __ lvx (vKey5, keypos, key); + __ vec_perm (vKey4, vKey5, vKey4, keyPerm); - // load the 1st round key to vKey10 - __ addi (keypos, keypos, -16); - __ lvx (vTmp2, keypos, key); - __ vperm (vKey5, vTmp1, vTmp2, keyPerm); + // load the 1st round key to vKey5 + __ lvx (vTmp1, key); + __ vec_perm (vKey5, vTmp1, vKey5, keyPerm); // last 5th - 1th rounds __ vncipher (vRet, vRet, vKey1); @@ -3077,19 +3080,27 @@ class StubGenerator: public StubCodeGenerator { __ vncipher (vRet, vRet, vKey4); __ vncipherlast (vRet, vRet, vKey5); - __ neg (temp, to); - __ lvsr (toPerm, temp); - __ vspltisb (vTmp2, -1); - __ vxor (vTmp1, vTmp1, vTmp1); - __ vperm (vTmp2, vTmp2, vTmp1, toPerm); - __ vxor (toPerm, toPerm, fSplt); + // store result (unaligned) +#ifdef VM_LITTLE_ENDIAN + __ lvsl (toPerm, to); +#else + __ lvsr (toPerm, to); +#endif + __ vspltisb (vTmp3, -1); + __ vspltisb (vTmp4, 0); __ lvx (vTmp1, to); - __ vperm (vRet, vRet, vRet, toPerm); - __ vsel (vTmp1, vTmp1, vRet, vTmp2); - __ lvx (vTmp4, fifteen, to); + __ lvx (vTmp2, fifteen, to); +#ifdef VM_LITTLE_ENDIAN + __ vperm (vTmp3, vTmp3, vTmp4, toPerm); // generate select mask + __ vxor (toPerm, toPerm, fSplt); // swap bytes +#else + __ vperm (vTmp3, vTmp4, vTmp3, toPerm); // generate select mask +#endif + __ vperm (vTmp4, vRet, vRet, toPerm); // rotate data + __ vsel (vTmp2, vTmp4, vTmp2, vTmp3); + __ vsel (vTmp1, vTmp1, vTmp4, vTmp3); + __ stvx (vTmp2, fifteen, to); // store this one first (may alias) __ stvx (vTmp1, to); - __ vsel (vRet, vRet, vTmp4, vTmp2); - __ stvx (vRet, fifteen, to); __ blr(); return start; diff --git a/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp b/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp index a012175c493..da480d73aee 100644 --- a/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp +++ b/src/hotspot/cpu/ppc/stubRoutines_ppc.hpp @@ -34,7 +34,7 @@ static bool returns_to_call_stub(address return_pc) { return return_pc == _call_ enum platform_dependent_constants { code_size1 = 20000, // simply increase if too small (assembler will crash if too small) - code_size2 = 22000 // simply increase if too small (assembler will crash if too small) + code_size2 = 24000 // simply increase if too small (assembler will crash if too small) }; // CRC32 Intrinsics. diff --git a/src/hotspot/cpu/ppc/vm_version_ppc.cpp b/src/hotspot/cpu/ppc/vm_version_ppc.cpp index 6791e0e9040..5faf652a119 100644 --- a/src/hotspot/cpu/ppc/vm_version_ppc.cpp +++ b/src/hotspot/cpu/ppc/vm_version_ppc.cpp @@ -211,7 +211,6 @@ void VM_Version::initialize() { } // The AES intrinsic stubs require AES instruction support. -#if defined(VM_LITTLE_ENDIAN) if (has_vcipher()) { if (FLAG_IS_DEFAULT(UseAES)) { UseAES = true; @@ -232,18 +231,6 @@ void VM_Version::initialize() { FLAG_SET_DEFAULT(UseAESIntrinsics, false); } -#else - if (UseAES) { - warning("AES instructions are not available on this CPU"); - FLAG_SET_DEFAULT(UseAES, false); - } - if (UseAESIntrinsics) { - if (!FLAG_IS_DEFAULT(UseAESIntrinsics)) - warning("AES intrinsics are not available on this CPU"); - FLAG_SET_DEFAULT(UseAESIntrinsics, false); - } -#endif - if (UseAESCTRIntrinsics) { warning("AES/CTR intrinsics are not available on this CPU"); FLAG_SET_DEFAULT(UseAESCTRIntrinsics, false); From bf5816a2c5f61f71eb2317259ce73aced682520e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Erik=20=C3=96sterlund?= Date: Mon, 9 Oct 2017 14:39:59 +0200 Subject: [PATCH 66/80] 8188813: Generalize OrderAccess to use templates Reviewed-by: dholmes, coleenp --- .../aix_ppc/orderAccess_aix_ppc.inline.hpp | 13 +- .../bsd_x86/orderAccess_bsd_x86.inline.hpp | 83 ++++---- .../bsd_zero/orderAccess_bsd_zero.inline.hpp | 4 +- .../orderAccess_linux_aarch64.inline.hpp | 107 ++-------- .../orderAccess_linux_arm.inline.hpp | 190 +++++++++++------- .../orderAccess_linux_ppc.inline.hpp | 14 +- .../orderAccess_linux_s390.inline.hpp | 15 +- .../orderAccess_linux_sparc.inline.hpp | 4 +- .../orderAccess_linux_x86.inline.hpp | 83 ++++---- .../orderAccess_linux_zero.inline.hpp | 4 +- .../orderAccess_solaris_sparc.inline.hpp | 4 +- .../orderAccess_solaris_x86.inline.hpp | 4 +- .../orderAccess_windows_x86.inline.hpp | 64 +++--- .../gc/shared/cardTableModRefBS.inline.hpp | 6 +- .../metaprogramming/primitiveConversions.hpp | 20 ++ src/hotspot/share/oops/oop.inline.hpp | 2 +- src/hotspot/share/oops/oopsHierarchy.hpp | 9 + src/hotspot/share/runtime/atomic.hpp | 4 +- src/hotspot/share/runtime/mutex.cpp | 2 +- src/hotspot/share/runtime/orderAccess.hpp | 88 +++----- .../share/runtime/orderAccess.inline.hpp | 89 +++----- 21 files changed, 376 insertions(+), 433 deletions(-) diff --git a/src/hotspot/os_cpu/aix_ppc/orderAccess_aix_ppc.inline.hpp b/src/hotspot/os_cpu/aix_ppc/orderAccess_aix_ppc.inline.hpp index b6214c15aea..7e71e11d2a3 100644 --- a/src/hotspot/os_cpu/aix_ppc/orderAccess_aix_ppc.inline.hpp +++ b/src/hotspot/os_cpu/aix_ppc/orderAccess_aix_ppc.inline.hpp @@ -78,16 +78,17 @@ inline void OrderAccess::acquire() { inlasm_lwsync(); } inline void OrderAccess::release() { inlasm_lwsync(); } inline void OrderAccess::fence() { inlasm_sync(); } -template<> inline jbyte OrderAccess::specialized_load_acquire (const volatile jbyte* p) { register jbyte t = load(p); inlasm_acquire_reg(t); return t; } -template<> inline jshort OrderAccess::specialized_load_acquire(const volatile jshort* p) { register jshort t = load(p); inlasm_acquire_reg(t); return t; } -template<> inline jint OrderAccess::specialized_load_acquire (const volatile jint* p) { register jint t = load(p); inlasm_acquire_reg(t); return t; } -template<> inline jlong OrderAccess::specialized_load_acquire (const volatile jlong* p) { register jlong t = load(p); inlasm_acquire_reg(t); return t; } +template +struct OrderAccess::PlatformOrderedLoad + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { register T t = Atomic::load(p); inlasm_acquire_reg(t); return t; } +}; #undef inlasm_sync #undef inlasm_lwsync #undef inlasm_eieio #undef inlasm_isync -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_AIX_OJDKPPC_VM_ORDERACCESS_AIX_PPC_INLINE_HPP diff --git a/src/hotspot/os_cpu/bsd_x86/orderAccess_bsd_x86.inline.hpp b/src/hotspot/os_cpu/bsd_x86/orderAccess_bsd_x86.inline.hpp index 038d6f985d5..d2b0674a36d 100644 --- a/src/hotspot/os_cpu/bsd_x86/orderAccess_bsd_x86.inline.hpp +++ b/src/hotspot/os_cpu/bsd_x86/orderAccess_bsd_x86.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -64,46 +64,57 @@ inline void OrderAccess::fence() { } template<> -inline void OrderAccess::specialized_release_store_fence (volatile jbyte* p, jbyte v) { - __asm__ volatile ( "xchgb (%2),%0" - : "=q" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<1, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgb (%2),%0" + : "=q" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; + template<> -inline void OrderAccess::specialized_release_store_fence(volatile jshort* p, jshort v) { - __asm__ volatile ( "xchgw (%2),%0" - : "=r" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<2, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgw (%2),%0" + : "=r" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; + template<> -inline void OrderAccess::specialized_release_store_fence (volatile jint* p, jint v) { - __asm__ volatile ( "xchgl (%2),%0" - : "=r" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<4, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgl (%2),%0" + : "=r" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; #ifdef AMD64 template<> -inline void OrderAccess::specialized_release_store_fence (volatile jlong* p, jlong v) { - __asm__ volatile ( "xchgq (%2), %0" - : "=r" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<8, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgq (%2), %0" + : "=r" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; #endif // AMD64 -template<> -inline void OrderAccess::specialized_release_store_fence (volatile jfloat* p, jfloat v) { - release_store_fence((volatile jint*)p, jint_cast(v)); -} -template<> -inline void OrderAccess::specialized_release_store_fence(volatile jdouble* p, jdouble v) { - release_store_fence((volatile jlong*)p, jlong_cast(v)); -} - -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_BSD_X86_VM_ORDERACCESS_BSD_X86_INLINE_HPP diff --git a/src/hotspot/os_cpu/bsd_zero/orderAccess_bsd_zero.inline.hpp b/src/hotspot/os_cpu/bsd_zero/orderAccess_bsd_zero.inline.hpp index fb3017ce9d1..96ea19a4a70 100644 --- a/src/hotspot/os_cpu/bsd_zero/orderAccess_bsd_zero.inline.hpp +++ b/src/hotspot/os_cpu/bsd_zero/orderAccess_bsd_zero.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * Copyright 2007, 2008, 2009 Red Hat, Inc. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * @@ -74,6 +74,4 @@ inline void OrderAccess::acquire() { LIGHT_MEM_BARRIER; } inline void OrderAccess::release() { LIGHT_MEM_BARRIER; } inline void OrderAccess::fence() { FULL_MEM_BARRIER; } -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_BSD_ZERO_VM_ORDERACCESS_BSD_ZERO_INLINE_HPP diff --git a/src/hotspot/os_cpu/linux_aarch64/orderAccess_linux_aarch64.inline.hpp b/src/hotspot/os_cpu/linux_aarch64/orderAccess_linux_aarch64.inline.hpp index dcbce021456..32164dd3058 100644 --- a/src/hotspot/os_cpu/linux_aarch64/orderAccess_linux_aarch64.inline.hpp +++ b/src/hotspot/os_cpu/linux_aarch64/orderAccess_linux_aarch64.inline.hpp @@ -50,93 +50,28 @@ inline void OrderAccess::fence() { FULL_MEM_BARRIER; } -inline jbyte OrderAccess::load_acquire(const volatile jbyte* p) -{ jbyte data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline jshort OrderAccess::load_acquire(const volatile jshort* p) -{ jshort data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline jint OrderAccess::load_acquire(const volatile jint* p) -{ jint data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline jlong OrderAccess::load_acquire(const volatile jlong* p) -{ jlong data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline jubyte OrderAccess::load_acquire(const volatile jubyte* p) -{ jubyte data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline jushort OrderAccess::load_acquire(const volatile jushort* p) -{ jushort data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline juint OrderAccess::load_acquire(const volatile juint* p) -{ juint data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline julong OrderAccess::load_acquire(const volatile julong* p) -{ julong data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline jfloat OrderAccess::load_acquire(const volatile jfloat* p) -{ jfloat data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline jdouble OrderAccess::load_acquire(const volatile jdouble* p) -{ jdouble data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline intptr_t OrderAccess::load_ptr_acquire(const volatile intptr_t* p) -{ intptr_t data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } -inline void* OrderAccess::load_ptr_acquire(const volatile void* p) -{ void* data; __atomic_load((void* const volatile *)p, &data, __ATOMIC_ACQUIRE); return data; } +template +struct OrderAccess::PlatformOrderedLoad + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { T data; __atomic_load(p, &data, __ATOMIC_ACQUIRE); return data; } +}; -inline void OrderAccess::release_store(volatile jbyte* p, jbyte v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile jshort* p, jshort v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile jint* p, jint v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile jlong* p, jlong v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile jubyte* p, jubyte v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile jushort* p, jushort v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile juint* p, juint v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile julong* p, julong v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile jfloat* p, jfloat v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store(volatile jdouble* p, jdouble v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store_ptr(volatile intptr_t* p, intptr_t v) -{ __atomic_store(p, &v, __ATOMIC_RELEASE); } -inline void OrderAccess::release_store_ptr(volatile void* p, void* v) -{ __atomic_store((void* volatile *)p, &v, __ATOMIC_RELEASE); } +template +struct OrderAccess::PlatformOrderedStore + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { __atomic_store(p, &v, __ATOMIC_RELEASE); } +}; -inline void OrderAccess::store_fence(jbyte* p, jbyte v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(jshort* p, jshort v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(jint* p, jint v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(jlong* p, jlong v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(jubyte* p, jubyte v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(jushort* p, jushort v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(juint* p, juint v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(julong* p, julong v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(jfloat* p, jfloat v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_fence(jdouble* p, jdouble v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_ptr_fence(intptr_t* p, intptr_t v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } -inline void OrderAccess::store_ptr_fence(void** p, void* v) -{ __atomic_store(p, &v, __ATOMIC_RELAXED); fence(); } - -inline void OrderAccess::release_store_fence(volatile jbyte* p, jbyte v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile jshort* p, jshort v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile jint* p, jint v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile jlong* p, jlong v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile jubyte* p, jubyte v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile jushort* p, jushort v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile juint* p, juint v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile julong* p, julong v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile jfloat* p, jfloat v) { release_store(p, v); fence(); } -inline void OrderAccess::release_store_fence(volatile jdouble* p, jdouble v) { release_store(p, v); fence(); } - -inline void OrderAccess::release_store_ptr_fence(volatile intptr_t* p, intptr_t v) { release_store_ptr(p, v); fence(); } -inline void OrderAccess::release_store_ptr_fence(volatile void* p, void* v) { release_store_ptr(p, v); fence(); } +template +struct OrderAccess::PlatformOrderedStore + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { release_store(p, v); fence(); } +}; #endif // OS_CPU_LINUX_AARCH64_VM_ORDERACCESS_LINUX_AARCH64_INLINE_HPP diff --git a/src/hotspot/os_cpu/linux_arm/orderAccess_linux_arm.inline.hpp b/src/hotspot/os_cpu/linux_arm/orderAccess_linux_arm.inline.hpp index a115dd82311..4a737c12a90 100644 --- a/src/hotspot/os_cpu/linux_arm/orderAccess_linux_arm.inline.hpp +++ b/src/hotspot/os_cpu/linux_arm/orderAccess_linux_arm.inline.hpp @@ -33,7 +33,6 @@ // - we define the high level barriers below and use the general // implementation in orderAccess.inline.hpp, with customizations // on AARCH64 via the specialized_* template functions -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 // Memory Ordering on ARM is weak. // @@ -131,91 +130,126 @@ inline void OrderAccess::fence() { dmb_sy(); } #ifdef AARCH64 -template<> inline jbyte OrderAccess::specialized_load_acquire(const volatile jbyte* p) { - volatile jbyte result; - __asm__ volatile( - "ldarb %w[res], [%[ptr]]" - : [res] "=&r" (result) - : [ptr] "r" (p) - : "memory"); - return result; -} +template<> +struct OrderAccess::PlatformOrderedLoad<1, X_ACQUIRE> + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { + volatile T result; + __asm__ volatile( + "ldarb %w[res], [%[ptr]]" + : [res] "=&r" (result) + : [ptr] "r" (p) + : "memory"); + return result; + } +}; -template<> inline jshort OrderAccess::specialized_load_acquire(const volatile jshort* p) { - volatile jshort result; - __asm__ volatile( - "ldarh %w[res], [%[ptr]]" - : [res] "=&r" (result) - : [ptr] "r" (p) - : "memory"); - return result; -} +template<> +struct OrderAccess::PlatformOrderedLoad<2, X_ACQUIRE> + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { + volatile T result; + __asm__ volatile( + "ldarh %w[res], [%[ptr]]" + : [res] "=&r" (result) + : [ptr] "r" (p) + : "memory"); + return result; + } +}; -template<> inline jint OrderAccess::specialized_load_acquire(const volatile jint* p) { - volatile jint result; - __asm__ volatile( - "ldar %w[res], [%[ptr]]" - : [res] "=&r" (result) - : [ptr] "r" (p) - : "memory"); - return result; -} +template<> +struct OrderAccess::PlatformOrderedLoad<4, X_ACQUIRE> + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { + volatile T result; + __asm__ volatile( + "ldar %w[res], [%[ptr]]" + : [res] "=&r" (result) + : [ptr] "r" (p) + : "memory"); + return result; + } +}; -template<> inline jfloat OrderAccess::specialized_load_acquire(const volatile jfloat* p) { - return jfloat_cast(specialized_load_acquire((const volatile jint*)p)); -} +template<> +struct OrderAccess::PlatformOrderedLoad<8, X_ACQUIRE> + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { + volatile T result; + __asm__ volatile( + "ldar %[res], [%[ptr]]" + : [res] "=&r" (result) + : [ptr] "r" (p) + : "memory"); + return result; + } +}; -// This is implicit as jlong and intptr_t are both "long int" -//template<> inline jlong OrderAccess::specialized_load_acquire(const volatile jlong* p) { -// return (volatile jlong)specialized_load_acquire((const volatile intptr_t*)p); -//} +template<> +struct OrderAccess::PlatformOrderedStore<1, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile( + "stlrb %w[val], [%[ptr]]" + : + : [ptr] "r" (p), [val] "r" (v) + : "memory"); + } +}; -template<> inline intptr_t OrderAccess::specialized_load_acquire(const volatile intptr_t* p) { - volatile intptr_t result; - __asm__ volatile( - "ldar %[res], [%[ptr]]" - : [res] "=&r" (result) - : [ptr] "r" (p) - : "memory"); - return result; -} +template<> +struct OrderAccess::PlatformOrderedStore<2, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile( + "stlrh %w[val], [%[ptr]]" + : + : [ptr] "r" (p), [val] "r" (v) + : "memory"); + } +}; -template<> inline jdouble OrderAccess::specialized_load_acquire(const volatile jdouble* p) { - return jdouble_cast(specialized_load_acquire((const volatile intptr_t*)p)); -} +template<> +struct OrderAccess::PlatformOrderedStore<4, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile( + "stlr %w[val], [%[ptr]]" + : + : [ptr] "r" (p), [val] "r" (v) + : "memory"); + } +}; +template<> +struct OrderAccess::PlatformOrderedStore<8, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile( + "stlr %[val], [%[ptr]]" + : + : [ptr] "r" (p), [val] "r" (v) + : "memory"); + } +}; -template<> inline void OrderAccess::specialized_release_store(volatile jbyte* p, jbyte v) { - __asm__ volatile( - "stlrb %w[val], [%[ptr]]" - : - : [ptr] "r" (p), [val] "r" (v) - : "memory"); -} - -template<> inline void OrderAccess::specialized_release_store(volatile jshort* p, jshort v) { - __asm__ volatile( - "stlrh %w[val], [%[ptr]]" - : - : [ptr] "r" (p), [val] "r" (v) - : "memory"); -} - -template<> inline void OrderAccess::specialized_release_store(volatile jint* p, jint v) { - __asm__ volatile( - "stlr %w[val], [%[ptr]]" - : - : [ptr] "r" (p), [val] "r" (v) - : "memory"); -} - -template<> inline void OrderAccess::specialized_release_store(volatile jlong* p, jlong v) { - __asm__ volatile( - "stlr %[val], [%[ptr]]" - : - : [ptr] "r" (p), [val] "r" (v) - : "memory"); -} #endif // AARCH64 #endif // OS_CPU_LINUX_ARM_VM_ORDERACCESS_LINUX_ARM_INLINE_HPP diff --git a/src/hotspot/os_cpu/linux_ppc/orderAccess_linux_ppc.inline.hpp b/src/hotspot/os_cpu/linux_ppc/orderAccess_linux_ppc.inline.hpp index d41b788ab68..2f600407727 100644 --- a/src/hotspot/os_cpu/linux_ppc/orderAccess_linux_ppc.inline.hpp +++ b/src/hotspot/os_cpu/linux_ppc/orderAccess_linux_ppc.inline.hpp @@ -80,10 +80,14 @@ inline void OrderAccess::acquire() { inlasm_lwsync(); } inline void OrderAccess::release() { inlasm_lwsync(); } inline void OrderAccess::fence() { inlasm_sync(); } -template<> inline jbyte OrderAccess::specialized_load_acquire (const volatile jbyte* p) { register jbyte t = load(p); inlasm_acquire_reg(t); return t; } -template<> inline jshort OrderAccess::specialized_load_acquire(const volatile jshort* p) { register jshort t = load(p); inlasm_acquire_reg(t); return t; } -template<> inline jint OrderAccess::specialized_load_acquire (const volatile jint* p) { register jint t = load(p); inlasm_acquire_reg(t); return t; } -template<> inline jlong OrderAccess::specialized_load_acquire (const volatile jlong* p) { register jlong t = load(p); inlasm_acquire_reg(t); return t; } + +template +struct OrderAccess::PlatformOrderedLoad + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { register T t = Atomic::load(p); inlasm_acquire_reg(t); return t; } +}; #undef inlasm_sync #undef inlasm_lwsync @@ -91,6 +95,4 @@ template<> inline jlong OrderAccess::specialized_load_acquire (const vol #undef inlasm_isync #undef inlasm_acquire_reg -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_LINUX_PPC_VM_ORDERACCESS_LINUX_PPC_INLINE_HPP diff --git a/src/hotspot/os_cpu/linux_s390/orderAccess_linux_s390.inline.hpp b/src/hotspot/os_cpu/linux_s390/orderAccess_linux_s390.inline.hpp index 2de7fb6a81f..89401f03553 100644 --- a/src/hotspot/os_cpu/linux_s390/orderAccess_linux_s390.inline.hpp +++ b/src/hotspot/os_cpu/linux_s390/orderAccess_linux_s390.inline.hpp @@ -74,10 +74,13 @@ inline void OrderAccess::acquire() { inlasm_zarch_acquire(); } inline void OrderAccess::release() { inlasm_zarch_release(); } inline void OrderAccess::fence() { inlasm_zarch_sync(); } -template<> inline jbyte OrderAccess::specialized_load_acquire (const volatile jbyte* p) { register jbyte t = *p; inlasm_zarch_acquire(); return t; } -template<> inline jshort OrderAccess::specialized_load_acquire(const volatile jshort* p) { register jshort t = *p; inlasm_zarch_acquire(); return t; } -template<> inline jint OrderAccess::specialized_load_acquire (const volatile jint* p) { register jint t = *p; inlasm_zarch_acquire(); return t; } -template<> inline jlong OrderAccess::specialized_load_acquire (const volatile jlong* p) { register jlong t = *p; inlasm_zarch_acquire(); return t; } +template +struct OrderAccess::PlatformOrderedLoad + VALUE_OBJ_CLASS_SPEC +{ + template + T operator()(const volatile T* p) const { register T t = *p; inlasm_zarch_acquire(); return t; } +}; #undef inlasm_compiler_barrier #undef inlasm_zarch_sync @@ -85,8 +88,4 @@ template<> inline jlong OrderAccess::specialized_load_acquire (const vol #undef inlasm_zarch_acquire #undef inlasm_zarch_fence -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_LINUX_S390_VM_ORDERACCESS_LINUX_S390_INLINE_HPP - - diff --git a/src/hotspot/os_cpu/linux_sparc/orderAccess_linux_sparc.inline.hpp b/src/hotspot/os_cpu/linux_sparc/orderAccess_linux_sparc.inline.hpp index fd6078fcd31..c9fde925f7e 100644 --- a/src/hotspot/os_cpu/linux_sparc/orderAccess_linux_sparc.inline.hpp +++ b/src/hotspot/os_cpu/linux_sparc/orderAccess_linux_sparc.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -48,6 +48,4 @@ inline void OrderAccess::fence() { __asm__ volatile ("membar #StoreLoad" : : : "memory"); } -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_LINUX_SPARC_VM_ORDERACCESS_LINUX_SPARC_INLINE_HPP diff --git a/src/hotspot/os_cpu/linux_x86/orderAccess_linux_x86.inline.hpp b/src/hotspot/os_cpu/linux_x86/orderAccess_linux_x86.inline.hpp index 0f564216e13..0d5585b6e70 100644 --- a/src/hotspot/os_cpu/linux_x86/orderAccess_linux_x86.inline.hpp +++ b/src/hotspot/os_cpu/linux_x86/orderAccess_linux_x86.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -60,46 +60,57 @@ inline void OrderAccess::fence() { } template<> -inline void OrderAccess::specialized_release_store_fence (volatile jbyte* p, jbyte v) { - __asm__ volatile ( "xchgb (%2),%0" - : "=q" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<1, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgb (%2),%0" + : "=q" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; + template<> -inline void OrderAccess::specialized_release_store_fence(volatile jshort* p, jshort v) { - __asm__ volatile ( "xchgw (%2),%0" - : "=r" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<2, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgw (%2),%0" + : "=r" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; + template<> -inline void OrderAccess::specialized_release_store_fence (volatile jint* p, jint v) { - __asm__ volatile ( "xchgl (%2),%0" - : "=r" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<4, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgl (%2),%0" + : "=r" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; #ifdef AMD64 template<> -inline void OrderAccess::specialized_release_store_fence (volatile jlong* p, jlong v) { - __asm__ volatile ( "xchgq (%2), %0" - : "=r" (v) - : "0" (v), "r" (p) - : "memory"); -} +struct OrderAccess::PlatformOrderedStore<8, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm__ volatile ( "xchgq (%2), %0" + : "=r" (v) + : "0" (v), "r" (p) + : "memory"); + } +}; #endif // AMD64 -template<> -inline void OrderAccess::specialized_release_store_fence (volatile jfloat* p, jfloat v) { - release_store_fence((volatile jint*)p, jint_cast(v)); -} -template<> -inline void OrderAccess::specialized_release_store_fence(volatile jdouble* p, jdouble v) { - release_store_fence((volatile jlong*)p, jlong_cast(v)); -} - -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_LINUX_X86_VM_ORDERACCESS_LINUX_X86_INLINE_HPP diff --git a/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp b/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp index 6bda67d54d6..8c4cd1c7a1c 100644 --- a/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp +++ b/src/hotspot/os_cpu/linux_zero/orderAccess_linux_zero.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * Copyright 2007, 2008, 2009 Red Hat, Inc. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * @@ -83,6 +83,4 @@ inline void OrderAccess::release() { LIGHT_MEM_BARRIER; } inline void OrderAccess::fence() { FULL_MEM_BARRIER; } -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_LINUX_ZERO_VM_ORDERACCESS_LINUX_ZERO_INLINE_HPP diff --git a/src/hotspot/os_cpu/solaris_sparc/orderAccess_solaris_sparc.inline.hpp b/src/hotspot/os_cpu/solaris_sparc/orderAccess_solaris_sparc.inline.hpp index 7a74147d6a0..b60cd092c50 100644 --- a/src/hotspot/os_cpu/solaris_sparc/orderAccess_solaris_sparc.inline.hpp +++ b/src/hotspot/os_cpu/solaris_sparc/orderAccess_solaris_sparc.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -52,6 +52,4 @@ inline void OrderAccess::fence() { __asm__ volatile ("membar #StoreLoad" : : : "memory"); } -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_SOLARIS_SPARC_VM_ORDERACCESS_SOLARIS_SPARC_INLINE_HPP diff --git a/src/hotspot/os_cpu/solaris_x86/orderAccess_solaris_x86.inline.hpp b/src/hotspot/os_cpu/solaris_x86/orderAccess_solaris_x86.inline.hpp index b88e715e4d4..bd676dbe62f 100644 --- a/src/hotspot/os_cpu/solaris_x86/orderAccess_solaris_x86.inline.hpp +++ b/src/hotspot/os_cpu/solaris_x86/orderAccess_solaris_x86.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -58,6 +58,4 @@ inline void OrderAccess::fence() { compiler_barrier(); } -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_SOLARIS_X86_VM_ORDERACCESS_SOLARIS_X86_INLINE_HPP diff --git a/src/hotspot/os_cpu/windows_x86/orderAccess_windows_x86.inline.hpp b/src/hotspot/os_cpu/windows_x86/orderAccess_windows_x86.inline.hpp index 36c1c4a42c0..57488f4acf7 100644 --- a/src/hotspot/os_cpu/windows_x86/orderAccess_windows_x86.inline.hpp +++ b/src/hotspot/os_cpu/windows_x86/orderAccess_windows_x86.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2003, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2003, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -74,42 +74,46 @@ inline void OrderAccess::fence() { #ifndef AMD64 template<> -inline void OrderAccess::specialized_release_store_fence (volatile jbyte* p, jbyte v) { - __asm { - mov edx, p; - mov al, v; - xchg al, byte ptr [edx]; +struct OrderAccess::PlatformOrderedStore<1, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm { + mov edx, p; + mov al, v; + xchg al, byte ptr [edx]; + } } -} +}; template<> -inline void OrderAccess::specialized_release_store_fence(volatile jshort* p, jshort v) { - __asm { - mov edx, p; - mov ax, v; - xchg ax, word ptr [edx]; +struct OrderAccess::PlatformOrderedStore<2, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm { + mov edx, p; + mov ax, v; + xchg ax, word ptr [edx]; + } } -} +}; template<> -inline void OrderAccess::specialized_release_store_fence (volatile jint* p, jint v) { - __asm { - mov edx, p; - mov eax, v; - xchg eax, dword ptr [edx]; +struct OrderAccess::PlatformOrderedStore<4, RELEASE_X_FENCE> + VALUE_OBJ_CLASS_SPEC +{ + template + void operator()(T v, volatile T* p) const { + __asm { + mov edx, p; + mov eax, v; + xchg eax, dword ptr [edx]; + } } -} +}; #endif // AMD64 -template<> -inline void OrderAccess::specialized_release_store_fence(volatile jfloat* p, jfloat v) { - release_store_fence((volatile jint*)p, jint_cast(v)); -} -template<> -inline void OrderAccess::specialized_release_store_fence(volatile jdouble* p, jdouble v) { - release_store_fence((volatile jlong*)p, jlong_cast(v)); -} - -#define VM_HAS_GENERALIZED_ORDER_ACCESS 1 - #endif // OS_CPU_WINDOWS_X86_VM_ORDERACCESS_WINDOWS_X86_INLINE_HPP diff --git a/src/hotspot/share/gc/shared/cardTableModRefBS.inline.hpp b/src/hotspot/share/gc/shared/cardTableModRefBS.inline.hpp index 7b01a379558..bce8661cf86 100644 --- a/src/hotspot/share/gc/shared/cardTableModRefBS.inline.hpp +++ b/src/hotspot/share/gc/shared/cardTableModRefBS.inline.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2000, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -30,10 +30,10 @@ #include "runtime/orderAccess.inline.hpp" template inline void CardTableModRefBS::inline_write_ref_field(T* field, oop newVal, bool release) { - jbyte* byte = byte_for((void*)field); + volatile jbyte* byte = byte_for((void*)field); if (release) { // Perform a releasing store if requested. - OrderAccess::release_store((volatile jbyte*) byte, dirty_card); + OrderAccess::release_store(byte, jbyte(dirty_card)); } else { *byte = dirty_card; } diff --git a/src/hotspot/share/metaprogramming/primitiveConversions.hpp b/src/hotspot/share/metaprogramming/primitiveConversions.hpp index c3482d7c0d1..8041492e9cb 100644 --- a/src/hotspot/share/metaprogramming/primitiveConversions.hpp +++ b/src/hotspot/share/metaprogramming/primitiveConversions.hpp @@ -167,4 +167,24 @@ inline T PrimitiveConversions::cast(U x) { return Cast()(x); } +// jfloat and jdouble translation to integral types + +template<> +struct PrimitiveConversions::Translate : public TrueType { + typedef double Value; + typedef int64_t Decayed; + + static Decayed decay(Value x) { return PrimitiveConversions::cast(x); } + static Value recover(Decayed x) { return PrimitiveConversions::cast(x); } +}; + +template<> +struct PrimitiveConversions::Translate : public TrueType { + typedef float Value; + typedef int32_t Decayed; + + static Decayed decay(Value x) { return PrimitiveConversions::cast(x); } + static Value recover(Decayed x) { return PrimitiveConversions::cast(x); } +}; + #endif // SHARE_VM_METAPROGRAMMING_PRIMITIVECONVERSIONS_HPP diff --git a/src/hotspot/share/oops/oop.inline.hpp b/src/hotspot/share/oops/oop.inline.hpp index 3e33fd35d81..83c5b564b85 100644 --- a/src/hotspot/share/oops/oop.inline.hpp +++ b/src/hotspot/share/oops/oop.inline.hpp @@ -501,7 +501,7 @@ jchar oopDesc::char_field_acquire(int offset) const { return O void oopDesc::release_char_field_put(int offset, jchar contents) { OrderAccess::release_store(char_field_addr(offset), contents); } jboolean oopDesc::bool_field_acquire(int offset) const { return OrderAccess::load_acquire(bool_field_addr(offset)); } -void oopDesc::release_bool_field_put(int offset, jboolean contents) { OrderAccess::release_store(bool_field_addr(offset), (contents & 1)); } +void oopDesc::release_bool_field_put(int offset, jboolean contents) { OrderAccess::release_store(bool_field_addr(offset), jboolean(contents & 1)); } jint oopDesc::int_field_acquire(int offset) const { return OrderAccess::load_acquire(int_field_addr(offset)); } void oopDesc::release_int_field_put(int offset, jint contents) { OrderAccess::release_store(int_field_addr(offset), contents); } diff --git a/src/hotspot/share/oops/oopsHierarchy.hpp b/src/hotspot/share/oops/oopsHierarchy.hpp index 36c93c12c13..bbab7d2428d 100644 --- a/src/hotspot/share/oops/oopsHierarchy.hpp +++ b/src/hotspot/share/oops/oopsHierarchy.hpp @@ -177,6 +177,15 @@ struct PrimitiveConversions::Translate : public TrueType { (void)const_cast(oop::operator=(o)); \ return *this; \ } \ + }; \ + \ + template<> \ + struct PrimitiveConversions::Translate : public TrueType { \ + typedef type##Oop Value; \ + typedef type##OopDesc* Decayed; \ + \ + static Decayed decay(Value x) { return (type##OopDesc*)x.obj(); } \ + static Value recover(Decayed x) { return type##Oop(x); } \ }; DEF_OOP(instance); diff --git a/src/hotspot/share/runtime/atomic.hpp b/src/hotspot/share/runtime/atomic.hpp index 69376db06ad..0522f295d7c 100644 --- a/src/hotspot/share/runtime/atomic.hpp +++ b/src/hotspot/share/runtime/atomic.hpp @@ -44,7 +44,7 @@ enum cmpxchg_memory_order { }; class Atomic : AllStatic { - public: +public: // Atomic operations on jlong types are not available on all 32-bit // platforms. If atomic ops on jlongs are defined here they must only // be used from code that verifies they are available at runtime and @@ -175,6 +175,7 @@ private: // that is needed here. template struct IsPointerConvertible; +protected: // Dispatch handler for store. Provides type-based validity // checking and limited conversions around calls to the platform- // specific implementation layer provided by PlatformOp. @@ -226,6 +227,7 @@ private: // requires more for e.g. 64 bit loads, a specialization is required template struct PlatformLoad; +private: // Dispatch handler for add. Provides type-based validity checking // and limited conversions around calls to the platform-specific // implementation layer provided by PlatformAdd. diff --git a/src/hotspot/share/runtime/mutex.cpp b/src/hotspot/share/runtime/mutex.cpp index b04d185bd8e..db56894fddb 100644 --- a/src/hotspot/share/runtime/mutex.cpp +++ b/src/hotspot/share/runtime/mutex.cpp @@ -526,7 +526,7 @@ void Monitor::IUnlock(bool RelaxAssert) { // Note that the OrderAccess::storeload() fence that appears after unlock store // provides for progress conditions and succession and is _not related to exclusion // safety or lock release consistency. - OrderAccess::release_store(&_LockWord.Bytes[_LSBINDEX], 0); // drop outer lock + OrderAccess::release_store(&_LockWord.Bytes[_LSBINDEX], jbyte(0)); // drop outer lock OrderAccess::storeload(); ParkEvent * const w = _OnDeck; // raw load as we will just return if non-NULL diff --git a/src/hotspot/share/runtime/orderAccess.hpp b/src/hotspot/share/runtime/orderAccess.hpp index f0970986437..1682395fdfe 100644 --- a/src/hotspot/share/runtime/orderAccess.hpp +++ b/src/hotspot/share/runtime/orderAccess.hpp @@ -26,6 +26,7 @@ #define SHARE_VM_RUNTIME_ORDERACCESS_HPP #include "memory/allocation.hpp" +#include "runtime/atomic.hpp" // Memory Access Ordering Model // @@ -252,7 +253,7 @@ class ScopedFence : public ScopedFenceGeneral { void postfix() { ScopedFenceGeneral::postfix(); } }; -class OrderAccess : AllStatic { +class OrderAccess : private Atomic { public: // barriers static void loadload(); @@ -264,44 +265,20 @@ class OrderAccess : AllStatic { static void release(); static void fence(); - static jbyte load_acquire(const volatile jbyte* p); - static jshort load_acquire(const volatile jshort* p); - static jint load_acquire(const volatile jint* p); - static jlong load_acquire(const volatile jlong* p); - static jubyte load_acquire(const volatile jubyte* p); - static jushort load_acquire(const volatile jushort* p); - static juint load_acquire(const volatile juint* p); - static julong load_acquire(const volatile julong* p); - static jfloat load_acquire(const volatile jfloat* p); - static jdouble load_acquire(const volatile jdouble* p); + template + static T load_acquire(const volatile T* p); static intptr_t load_ptr_acquire(const volatile intptr_t* p); static void* load_ptr_acquire(const volatile void* p); - static void release_store(volatile jbyte* p, jbyte v); - static void release_store(volatile jshort* p, jshort v); - static void release_store(volatile jint* p, jint v); - static void release_store(volatile jlong* p, jlong v); - static void release_store(volatile jubyte* p, jubyte v); - static void release_store(volatile jushort* p, jushort v); - static void release_store(volatile juint* p, juint v); - static void release_store(volatile julong* p, julong v); - static void release_store(volatile jfloat* p, jfloat v); - static void release_store(volatile jdouble* p, jdouble v); + template + static void release_store(volatile D* p, T v); static void release_store_ptr(volatile intptr_t* p, intptr_t v); static void release_store_ptr(volatile void* p, void* v); - static void release_store_fence(volatile jbyte* p, jbyte v); - static void release_store_fence(volatile jshort* p, jshort v); - static void release_store_fence(volatile jint* p, jint v); - static void release_store_fence(volatile jlong* p, jlong v); - static void release_store_fence(volatile jubyte* p, jubyte v); - static void release_store_fence(volatile jushort* p, jushort v); - static void release_store_fence(volatile juint* p, juint v); - static void release_store_fence(volatile julong* p, julong v); - static void release_store_fence(volatile jfloat* p, jfloat v); - static void release_store_fence(volatile jdouble* p, jdouble v); + template + static void release_store_fence(volatile D* p, T v); static void release_store_ptr_fence(volatile intptr_t* p, intptr_t v); static void release_store_ptr_fence(volatile void* p, void* v); @@ -313,45 +290,34 @@ class OrderAccess : AllStatic { static void StubRoutines_fence(); // Give platforms a variation point to specialize. - template static T specialized_load_acquire (const volatile T* p); - template static void specialized_release_store (volatile T* p, T v); - template static void specialized_release_store_fence(volatile T* p, T v); + template struct PlatformOrderedStore; + template struct PlatformOrderedLoad; template static void ordered_store(volatile FieldType* p, FieldType v); template static FieldType ordered_load(const volatile FieldType* p); +}; - static void store(volatile jbyte* p, jbyte v); - static void store(volatile jshort* p, jshort v); - static void store(volatile jint* p, jint v); - static void store(volatile jlong* p, jlong v); - static void store(volatile jdouble* p, jdouble v); - static void store(volatile jfloat* p, jfloat v); +// The following methods can be specialized using simple template specialization +// in the platform specific files for optimization purposes. Otherwise the +// generalized variant is used. - static jbyte load(const volatile jbyte* p); - static jshort load(const volatile jshort* p); - static jint load(const volatile jint* p); - static jlong load(const volatile jlong* p); - static jdouble load(const volatile jdouble* p); - static jfloat load(const volatile jfloat* p); +template +struct OrderAccess::PlatformOrderedStore VALUE_OBJ_CLASS_SPEC { + template + void operator()(T v, volatile T* p) const { + ordered_store(p, v); + } +}; - // The following store_fence methods are deprecated and will be removed - // when all repos conform to the new generalized OrderAccess. - static void store_fence(jbyte* p, jbyte v); - static void store_fence(jshort* p, jshort v); - static void store_fence(jint* p, jint v); - static void store_fence(jlong* p, jlong v); - static void store_fence(jubyte* p, jubyte v); - static void store_fence(jushort* p, jushort v); - static void store_fence(juint* p, juint v); - static void store_fence(julong* p, julong v); - static void store_fence(jfloat* p, jfloat v); - static void store_fence(jdouble* p, jdouble v); - - static void store_ptr_fence(intptr_t* p, intptr_t v); - static void store_ptr_fence(void** p, void* v); +template +struct OrderAccess::PlatformOrderedLoad VALUE_OBJ_CLASS_SPEC { + template + T operator()(const volatile T* p) const { + return ordered_load(p); + } }; #endif // SHARE_VM_RUNTIME_ORDERACCESS_HPP diff --git a/src/hotspot/share/runtime/orderAccess.inline.hpp b/src/hotspot/share/runtime/orderAccess.inline.hpp index 1fa2185dd45..4b7ab3911ff 100644 --- a/src/hotspot/share/runtime/orderAccess.inline.hpp +++ b/src/hotspot/share/runtime/orderAccess.inline.hpp @@ -26,14 +26,11 @@ #ifndef SHARE_VM_RUNTIME_ORDERACCESS_INLINE_HPP #define SHARE_VM_RUNTIME_ORDERACCESS_INLINE_HPP -#include "runtime/atomic.hpp" #include "runtime/orderAccess.hpp" #include "utilities/macros.hpp" #include OS_CPU_HEADER_INLINE(orderAccess) -#ifdef VM_HAS_GENERALIZED_ORDER_ACCESS - template<> inline void ScopedFenceGeneral::postfix() { OrderAccess::acquire(); } template<> inline void ScopedFenceGeneral::prefix() { OrderAccess::release(); } template<> inline void ScopedFenceGeneral::prefix() { OrderAccess::release(); } @@ -43,80 +40,42 @@ template<> inline void ScopedFenceGeneral::postfix() { OrderAcc template inline void OrderAccess::ordered_store(volatile FieldType* p, FieldType v) { ScopedFence f((void*)p); - store(p, v); + Atomic::store(v, p); } template inline FieldType OrderAccess::ordered_load(const volatile FieldType* p) { ScopedFence f((void*)p); - return load(p); + return Atomic::load(p); } -inline jbyte OrderAccess::load_acquire(const volatile jbyte* p) { return specialized_load_acquire(p); } -inline jshort OrderAccess::load_acquire(const volatile jshort* p) { return specialized_load_acquire(p); } -inline jint OrderAccess::load_acquire(const volatile jint* p) { return specialized_load_acquire(p); } -inline jlong OrderAccess::load_acquire(const volatile jlong* p) { return specialized_load_acquire(p); } -inline jfloat OrderAccess::load_acquire(const volatile jfloat* p) { return specialized_load_acquire(p); } -inline jdouble OrderAccess::load_acquire(const volatile jdouble* p) { return specialized_load_acquire(p); } -inline jubyte OrderAccess::load_acquire(const volatile jubyte* p) { return (jubyte) specialized_load_acquire((const volatile jbyte*)p); } -inline jushort OrderAccess::load_acquire(const volatile jushort* p) { return (jushort)specialized_load_acquire((const volatile jshort*)p); } -inline juint OrderAccess::load_acquire(const volatile juint* p) { return (juint) specialized_load_acquire((const volatile jint*)p); } -inline julong OrderAccess::load_acquire(const volatile julong* p) { return (julong) specialized_load_acquire((const volatile jlong*)p); } +template +inline T OrderAccess::load_acquire(const volatile T* p) { + return LoadImpl >()(p); +} -inline intptr_t OrderAccess::load_ptr_acquire(const volatile intptr_t* p) { return (intptr_t)specialized_load_acquire(p); } -inline void* OrderAccess::load_ptr_acquire(const volatile void* p) { return (void*)specialized_load_acquire((const volatile intptr_t*)p); } +inline intptr_t OrderAccess::load_ptr_acquire(const volatile intptr_t* p) { + return load_acquire(p); +} -inline void OrderAccess::release_store(volatile jbyte* p, jbyte v) { specialized_release_store(p, v); } -inline void OrderAccess::release_store(volatile jshort* p, jshort v) { specialized_release_store(p, v); } -inline void OrderAccess::release_store(volatile jint* p, jint v) { specialized_release_store(p, v); } -inline void OrderAccess::release_store(volatile jlong* p, jlong v) { specialized_release_store(p, v); } -inline void OrderAccess::release_store(volatile jfloat* p, jfloat v) { specialized_release_store(p, v); } -inline void OrderAccess::release_store(volatile jdouble* p, jdouble v) { specialized_release_store(p, v); } -inline void OrderAccess::release_store(volatile jubyte* p, jubyte v) { specialized_release_store((volatile jbyte*) p, (jbyte) v); } -inline void OrderAccess::release_store(volatile jushort* p, jushort v) { specialized_release_store((volatile jshort*)p, (jshort)v); } -inline void OrderAccess::release_store(volatile juint* p, juint v) { specialized_release_store((volatile jint*) p, (jint) v); } -inline void OrderAccess::release_store(volatile julong* p, julong v) { specialized_release_store((volatile jlong*) p, (jlong) v); } +inline void* OrderAccess::load_ptr_acquire(const volatile void* p) { + return load_acquire(static_cast(p)); +} -inline void OrderAccess::release_store_ptr(volatile intptr_t* p, intptr_t v) { specialized_release_store(p, v); } -inline void OrderAccess::release_store_ptr(volatile void* p, void* v) { specialized_release_store((volatile intptr_t*)p, (intptr_t)v); } +template +inline void OrderAccess::release_store(volatile D* p, T v) { + StoreImpl >()(v, p); +} -inline void OrderAccess::release_store_fence(volatile jbyte* p, jbyte v) { specialized_release_store_fence(p, v); } -inline void OrderAccess::release_store_fence(volatile jshort* p, jshort v) { specialized_release_store_fence(p, v); } -inline void OrderAccess::release_store_fence(volatile jint* p, jint v) { specialized_release_store_fence(p, v); } -inline void OrderAccess::release_store_fence(volatile jlong* p, jlong v) { specialized_release_store_fence(p, v); } -inline void OrderAccess::release_store_fence(volatile jfloat* p, jfloat v) { specialized_release_store_fence(p, v); } -inline void OrderAccess::release_store_fence(volatile jdouble* p, jdouble v) { specialized_release_store_fence(p, v); } -inline void OrderAccess::release_store_fence(volatile jubyte* p, jubyte v) { specialized_release_store_fence((volatile jbyte*) p, (jbyte) v); } -inline void OrderAccess::release_store_fence(volatile jushort* p, jushort v) { specialized_release_store_fence((volatile jshort*)p, (jshort)v); } -inline void OrderAccess::release_store_fence(volatile juint* p, juint v) { specialized_release_store_fence((volatile jint*) p, (jint) v); } -inline void OrderAccess::release_store_fence(volatile julong* p, julong v) { specialized_release_store_fence((volatile jlong*) p, (jlong) v); } +inline void OrderAccess::release_store_ptr(volatile intptr_t* p, intptr_t v) { release_store(p, v); } +inline void OrderAccess::release_store_ptr(volatile void* p, void* v) { release_store(static_cast(p), v); } -inline void OrderAccess::release_store_ptr_fence(volatile intptr_t* p, intptr_t v) { specialized_release_store_fence(p, v); } -inline void OrderAccess::release_store_ptr_fence(volatile void* p, void* v) { specialized_release_store_fence((volatile intptr_t*)p, (intptr_t)v); } +template +inline void OrderAccess::release_store_fence(volatile D* p, T v) { + StoreImpl >()(v, p); +} -// The following methods can be specialized using simple template specialization -// in the platform specific files for optimization purposes. Otherwise the -// generalized variant is used. -template inline T OrderAccess::specialized_load_acquire (const volatile T* p) { return ordered_load(p); } -template inline void OrderAccess::specialized_release_store (volatile T* p, T v) { ordered_store(p, v); } -template inline void OrderAccess::specialized_release_store_fence(volatile T* p, T v) { ordered_store(p, v); } - -// Generalized atomic volatile accesses valid in OrderAccess -// All other types can be expressed in terms of these. -inline void OrderAccess::store(volatile jbyte* p, jbyte v) { *p = v; } -inline void OrderAccess::store(volatile jshort* p, jshort v) { *p = v; } -inline void OrderAccess::store(volatile jint* p, jint v) { *p = v; } -inline void OrderAccess::store(volatile jlong* p, jlong v) { Atomic::store(v, p); } -inline void OrderAccess::store(volatile jdouble* p, jdouble v) { Atomic::store(jlong_cast(v), (volatile jlong*)p); } -inline void OrderAccess::store(volatile jfloat* p, jfloat v) { *p = v; } - -inline jbyte OrderAccess::load(const volatile jbyte* p) { return *p; } -inline jshort OrderAccess::load(const volatile jshort* p) { return *p; } -inline jint OrderAccess::load(const volatile jint* p) { return *p; } -inline jlong OrderAccess::load(const volatile jlong* p) { return Atomic::load(p); } -inline jdouble OrderAccess::load(const volatile jdouble* p) { return jdouble_cast(Atomic::load((const volatile jlong*)p)); } -inline jfloat OrderAccess::load(const volatile jfloat* p) { return *p; } - -#endif // VM_HAS_GENERALIZED_ORDER_ACCESS +inline void OrderAccess::release_store_ptr_fence(volatile intptr_t* p, intptr_t v) { release_store_fence(p, v); } +inline void OrderAccess::release_store_ptr_fence(volatile void* p, void* v) { release_store_fence(static_cast(p), v); } #endif // SHARE_VM_RUNTIME_ORDERACCESS_INLINE_HPP From 94760c81301ddd9facd08f2f2375eda1713c698a Mon Sep 17 00:00:00 2001 From: Ioi Lam Date: Mon, 9 Oct 2017 13:11:25 -0700 Subject: [PATCH 67/80] 8188828: Intermittent ClassNotFoundException: jdk.test.lib.Platform for compiler tests As a work around, remove dependency from jdk.test.lib.FileInstaller to other classes in this library Reviewed-by: iignatyev, gtriantafill, kvn, dholmes --- test/lib/jdk/test/lib/FileInstaller.java | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/test/lib/jdk/test/lib/FileInstaller.java b/test/lib/jdk/test/lib/FileInstaller.java index 5e16b315153..73bc23f3238 100644 --- a/test/lib/jdk/test/lib/FileInstaller.java +++ b/test/lib/jdk/test/lib/FileInstaller.java @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2015, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -32,11 +32,18 @@ import java.nio.file.SimpleFileVisitor; import java.nio.file.StandardCopyOption; import java.nio.file.attribute.BasicFileAttributes; +// !!! +// NOTE: this class is widely used. DO NOT depend on any other classes in any test library, or else +// you may see intermittent ClassNotFoundException as in JDK-8188828 +// !!! + /** * Copy a resource: file or directory recursively, using relative path(src and dst) * which are applied to test source directory(src) and current directory(dst) */ public class FileInstaller { + public static final String TEST_SRC = System.getProperty("test.src", "").trim(); + /** * @param args source and destination * @throws IOException if an I/O error occurs @@ -45,7 +52,7 @@ public class FileInstaller { if (args.length != 2) { throw new IllegalArgumentException("Unexpected number of arguments for file copy"); } - Path src = Paths.get(Utils.TEST_SRC, args[0]).toAbsolutePath().normalize(); + Path src = Paths.get(TEST_SRC, args[0]).toAbsolutePath().normalize(); Path dst = Paths.get(args[1]).toAbsolutePath().normalize(); if (src.toFile().exists()) { System.out.printf("copying %s to %s%n", src, dst); From f8b593cb6645e08c7f2c5d00b3e0a5003301fa71 Mon Sep 17 00:00:00 2001 From: Jesper Wilhelmsson Date: Tue, 10 Oct 2017 03:54:49 +0200 Subject: [PATCH 68/80] 8189071: Require jtreg 4.2 b09 Reviewed-by: dholmes, gtriantafill --- make/conf/jib-profiles.js | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/make/conf/jib-profiles.js b/make/conf/jib-profiles.js index 2758d9772e1..1d1c57ecd74 100644 --- a/make/conf/jib-profiles.js +++ b/make/conf/jib-profiles.js @@ -1063,7 +1063,7 @@ var getJibProfilesDependencies = function (input, common) { jtreg: { server: "javare", revision: "4.2", - build_number: "b08", + build_number: "b09", checksum_file: "MD5_VALUES", file: "jtreg_bin-4.2.zip", environment_name: "JT_HOME", From 4c1297b778f7873df8ed04791d2d199ed97fd362 Mon Sep 17 00:00:00 2001 From: Mandy Chung Date: Tue, 10 Oct 2017 11:52:42 -0700 Subject: [PATCH 69/80] 8188052: JNI FindClass needs to specify the class loading context used for library lifecycle hooks Reviewed-by: alanb, coleenp, dholmes --- src/hotspot/share/prims/jni.cpp | 32 ++++++++++--------- src/hotspot/share/prims/jni.h | 1 + src/hotspot/share/runtime/thread.cpp | 1 + .../share/classes/java/lang/ClassLoader.java | 4 ++- src/java.base/share/native/include/jni.h | 1 + .../libmanagement_agent/FileSystemImpl.c | 2 +- .../libmanagement_agent/FileSystemImpl.c | 2 +- .../jtreg/native_sanity/JniVersion.java | 4 +-- 8 files changed, 27 insertions(+), 20 deletions(-) diff --git a/src/hotspot/share/prims/jni.cpp b/src/hotspot/share/prims/jni.cpp index 19910ed4734..454511c4fbc 100644 --- a/src/hotspot/share/prims/jni.cpp +++ b/src/hotspot/share/prims/jni.cpp @@ -92,7 +92,7 @@ #include "jvmci/jvmciRuntime.hpp" #endif -static jint CurrentVersion = JNI_VERSION_9; +static jint CurrentVersion = JNI_VERSION_10; #ifdef _WIN32 extern LONG WINAPI topLevelExceptionFilter(_EXCEPTION_POINTERS* ); @@ -401,29 +401,31 @@ JNI_ENTRY(jclass, jni_FindClass(JNIEnv *env, const char *name)) // Find calling class Klass* k = thread->security_get_caller_class(0); if (k != NULL) { - loader = Handle(THREAD, k->class_loader()); // Special handling to make sure JNI_OnLoad and JNI_OnUnload are executed // in the correct class context. - if (loader.is_null() && + if (k->class_loader() == NULL && k->name() == vmSymbols::java_lang_ClassLoader_NativeLibrary()) { JavaValue result(T_OBJECT); JavaCalls::call_static(&result, k, vmSymbols::getFromClass_name(), vmSymbols::void_class_signature(), - thread); - if (HAS_PENDING_EXCEPTION) { - Handle ex(thread, thread->pending_exception()); - CLEAR_PENDING_EXCEPTION; - THROW_HANDLE_0(ex); - } + CHECK_NULL); + // When invoked from JNI_OnLoad, NativeLibrary::getFromClass returns + // a non-NULL Class object. When invoked from JNI_OnUnload, + // it will return NULL to indicate no context. oop mirror = (oop) result.get_jobject(); - loader = Handle(THREAD, - InstanceKlass::cast(java_lang_Class::as_Klass(mirror))->class_loader()); - protection_domain = Handle(THREAD, - InstanceKlass::cast(java_lang_Class::as_Klass(mirror))->protection_domain()); + if (mirror != NULL) { + Klass* fromClass = java_lang_Class::as_Klass(mirror); + loader = Handle(THREAD, fromClass->class_loader()); + protection_domain = Handle(THREAD, fromClass->protection_domain()); + } + } else { + loader = Handle(THREAD, k->class_loader()); } - } else { - // We call ClassLoader.getSystemClassLoader to obtain the system class loader. + } + + if (loader.is_null()) { + // No context and use the system class loader loader = Handle(THREAD, SystemDictionary::java_system_loader()); } diff --git a/src/hotspot/share/prims/jni.h b/src/hotspot/share/prims/jni.h index d5de88d0dd8..49b07f1b7d1 100644 --- a/src/hotspot/share/prims/jni.h +++ b/src/hotspot/share/prims/jni.h @@ -1964,6 +1964,7 @@ JNI_OnUnload(JavaVM *vm, void *reserved); #define JNI_VERSION_1_6 0x00010006 #define JNI_VERSION_1_8 0x00010008 #define JNI_VERSION_9 0x00090000 +#define JNI_VERSION_10 0x000a0000 #ifdef __cplusplus } /* extern "C" */ diff --git a/src/hotspot/share/runtime/thread.cpp b/src/hotspot/share/runtime/thread.cpp index 9663e183340..3eca85744cd 100644 --- a/src/hotspot/share/runtime/thread.cpp +++ b/src/hotspot/share/runtime/thread.cpp @@ -4195,6 +4195,7 @@ jboolean Threads::is_supported_jni_version(jint version) { if (version == JNI_VERSION_1_6) return JNI_TRUE; if (version == JNI_VERSION_1_8) return JNI_TRUE; if (version == JNI_VERSION_9) return JNI_TRUE; + if (version == JNI_VERSION_10) return JNI_TRUE; return JNI_FALSE; } diff --git a/src/java.base/share/classes/java/lang/ClassLoader.java b/src/java.base/share/classes/java/lang/ClassLoader.java index 7815bde0c61..a949b558bff 100644 --- a/src/java.base/share/classes/java/lang/ClassLoader.java +++ b/src/java.base/share/classes/java/lang/ClassLoader.java @@ -2381,7 +2381,7 @@ public abstract class ClassLoader { private int jniVersion; // the class from which the library is loaded, also indicates // the loader this native library belongs. - private final Class fromClass; + private Class fromClass; // the canonicalized name of the native library. // or static library name String name; @@ -2404,6 +2404,8 @@ public abstract class ClassLoader { protected void finalize() { synchronized (loadedLibraryNames) { if (fromClass.getClassLoader() != null && loaded) { + this.fromClass = null; // no context when unloaded + /* remove the native library name */ int size = loadedLibraryNames.size(); for (int i = 0; i < size; i++) { diff --git a/src/java.base/share/native/include/jni.h b/src/java.base/share/native/include/jni.h index e29bf04b4cc..e15503f4d4f 100644 --- a/src/java.base/share/native/include/jni.h +++ b/src/java.base/share/native/include/jni.h @@ -1964,6 +1964,7 @@ JNI_OnUnload(JavaVM *vm, void *reserved); #define JNI_VERSION_1_6 0x00010006 #define JNI_VERSION_1_8 0x00010008 #define JNI_VERSION_9 0x00090000 +#define JNI_VERSION_10 0x000a0000 #ifdef __cplusplus } /* extern "C" */ diff --git a/src/jdk.management.agent/unix/native/libmanagement_agent/FileSystemImpl.c b/src/jdk.management.agent/unix/native/libmanagement_agent/FileSystemImpl.c index ba780592811..ad3f7b95473 100644 --- a/src/jdk.management.agent/unix/native/libmanagement_agent/FileSystemImpl.c +++ b/src/jdk.management.agent/unix/native/libmanagement_agent/FileSystemImpl.c @@ -45,7 +45,7 @@ JNIEXPORT jint JNICALL DEF_JNI_OnLoad(JavaVM *vm, void *reserved) return JNI_EVERSION; /* JNI version not supported */ } - return JNI_VERSION_9; + return JNI_VERSION_10; } /* diff --git a/src/jdk.management.agent/windows/native/libmanagement_agent/FileSystemImpl.c b/src/jdk.management.agent/windows/native/libmanagement_agent/FileSystemImpl.c index 62ad33c78b8..ea6559c2a3a 100644 --- a/src/jdk.management.agent/windows/native/libmanagement_agent/FileSystemImpl.c +++ b/src/jdk.management.agent/windows/native/libmanagement_agent/FileSystemImpl.c @@ -39,7 +39,7 @@ JNIEXPORT jint JNICALL DEF_JNI_OnLoad(JavaVM *vm, void *reserved) return JNI_EVERSION; /* JNI version not supported */ } - return JNI_VERSION_9; + return JNI_VERSION_10; } diff --git a/test/hotspot/jtreg/native_sanity/JniVersion.java b/test/hotspot/jtreg/native_sanity/JniVersion.java index e1451d2e9a5..da9149e99d3 100644 --- a/test/hotspot/jtreg/native_sanity/JniVersion.java +++ b/test/hotspot/jtreg/native_sanity/JniVersion.java @@ -27,12 +27,12 @@ */ public class JniVersion { - public static final int JNI_VERSION_9 = 0x00090000; + public static final int JNI_VERSION_10 = 0x000a0000; public static void main(String... args) throws Exception { System.loadLibrary("JniVersion"); int res = getJniVersion(); - if (res != JNI_VERSION_9) { + if (res != JNI_VERSION_10) { throw new Exception("Unexpected value returned from getJniVersion(): 0x" + Integer.toHexString(res)); } } From 449114a4f6620bf1a638a725702fb9a3f0d67fae Mon Sep 17 00:00:00 2001 From: Calvin Cheung Date: Tue, 10 Oct 2017 14:38:56 -0700 Subject: [PATCH 70/80] 8185694: Replace SystemDictionaryShared::_java_platform_loader with SystemDictionary::is_platform_class_loader() Added the creation of _java_platform_loader Reviewed-by: iklam, coleenp, mchung, dholmes, jiangli --- .../share/classfile/systemDictionary.cpp | 26 ++++++++++++++----- .../share/classfile/systemDictionary.hpp | 10 ++++--- src/hotspot/share/classfile/vmSymbols.hpp | 1 + src/hotspot/share/runtime/thread.cpp | 4 +-- 4 files changed, 30 insertions(+), 11 deletions(-) diff --git a/src/hotspot/share/classfile/systemDictionary.cpp b/src/hotspot/share/classfile/systemDictionary.cpp index ededdc3f2d0..59da43e11c4 100644 --- a/src/hotspot/share/classfile/systemDictionary.cpp +++ b/src/hotspot/share/classfile/systemDictionary.cpp @@ -104,6 +104,7 @@ InstanceKlass* SystemDictionary::_well_known_klasses[SystemDictionary::WKID InstanceKlass* SystemDictionary::_box_klasses[T_VOID+1] = { NULL /*, NULL...*/ }; oop SystemDictionary::_java_system_loader = NULL; +oop SystemDictionary::_java_platform_loader = NULL; bool SystemDictionary::_has_loadClassInternal = false; bool SystemDictionary::_has_checkPackageAccess = false; @@ -117,27 +118,38 @@ const int defaultProtectionDomainCacheSize = 1009; // ---------------------------------------------------------------------------- -// Java-level SystemLoader +// Java-level SystemLoader and PlatformLoader oop SystemDictionary::java_system_loader() { return _java_system_loader; } -void SystemDictionary::compute_java_system_loader(TRAPS) { - Klass* system_klass = WK_KLASS(ClassLoader_klass); +oop SystemDictionary::java_platform_loader() { + return _java_platform_loader; +} + +void SystemDictionary::compute_java_loaders(TRAPS) { JavaValue result(T_OBJECT); + InstanceKlass* class_loader_klass = SystemDictionary::ClassLoader_klass(); JavaCalls::call_static(&result, - WK_KLASS(ClassLoader_klass), + class_loader_klass, vmSymbols::getSystemClassLoader_name(), vmSymbols::void_classloader_signature(), CHECK); _java_system_loader = (oop)result.get_jobject(); + JavaCalls::call_static(&result, + class_loader_klass, + vmSymbols::getPlatformClassLoader_name(), + vmSymbols::void_classloader_signature(), + CHECK); + + _java_platform_loader = (oop)result.get_jobject(); + CDS_ONLY(SystemDictionaryShared::initialize(CHECK);) } - ClassLoaderData* SystemDictionary::register_loader(Handle class_loader, TRAPS) { if (class_loader() == NULL) return ClassLoaderData::the_null_class_loader_data(); return ClassLoaderDataGraph::find_or_create(class_loader, THREAD); @@ -169,7 +181,7 @@ bool SystemDictionary::is_system_class_loader(oop class_loader) { return false; } return (class_loader->klass() == SystemDictionary::jdk_internal_loader_ClassLoaders_AppClassLoader_klass() || - class_loader == _java_system_loader); + class_loader == _java_system_loader); } // Returns true if the passed class loader is the platform class loader. @@ -1940,6 +1952,7 @@ bool SystemDictionary::do_unloading(BoolObjectClosure* is_alive, void SystemDictionary::roots_oops_do(OopClosure* strong, OopClosure* weak) { strong->do_oop(&_java_system_loader); + strong->do_oop(&_java_platform_loader); strong->do_oop(&_system_loader_lock_obj); CDS_ONLY(SystemDictionaryShared::roots_oops_do(strong);) @@ -1964,6 +1977,7 @@ void SystemDictionary::roots_oops_do(OopClosure* strong, OopClosure* weak) { void SystemDictionary::oops_do(OopClosure* f) { f->do_oop(&_java_system_loader); + f->do_oop(&_java_platform_loader); f->do_oop(&_system_loader_lock_obj); CDS_ONLY(SystemDictionaryShared::oops_do(f);) diff --git a/src/hotspot/share/classfile/systemDictionary.hpp b/src/hotspot/share/classfile/systemDictionary.hpp index 4bd30563527..17da32a2859 100644 --- a/src/hotspot/share/classfile/systemDictionary.hpp +++ b/src/hotspot/share/classfile/systemDictionary.hpp @@ -484,11 +484,14 @@ public: static bool Object_klass_loaded() { return WK_KLASS(Object_klass) != NULL; } static bool ClassLoader_klass_loaded() { return WK_KLASS(ClassLoader_klass) != NULL; } - // Returns default system loader + // Returns java system loader static oop java_system_loader(); - // Compute the default system loader - static void compute_java_system_loader(TRAPS); + // Returns java platform loader + static oop java_platform_loader(); + + // Compute the java system and platform loaders + static void compute_java_loaders(TRAPS); // Register a new class loader static ClassLoaderData* register_loader(Handle class_loader, TRAPS); @@ -700,6 +703,7 @@ protected: static InstanceKlass* _box_klasses[T_VOID+1]; static oop _java_system_loader; + static oop _java_platform_loader; static bool _has_loadClassInternal; static bool _has_checkPackageAccess; diff --git a/src/hotspot/share/classfile/vmSymbols.hpp b/src/hotspot/share/classfile/vmSymbols.hpp index 65001d4cce9..88f03e5a205 100644 --- a/src/hotspot/share/classfile/vmSymbols.hpp +++ b/src/hotspot/share/classfile/vmSymbols.hpp @@ -371,6 +371,7 @@ template(deadChild_name, "deadChild") \ template(getFromClass_name, "getFromClass") \ template(dispatch_name, "dispatch") \ + template(getPlatformClassLoader_name, "getPlatformClassLoader") \ template(getSystemClassLoader_name, "getSystemClassLoader") \ template(fillInStackTrace_name, "fillInStackTrace") \ template(getCause_name, "getCause") \ diff --git a/src/hotspot/share/runtime/thread.cpp b/src/hotspot/share/runtime/thread.cpp index 3eca85744cd..41fd4cc58b4 100644 --- a/src/hotspot/share/runtime/thread.cpp +++ b/src/hotspot/share/runtime/thread.cpp @@ -3751,8 +3751,8 @@ jint Threads::create_vm(JavaVMInitArgs* args, bool* canTryAgain) { // Final system initialization including security manager and system class loader call_initPhase3(CHECK_JNI_ERR); - // cache the system class loader - SystemDictionary::compute_java_system_loader(CHECK_(JNI_ERR)); + // cache the system and platform class loaders + SystemDictionary::compute_java_loaders(CHECK_JNI_ERR); #if INCLUDE_JVMCI if (EnableJVMCI) { From ac63626f1fd0f1bc3cc1e9f62e1952efe482bc8f Mon Sep 17 00:00:00 2001 From: Mikhailo Seledtsov Date: Tue, 10 Oct 2017 19:18:36 -0700 Subject: [PATCH 71/80] 8181592: [TESTBUG] Docker test utils and docker jdk basic test Implemented docker test utilities and basic test Reviewed-by: iignatyev, lmesnik, gtriantafill --- test/hotspot/jtreg/TEST.ROOT | 3 +- .../containers/docker/DockerBasicTest.java | 83 ++++++ .../containers/docker/Dockerfile-BasicTest | 8 + .../containers/docker/HelloDocker.java | 28 ++ test/jtreg-ext/requires/VMProps.java | 34 +++ .../containers/docker/DockerRunOptions.java | 72 +++++ .../containers/docker/DockerTestUtils.java | 276 ++++++++++++++++++ 7 files changed, 503 insertions(+), 1 deletion(-) create mode 100644 test/hotspot/jtreg/runtime/containers/docker/DockerBasicTest.java create mode 100644 test/hotspot/jtreg/runtime/containers/docker/Dockerfile-BasicTest create mode 100644 test/hotspot/jtreg/runtime/containers/docker/HelloDocker.java create mode 100644 test/lib/jdk/test/lib/containers/docker/DockerRunOptions.java create mode 100644 test/lib/jdk/test/lib/containers/docker/DockerTestUtils.java diff --git a/test/hotspot/jtreg/TEST.ROOT b/test/hotspot/jtreg/TEST.ROOT index ea7ebb451ee..69eca8ec107 100644 --- a/test/hotspot/jtreg/TEST.ROOT +++ b/test/hotspot/jtreg/TEST.ROOT @@ -53,7 +53,8 @@ requires.properties= \ vm.rtm.os \ vm.aot \ vm.cds \ - vm.graal.enabled + vm.graal.enabled \ + docker.support # Minimum jtreg version requiredVersion=4.2 b08 diff --git a/test/hotspot/jtreg/runtime/containers/docker/DockerBasicTest.java b/test/hotspot/jtreg/runtime/containers/docker/DockerBasicTest.java new file mode 100644 index 00000000000..41867e74b89 --- /dev/null +++ b/test/hotspot/jtreg/runtime/containers/docker/DockerBasicTest.java @@ -0,0 +1,83 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + + +/* + * @test + * @summary Basic (sanity) test for JDK-under-test inside a docker image. + * @requires (docker.support) + * @library /test/lib + * @modules java.base/jdk.internal.misc + * java.management + * jdk.jartool/sun.tools.jar + * @build HelloDocker + * @run driver DockerBasicTest + */ +import jdk.test.lib.containers.docker.DockerRunOptions; +import jdk.test.lib.containers.docker.DockerTestUtils; +import jdk.test.lib.Platform; +import jdk.test.lib.Utils; + + +public class DockerBasicTest { + private static final String imageNameAndTag = "jdk10-internal:test"; + // Diganostics: set to false to examine image after the test + private static final boolean removeImageAfterTest = true; + + public static void main(String[] args) throws Exception { + if (!DockerTestUtils.canTestDocker()) { + return; + } + + DockerTestUtils.buildJdkDockerImage(imageNameAndTag, "Dockerfile-BasicTest", "jdk-docker"); + + try { + testJavaVersion(); + testHelloDocker(); + } finally { + if (removeImageAfterTest) + DockerTestUtils.removeDockerImage(imageNameAndTag); + } + } + + + private static void testJavaVersion() throws Exception { + DockerTestUtils.dockerRunJava( + new DockerRunOptions(imageNameAndTag, "/jdk/bin/java", "-version")) + .shouldHaveExitValue(0) + .shouldContain(Platform.vmName); + } + + + private static void testHelloDocker() throws Exception { + DockerRunOptions opts = + new DockerRunOptions(imageNameAndTag, "/jdk/bin/java", "HelloDocker") + .addJavaOpts("-cp", "/test-classes/") + .addDockerOpts("--volume", Utils.TEST_CLASSES + ":/test-classes/"); + + DockerTestUtils.dockerRunJava(opts) + .shouldHaveExitValue(0) + .shouldContain("Hello Docker"); + } + +} diff --git a/test/hotspot/jtreg/runtime/containers/docker/Dockerfile-BasicTest b/test/hotspot/jtreg/runtime/containers/docker/Dockerfile-BasicTest new file mode 100644 index 00000000000..166c969289e --- /dev/null +++ b/test/hotspot/jtreg/runtime/containers/docker/Dockerfile-BasicTest @@ -0,0 +1,8 @@ +FROM oraclelinux:7.2 +MAINTAINER mikhailo.seledtsov@oracle.com + +COPY /jdk /jdk + +ENV JAVA_HOME=/jdk + +CMD ["/bin/bash"] diff --git a/test/hotspot/jtreg/runtime/containers/docker/HelloDocker.java b/test/hotspot/jtreg/runtime/containers/docker/HelloDocker.java new file mode 100644 index 00000000000..9b5f56035b3 --- /dev/null +++ b/test/hotspot/jtreg/runtime/containers/docker/HelloDocker.java @@ -0,0 +1,28 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +public class HelloDocker { + public static void main(String args[]) { + System.out.println("Hello Docker"); + } +} diff --git a/test/jtreg-ext/requires/VMProps.java b/test/jtreg-ext/requires/VMProps.java index c507a8c74c3..63c9ae9b049 100644 --- a/test/jtreg-ext/requires/VMProps.java +++ b/test/jtreg-ext/requires/VMProps.java @@ -32,6 +32,7 @@ import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.concurrent.Callable; +import java.util.concurrent.TimeUnit; import java.util.regex.Matcher; import java.util.regex.Pattern; @@ -75,6 +76,7 @@ public class VMProps implements Callable> { map.put("vm.cds", vmCDS()); // vm.graal.enabled is true if Graal is used as JIT map.put("vm.graal.enabled", isGraalEnabled()); + map.put("docker.support", dockerSupport()); vmGC(map); // vm.gc.X = true/false VMProps.dump(map); @@ -329,6 +331,38 @@ public class VMProps implements Callable> { return "true"; } + + /** + * A simple check for docker support + * + * @return true if docker is supported in a given environment + */ + protected String dockerSupport() { + // currently docker testing is only supported for Linux-x64 + if (! ( Platform.isLinux() && Platform.isX64() ) ) + return "false"; + + boolean isSupported; + try { + isSupported = checkDockerSupport(); + } catch (Exception e) { + isSupported = false; + System.err.println("dockerSupport() threw exception: " + e); + } + + return (isSupported) ? "true" : "false"; + } + + private boolean checkDockerSupport() throws IOException, InterruptedException { + ProcessBuilder pb = new ProcessBuilder("docker", "ps"); + Process p = pb.start(); + p.waitFor(10, TimeUnit.SECONDS); + + return (p.exitValue() == 0); + } + + + /** * Dumps the map to the file if the file name is given as the property. * This functionality could be helpful to know context in the real diff --git a/test/lib/jdk/test/lib/containers/docker/DockerRunOptions.java b/test/lib/jdk/test/lib/containers/docker/DockerRunOptions.java new file mode 100644 index 00000000000..254edb86cb7 --- /dev/null +++ b/test/lib/jdk/test/lib/containers/docker/DockerRunOptions.java @@ -0,0 +1,72 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ +package jdk.test.lib.containers.docker; + +import java.util.ArrayList; +import java.util.Collections; + + +// This class represents options for running java inside docker containers +// in test environment. +public class DockerRunOptions { + public String imageNameAndTag; + public ArrayList dockerOpts = new ArrayList(); + public String command; // normally a full path to java + public ArrayList javaOpts = new ArrayList(); + public String classToRun; // class or "-version" + public ArrayList classParams = new ArrayList(); + + public boolean tty = true; + public boolean removeContainerAfterUse = true; + public boolean appendTestJavaOptions = true; + public boolean retainChildStdout = false; + + /** + * Convenience constructor for most common use cases in testing. + * @param imageNameAndTag a string representing name and tag for the + * docker image to run, as "name:tag" + * @param javaCmd a java command to run (e.g. /jdk/bin/java) + * @param classToRun a class to run, or "-version" + * @param javaOpts java options to use + * + * @return Default docker run options + */ + public DockerRunOptions(String imageNameAndTag, String javaCmd, + String classToRun, String... javaOpts) { + this.imageNameAndTag = imageNameAndTag; + this.command = javaCmd; + this.classToRun = classToRun; + this.addJavaOpts(javaOpts); + } + + public DockerRunOptions addDockerOpts(String... opts) { + Collections.addAll(dockerOpts, opts); + return this; + } + + public DockerRunOptions addJavaOpts(String... opts) { + Collections.addAll(javaOpts, opts); + return this; + } + +} diff --git a/test/lib/jdk/test/lib/containers/docker/DockerTestUtils.java b/test/lib/jdk/test/lib/containers/docker/DockerTestUtils.java new file mode 100644 index 00000000000..b9b84dbd29f --- /dev/null +++ b/test/lib/jdk/test/lib/containers/docker/DockerTestUtils.java @@ -0,0 +1,276 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ +package jdk.test.lib.containers.docker; + +import java.io.File; +import java.io.IOException; +import java.nio.file.Files; +import java.nio.file.FileVisitResult; +import java.nio.file.Path; +import java.nio.file.Paths; +import java.nio.file.SimpleFileVisitor; +import java.nio.file.StandardCopyOption; +import java.nio.file.attribute.BasicFileAttributes; +import java.util.ArrayList; +import java.util.Collections; +import java.util.List; +import jdk.test.lib.Utils; +import jdk.test.lib.process.OutputAnalyzer; +import jdk.test.lib.process.ProcessTools; + + +public class DockerTestUtils { + private static final String FS = File.separator; + private static boolean isDockerEngineAvailable = false; + private static boolean wasDockerEngineChecked = false; + + // Diagnostics: set to true to enable more diagnostic info + private static final boolean DEBUG = false; + + /** + * Optimized check of whether the docker engine is available in a given + * environment. Checks only once, then remembers the result in a singleton. + * + * @return true if docker engine is available + * @throws Exception + */ + public static boolean isDockerEngineAvailable() throws Exception { + if (wasDockerEngineChecked) + return isDockerEngineAvailable; + + isDockerEngineAvailable = isDockerEngineAvailableCheck(); + wasDockerEngineChecked = true; + return isDockerEngineAvailable; + } + + + /** + * Convenience method, will check if docker engine is available and usable; + * will print the appropriate message when not available. + * + * @return true if docker engine is available + * @throws Exception + */ + public static boolean canTestDocker() throws Exception { + if (isDockerEngineAvailable()) { + return true; + } else { + System.out.println("Docker engine is not available on this system"); + System.out.println("This test is SKIPPED"); + return false; + } + } + + + /** + * Simple check - is docker engine available, accessible and usable. + * Run basic docker command: 'docker ps' - list docker instances. + * If docker engine is available and accesible then true is returned + * and we can proceed with testing docker. + * + * @return true if docker engine is available and usable + * @throws Exception + */ + private static boolean isDockerEngineAvailableCheck() throws Exception { + try { + execute("docker", "ps") + .shouldHaveExitValue(0) + .shouldContain("CONTAINER") + .shouldContain("IMAGE"); + } catch (Exception e) { + return false; + } + return true; + } + + + /** + * Build a docker image that contains JDK under test. + * The jdk will be placed under the "/jdk/" folder inside the docker file system. + * + * @param imageName name of the image to be created, including version tag + * @param dockerfile name of the dockerfile residing in the test source + * @param buildDirName name of the docker build/staging directory, which will + * be created in the jtreg's scratch folder + * @throws Exception + */ + public static void + buildJdkDockerImage(String imageName, String dockerfile, String buildDirName) + throws Exception { + + Path buildDir = Paths.get(".", buildDirName); + if (Files.exists(buildDir)) { + throw new RuntimeException("The docker build directory already exists: " + buildDir); + } + + Path jdkSrcDir = Paths.get(Utils.TEST_JDK); + Path jdkDstDir = buildDir.resolve("jdk"); + + Files.createDirectories(jdkDstDir); + + // Copy JDK-under-test tree to the docker build directory. + // This step is required for building a docker image. + Files.walkFileTree(jdkSrcDir, new CopyFileVisitor(jdkSrcDir, jdkDstDir)); + buildDockerImage(imageName, Paths.get(Utils.TEST_SRC, dockerfile), buildDir); + } + + + /** + * Build a docker image based on given docker file and docker build directory. + * + * @param imageName name of the image to be created, including version tag + * @param dockerfile path to the Dockerfile to be used for building the docker + * image. The specified dockerfile will be copied to the docker build + * directory as 'Dockerfile' + * @param buildDir build directory; it should already contain all the content + * needed to build the docker image. + * @throws Exception + */ + public static void + buildDockerImage(String imageName, Path dockerfile, Path buildDir) throws Exception { + + // Copy docker file to the build dir + Files.copy(dockerfile, buildDir.resolve("Dockerfile")); + + // Build the docker + execute("docker", "build", buildDir.toString(), "--no-cache", "--tag", imageName) + .shouldHaveExitValue(0) + .shouldContain("Successfully built"); + } + + + /** + * Run Java inside the docker image with specified parameters and options. + * + * @param DockerRunOptions optins for running docker + * + * @return output of the run command + * @throws Exception + */ + public static OutputAnalyzer dockerRunJava(DockerRunOptions opts) throws Exception { + ArrayList cmd = new ArrayList<>(); + + cmd.add("docker"); + cmd.add("run"); + if (opts.tty) + cmd.add("--tty=true"); + if (opts.removeContainerAfterUse) + cmd.add("--rm"); + + cmd.addAll(opts.dockerOpts); + cmd.add(opts.imageNameAndTag); + cmd.add(opts.command); + + cmd.addAll(opts.javaOpts); + if (opts.appendTestJavaOptions) { + Collections.addAll(cmd, Utils.getTestJavaOpts()); + } + + cmd.add(opts.classToRun); + cmd.addAll(opts.classParams); + + return execute(cmd); + } + + + /** + * Remove docker image + * + * @param DockerRunOptions optins for running docker + * @return output of the command + * @throws Exception + */ + public static OutputAnalyzer removeDockerImage(String imageNameAndTag) throws Exception { + return execute("docker", "rmi", "--force", imageNameAndTag); + } + + + + /** + * Convenience method - express command as sequence of strings + * + * @param command to execute + * @return The output from the process + * @throws Exception + */ + public static OutputAnalyzer execute(List command) throws Exception { + return execute(command.toArray(new String[command.size()])); + } + + + /** + * Execute a specified command in a process, report diagnostic info. + * + * @param command to be executed + * @return The output from the process + * @throws Exception + */ + public static OutputAnalyzer execute(String... command) throws Exception { + + ProcessBuilder pb = new ProcessBuilder(command); + System.out.println("[COMMAND]\n" + Utils.getCommandLine(pb)); + + long started = System.currentTimeMillis(); + OutputAnalyzer output = new OutputAnalyzer(pb.start()); + + System.out.println("[ELAPSED: " + (System.currentTimeMillis() - started) + " ms]"); + System.out.println("[STDERR]\n" + output.getStderr()); + System.out.println("[STDOUT]\n" + output.getStdout()); + + return output; + } + + + private static class CopyFileVisitor extends SimpleFileVisitor { + private final Path src; + private final Path dst; + + public CopyFileVisitor(Path src, Path dst) { + this.src = src; + this.dst = dst; + } + + + @Override + public FileVisitResult preVisitDirectory(Path file, + BasicFileAttributes attrs) throws IOException { + Path dstDir = dst.resolve(src.relativize(file)); + if (!dstDir.toFile().exists()) { + Files.createDirectories(dstDir); + } + return FileVisitResult.CONTINUE; + } + + + @Override + public FileVisitResult visitFile(Path file, + BasicFileAttributes attrs) throws IOException { + if (!file.toFile().isFile()) { + return FileVisitResult.CONTINUE; + } + Path dstFile = dst.resolve(src.relativize(file)); + Files.copy(file, dstFile, StandardCopyOption.COPY_ATTRIBUTES); + return FileVisitResult.CONTINUE; + } + } +} From b5dd6a9a45b8e9120733798b915eb8111a7c65ef Mon Sep 17 00:00:00 2001 From: Erik Helin Date: Fri, 15 Sep 2017 14:47:13 +0200 Subject: [PATCH 72/80] 8187578: BitMap::reallocate should check if old_map is NULL Reviewed-by: stefank, eosterlund, dholmes --- src/hotspot/share/utilities/bitMap.cpp | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/src/hotspot/share/utilities/bitMap.cpp b/src/hotspot/share/utilities/bitMap.cpp index 21a3229411b..687b98e7085 100644 --- a/src/hotspot/share/utilities/bitMap.cpp +++ b/src/hotspot/share/utilities/bitMap.cpp @@ -81,8 +81,10 @@ BitMap::bm_word_t* BitMap::reallocate(const Allocator& allocator, bm_word_t* old if (new_size_in_words > 0) { map = allocator.allocate(new_size_in_words); - Copy::disjoint_words((HeapWord*)old_map, (HeapWord*) map, - MIN2(old_size_in_words, new_size_in_words)); + if (old_map != NULL) { + Copy::disjoint_words((HeapWord*)old_map, (HeapWord*) map, + MIN2(old_size_in_words, new_size_in_words)); + } if (new_size_in_words > old_size_in_words) { clear_range_of_words(map, old_size_in_words, new_size_in_words); From d3466f7dce6f541b00455ea45d2faa44becc392d Mon Sep 17 00:00:00 2001 From: Harold Seigel Date: Wed, 11 Oct 2017 10:03:22 -0400 Subject: [PATCH 73/80] 8188922: [TESTBUG] runtime/CommandLine/VMDeprecatedOptions.java fails with JDK10 release bits Add -XX:+UnlockDiagnosticVMOptions to the command line when testing a deprecated diagnostic option. Reviewed-by: coleenp, lfoltan --- .../runtime/CommandLine/VMDeprecatedOptions.java | 15 ++++++++++++++- 1 file changed, 14 insertions(+), 1 deletion(-) diff --git a/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java b/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java index d53218760ac..ab0b29d95ed 100644 --- a/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java +++ b/test/hotspot/jtreg/runtime/CommandLine/VMDeprecatedOptions.java @@ -42,7 +42,6 @@ public class VMDeprecatedOptions { // deprecated non-alias flags: {"MaxGCMinorPauseMillis", "1032"}, {"MustCallLoadClassInternal", "false"}, - {"UnsyncloadClass", "false"}, {"MaxRAMFraction", "8"}, {"MinRAMFraction", "2"}, {"InitialRAMFraction", "64"}, @@ -76,7 +75,21 @@ public class VMDeprecatedOptions { } } + // Deprecated diagnostic command line options need to be preceded on the + // command line by -XX:+UnlockDiagnosticVMOptions. + static void testDeprecatedDiagnostic(String option, String value) throws Throwable { + String XXoption = CommandLineOptionTest.prepareFlag(option, value); + ProcessBuilder processBuilder = ProcessTools.createJavaProcessBuilder( + CommandLineOptionTest.UNLOCK_DIAGNOSTIC_VM_OPTIONS, XXoption, "-version"); + OutputAnalyzer output = new OutputAnalyzer(processBuilder.start()); + // check for option deprecation message: + output.shouldHaveExitValue(0); + String match = getDeprecationString(option); + output.shouldMatch(match); + } + public static void main(String[] args) throws Throwable { testDeprecated(DEPRECATED_OPTIONS); // Make sure that each deprecated option is mentioned in the output. + testDeprecatedDiagnostic("UnsyncloadClass", "false"); } } From ccbf029d2b4d713aead707aada6a736a0999e839 Mon Sep 17 00:00:00 2001 From: Yasumasa Suenaga Date: Wed, 11 Oct 2017 23:29:24 +0900 Subject: [PATCH 74/80] 8189069: regression after push of 8187403: "AssertionFailure: addr should be OopHandle" Reviewed-by: sspitsyn, jgeorge --- .../sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java | 10 ++++------ .../classes/sun/jvm/hotspot/gc/g1/HeapRegion.java | 9 ++------- 2 files changed, 6 insertions(+), 13 deletions(-) diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java index 331a8eb1499..596db0d53a4 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/G1HeapRegionTable.java @@ -37,7 +37,6 @@ import sun.jvm.hotspot.types.AddressField; import sun.jvm.hotspot.types.CIntegerField; import sun.jvm.hotspot.types.Type; import sun.jvm.hotspot.types.TypeDataBase; -import sun.jvm.hotspot.utilities.Assert; // Mirror class for G1HeapRegionTable. It's essentially an index -> HeapRegion map. @@ -136,11 +135,10 @@ public class G1HeapRegionTable extends VMObject { } public HeapRegion getByAddress(Address addr) { - if (Assert.ASSERTS_ENABLED) { - Assert.that(addr instanceof OopHandle, "addr should be OopHandle"); - } - long biasedIndex = addr.asLongValue() >>> shiftBy(); - return new HeapRegion(addr.addOffsetToAsOopHandle(biasedIndex * HeapRegion.getPointerSize())); + long offset = biasedIndex * HeapRegion.getPointerSize(); + Address result = (addr instanceof OopHandle) ? addr.addOffsetToAsOopHandle(offset) + : addr.addOffsetTo(offset); + return new HeapRegion(result); } } diff --git a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java index 608bab9fb30..e771bb38de1 100644 --- a/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java +++ b/src/jdk.hotspot.agent/share/classes/sun/jvm/hotspot/gc/g1/HeapRegion.java @@ -38,7 +38,6 @@ import sun.jvm.hotspot.types.AddressField; import sun.jvm.hotspot.types.CIntegerField; import sun.jvm.hotspot.types.Type; import sun.jvm.hotspot.types.TypeDataBase; -import sun.jvm.hotspot.utilities.Assert; // Mirror class for HeapRegion. Currently we don't actually include // any of its fields but only iterate over it. @@ -76,12 +75,8 @@ public class HeapRegion extends CompactibleSpace { public HeapRegion(Address addr) { super(addr); - - if (Assert.ASSERTS_ENABLED) { - Assert.that(addr instanceof OopHandle, "addr should be OopHandle"); - } - - Address typeAddr = addr.addOffsetToAsOopHandle(typeFieldOffset); + Address typeAddr = (addr instanceof OopHandle) ? addr.addOffsetToAsOopHandle(typeFieldOffset) + : addr.addOffsetTo(typeFieldOffset); type = (HeapRegionType)VMObjectFactory.newObject(HeapRegionType.class, typeAddr); } From c0c2da94f435e967e864eb78dff7e1dfb6b6f50b Mon Sep 17 00:00:00 2001 From: Igor Veresov Date: Wed, 11 Oct 2017 16:19:09 -0700 Subject: [PATCH 75/80] 8189183: [AOT] Fix eclipse project generation after repo consolidation Reviewed-by: dlong --- .../hotspot/templates/eclipse/cproject | 2 +- src/hotspot/.mx.jvmci/mx_jvmci.py | 24 +++++++---- src/hotspot/.mx.jvmci/suite.py | 42 +++++++++---------- .../.mx.graal/suite.py | 2 +- 4 files changed, 37 insertions(+), 33 deletions(-) diff --git a/src/hotspot/.mx.jvmci/hotspot/templates/eclipse/cproject b/src/hotspot/.mx.jvmci/hotspot/templates/eclipse/cproject index b156340e98b..6f2353059e7 100644 --- a/src/hotspot/.mx.jvmci/hotspot/templates/eclipse/cproject +++ b/src/hotspot/.mx.jvmci/hotspot/templates/eclipse/cproject @@ -70,7 +70,7 @@ - + diff --git a/src/hotspot/.mx.jvmci/mx_jvmci.py b/src/hotspot/.mx.jvmci/mx_jvmci.py index 37a9baff97e..5b582b3d45d 100644 --- a/src/hotspot/.mx.jvmci/mx_jvmci.py +++ b/src/hotspot/.mx.jvmci/mx_jvmci.py @@ -256,14 +256,10 @@ class HotSpotProject(mx.NativeProject): """ roots = [ - 'ASSEMBLY_EXCEPTION', - 'LICENSE', - 'README', - 'THIRD_PARTY_README', - 'agent', - 'make', - 'src', - 'test' + 'cpu', + 'os', + 'os_cpu', + 'share' ] for jvmVariant in _jdkJvmVariants: @@ -605,6 +601,16 @@ def _get_openjdk_cpu(): def _get_openjdk_os_cpu(): return _get_openjdk_os() + '-' + _get_openjdk_cpu() +def _get_jdk_dir(): + suiteParentDir = dirname(_suite.dir) + # suitParentDir is now something like: /some_prefix/jdk10-hs/open/src + pathComponents = suiteParentDir.split(os.sep) + for i in range(0, len(pathComponents)): + if pathComponents[i] in ["open", "src"]: + del pathComponents[i:] + break + return os.path.join(os.sep, *pathComponents) + def _get_jdk_build_dir(debugLevel=None): """ Gets the directory into which the JDK is built. This directory contains @@ -613,7 +619,7 @@ def _get_jdk_build_dir(debugLevel=None): if debugLevel is None: debugLevel = _vm.debugLevel name = '{}-{}-{}-{}'.format(_get_openjdk_os_cpu(), 'normal', _vm.jvmVariant, debugLevel) - return join(dirname(_suite.dir), 'build', name) + return join(_get_jdk_dir(), 'build', name) _jvmci_bootclasspath_prepends = [] diff --git a/src/hotspot/.mx.jvmci/suite.py b/src/hotspot/.mx.jvmci/suite.py index 9415623d92b..edea9f2d82e 100644 --- a/src/hotspot/.mx.jvmci/suite.py +++ b/src/hotspot/.mx.jvmci/suite.py @@ -24,9 +24,7 @@ suite = { "defaultLicense" : "GPLv2-CPE", - # This puts mx/ as a sibling of the JDK build configuration directories - # (e.g., macosx-x86_64-normal-server-release). - "outputRoot" : "../build/mx/hotspot", + "outputRoot" : "../../build/mx/hotspot", # ------------- Libraries ------------- @@ -43,7 +41,7 @@ suite = { # ------------- JVMCI:Service ------------- "jdk.vm.ci.services" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "javaCompliance" : "9", "workingSets" : "API,JVMCI", @@ -52,7 +50,7 @@ suite = { # ------------- JVMCI:API ------------- "jdk.vm.ci.common" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "checkstyle" : "jdk.vm.ci.services", "javaCompliance" : "9", @@ -60,7 +58,7 @@ suite = { }, "jdk.vm.ci.meta" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "checkstyle" : "jdk.vm.ci.services", "javaCompliance" : "9", @@ -68,7 +66,7 @@ suite = { }, "jdk.vm.ci.code" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : ["jdk.vm.ci.meta"], "checkstyle" : "jdk.vm.ci.services", @@ -77,7 +75,7 @@ suite = { }, "jdk.vm.ci.code.test" : { - "subDir" : "test/compiler/jvmci", + "subDir" : "../../test/hotspot/jtreg/compiler/jvmci", "sourceDirs" : ["src"], "dependencies" : [ "mx:JUNIT", @@ -92,7 +90,7 @@ suite = { }, "jdk.vm.ci.runtime" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : [ "jdk.vm.ci.code", @@ -104,7 +102,7 @@ suite = { }, "jdk.vm.ci.runtime.test" : { - "subDir" : "test/compiler/jvmci", + "subDir" : "../../test/hotspot/jtreg/compiler/jvmci", "sourceDirs" : ["src"], "dependencies" : [ "mx:JUNIT", @@ -119,7 +117,7 @@ suite = { # ------------- JVMCI:HotSpot ------------- "jdk.vm.ci.aarch64" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : ["jdk.vm.ci.code"], "checkstyle" : "jdk.vm.ci.services", @@ -128,7 +126,7 @@ suite = { }, "jdk.vm.ci.amd64" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : ["jdk.vm.ci.code"], "checkstyle" : "jdk.vm.ci.services", @@ -137,7 +135,7 @@ suite = { }, "jdk.vm.ci.sparc" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : ["jdk.vm.ci.code"], "checkstyle" : "jdk.vm.ci.services", @@ -146,7 +144,7 @@ suite = { }, "jdk.vm.ci.hotspot" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : [ "jdk.vm.ci.common", @@ -163,7 +161,7 @@ suite = { }, "jdk.vm.ci.hotspot.test" : { - "subDir" : "test/compiler/jvmci", + "subDir" : "../../test/hotspot/jtreg/compiler/jvmci", "sourceDirs" : ["src"], "dependencies" : [ "TESTNG", @@ -175,7 +173,7 @@ suite = { }, "jdk.vm.ci.hotspot.aarch64" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : [ "jdk.vm.ci.aarch64", @@ -187,7 +185,7 @@ suite = { }, "jdk.vm.ci.hotspot.amd64" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : [ "jdk.vm.ci.amd64", @@ -199,7 +197,7 @@ suite = { }, "jdk.vm.ci.hotspot.sparc" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "sourceDirs" : ["src"], "dependencies" : [ "jdk.vm.ci.sparc", @@ -221,12 +219,12 @@ suite = { # ------------- Distributions ------------- "JVMCI_SERVICES" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "dependencies" : ["jdk.vm.ci.services"], }, "JVMCI_API" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "dependencies" : [ "jdk.vm.ci.runtime", "jdk.vm.ci.common", @@ -240,7 +238,7 @@ suite = { }, "JVMCI_HOTSPOT" : { - "subDir" : "src/jdk.internal.vm.ci/share/classes", + "subDir" : "../jdk.internal.vm.ci/share/classes", "dependencies" : [ "jdk.vm.ci.hotspot.aarch64", "jdk.vm.ci.hotspot.amd64", @@ -253,7 +251,7 @@ suite = { }, "JVMCI_TEST" : { - "subDir" : "test/compiler/jvmci", + "subDir" : "../../test/hotspot/jtreg/compiler/jvmci", "dependencies" : [ "jdk.vm.ci.runtime.test", ], diff --git a/src/jdk.internal.vm.compiler/.mx.graal/suite.py b/src/jdk.internal.vm.compiler/.mx.graal/suite.py index 6dd8b072ee2..c112ee8b289 100644 --- a/src/jdk.internal.vm.compiler/.mx.graal/suite.py +++ b/src/jdk.internal.vm.compiler/.mx.graal/suite.py @@ -6,7 +6,7 @@ suite = { # This puts mx/ as a sibling of the JDK build configuration directories # (e.g., macosx-x86_64-normal-server-release). - "outputRoot" : "../../../build/mx/hotspot", + "outputRoot" : "../../build/mx/hotspot", "jdklibraries" : { "JVMCI_SERVICES" : { From 3f2081a61866bfd0b105c43c9dd810224091908c Mon Sep 17 00:00:00 2001 From: Erik Helin Date: Mon, 18 Sep 2017 15:06:28 +0200 Subject: [PATCH 76/80] 8187667: Disable deprecation warning for readdir_r Reviewed-by: dholmes, sjohanss --- src/hotspot/os/linux/os_linux.inline.hpp | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/src/hotspot/os/linux/os_linux.inline.hpp b/src/hotspot/os/linux/os_linux.inline.hpp index a665e4c69c6..cf00c6a4621 100644 --- a/src/hotspot/os/linux/os_linux.inline.hpp +++ b/src/hotspot/os/linux/os_linux.inline.hpp @@ -98,6 +98,11 @@ inline int os::ftruncate(int fd, jlong length) { inline struct dirent* os::readdir(DIR* dirp, dirent *dbuf) { +// readdir_r has been deprecated since glibc 2.24. +// See https://sourceware.org/bugzilla/show_bug.cgi?id=19056 for more details. +#pragma GCC diagnostic push +#pragma GCC diagnostic ignored "-Wdeprecated-declarations" + dirent* p; int status; assert(dirp != NULL, "just checking"); @@ -111,6 +116,8 @@ inline struct dirent* os::readdir(DIR* dirp, dirent *dbuf) return NULL; } else return p; + +#pragma GCC diagnostic pop } inline int os::closedir(DIR *dirp) { From 4516caf1259e4ffec9da9f545fdb89b1a12c8593 Mon Sep 17 00:00:00 2001 From: Roman Kennke Date: Thu, 12 Oct 2017 15:08:19 +0200 Subject: [PATCH 77/80] 8179387: Factor out CMS specific code from GenCollectedHeap into its own subclass Reviewed-by: ehelin, coleenp --- src/hotspot/share/gc/cms/cmsHeap.cpp | 170 ++++++++++++++ src/hotspot/share/gc/cms/cmsHeap.hpp | 115 ++++++++++ .../share/gc/cms/compactibleFreeListSpace.cpp | 6 +- .../gc/cms/concurrentMarkSweepGeneration.cpp | 211 +++++++++--------- .../concurrentMarkSweepGeneration.inline.hpp | 4 +- .../gc/cms/concurrentMarkSweepThread.cpp | 10 +- .../share/gc/cms/parCardTableModRefBS.cpp | 6 +- src/hotspot/share/gc/cms/parNewGeneration.cpp | 51 +++-- src/hotspot/share/gc/cms/parNewGeneration.hpp | 11 +- .../share/gc/cms/parOopClosures.inline.hpp | 12 +- src/hotspot/share/gc/cms/vmCMSOperations.cpp | 51 ++--- .../share/gc/serial/defNewGeneration.cpp | 5 +- .../share/gc/serial/defNewGeneration.hpp | 4 +- src/hotspot/share/gc/shared/collectedHeap.hpp | 4 +- .../share/gc/shared/genCollectedHeap.cpp | 181 +-------------- .../share/gc/shared/genCollectedHeap.hpp | 98 ++++---- src/hotspot/share/memory/universe.cpp | 3 +- src/hotspot/share/services/memoryService.cpp | 3 +- 18 files changed, 538 insertions(+), 407 deletions(-) create mode 100644 src/hotspot/share/gc/cms/cmsHeap.cpp create mode 100644 src/hotspot/share/gc/cms/cmsHeap.hpp diff --git a/src/hotspot/share/gc/cms/cmsHeap.cpp b/src/hotspot/share/gc/cms/cmsHeap.cpp new file mode 100644 index 00000000000..f41da0379d0 --- /dev/null +++ b/src/hotspot/share/gc/cms/cmsHeap.cpp @@ -0,0 +1,170 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + * + */ + +#include "precompiled.hpp" +#include "gc/cms/concurrentMarkSweepThread.hpp" +#include "gc/cms/cmsHeap.hpp" +#include "gc/cms/vmCMSOperations.hpp" +#include "gc/shared/genOopClosures.inline.hpp" +#include "gc/shared/strongRootsScope.hpp" +#include "gc/shared/workgroup.hpp" +#include "oops/oop.inline.hpp" +#include "runtime/vmThread.hpp" +#include "utilities/stack.inline.hpp" + +CMSHeap::CMSHeap(GenCollectorPolicy *policy) : GenCollectedHeap(policy) { + _workers = new WorkGang("GC Thread", ParallelGCThreads, + /* are_GC_task_threads */true, + /* are_ConcurrentGC_threads */false); + _workers->initialize_workers(); +} + +jint CMSHeap::initialize() { + jint status = GenCollectedHeap::initialize(); + if (status != JNI_OK) return status; + + // If we are running CMS, create the collector responsible + // for collecting the CMS generations. + assert(collector_policy()->is_concurrent_mark_sweep_policy(), "must be CMS policy"); + create_cms_collector(); + + return JNI_OK; +} + +void CMSHeap::check_gen_kinds() { + assert(young_gen()->kind() == Generation::ParNew, + "Wrong youngest generation type"); + assert(old_gen()->kind() == Generation::ConcurrentMarkSweep, + "Wrong generation kind"); +} + +CMSHeap* CMSHeap::heap() { + CollectedHeap* heap = Universe::heap(); + assert(heap != NULL, "Uninitialized access to CMSHeap::heap()"); + assert(heap->kind() == CollectedHeap::CMSHeap, "Not a CMSHeap"); + return (CMSHeap*) heap; +} + +void CMSHeap::gc_threads_do(ThreadClosure* tc) const { + assert(workers() != NULL, "should have workers here"); + workers()->threads_do(tc); + ConcurrentMarkSweepThread::threads_do(tc); +} + +void CMSHeap::print_gc_threads_on(outputStream* st) const { + assert(workers() != NULL, "should have workers here"); + workers()->print_worker_threads_on(st); + ConcurrentMarkSweepThread::print_all_on(st); +} + +void CMSHeap::print_on_error(outputStream* st) const { + GenCollectedHeap::print_on_error(st); + st->cr(); + CMSCollector::print_on_error(st); +} + +void CMSHeap::create_cms_collector() { + assert(old_gen()->kind() == Generation::ConcurrentMarkSweep, + "Unexpected generation kinds"); + assert(gen_policy()->is_concurrent_mark_sweep_policy(), "Unexpected policy type"); + CMSCollector* collector = + new CMSCollector((ConcurrentMarkSweepGeneration*) old_gen(), + rem_set(), + gen_policy()->as_concurrent_mark_sweep_policy()); + + if (!collector->completed_initialization()) { + vm_shutdown_during_initialization("Could not create CMS collector"); + } +} + +void CMSHeap::collect(GCCause::Cause cause) { + if (should_do_concurrent_full_gc(cause)) { + // Mostly concurrent full collection. + collect_mostly_concurrent(cause); + } else { + GenCollectedHeap::collect(cause); + } +} + +bool CMSHeap::should_do_concurrent_full_gc(GCCause::Cause cause) { + switch (cause) { + case GCCause::_gc_locker: return GCLockerInvokesConcurrent; + case GCCause::_java_lang_system_gc: + case GCCause::_dcmd_gc_run: return ExplicitGCInvokesConcurrent; + default: return false; + } +} + +void CMSHeap::collect_mostly_concurrent(GCCause::Cause cause) { + assert(!Heap_lock->owned_by_self(), "Should not own Heap_lock"); + + MutexLocker ml(Heap_lock); + // Read the GC counts while holding the Heap_lock + unsigned int full_gc_count_before = total_full_collections(); + unsigned int gc_count_before = total_collections(); + { + MutexUnlocker mu(Heap_lock); + VM_GenCollectFullConcurrent op(gc_count_before, full_gc_count_before, cause); + VMThread::execute(&op); + } +} + +void CMSHeap::stop() { + ConcurrentMarkSweepThread::cmst()->stop(); +} + +void CMSHeap::cms_process_roots(StrongRootsScope* scope, + bool young_gen_as_roots, + ScanningOption so, + bool only_strong_roots, + OopsInGenClosure* root_closure, + CLDClosure* cld_closure) { + MarkingCodeBlobClosure mark_code_closure(root_closure, !CodeBlobToOopClosure::FixRelocations); + OopsInGenClosure* weak_roots = only_strong_roots ? NULL : root_closure; + CLDClosure* weak_cld_closure = only_strong_roots ? NULL : cld_closure; + + process_roots(scope, so, root_closure, weak_roots, cld_closure, weak_cld_closure, &mark_code_closure); + if (!only_strong_roots) { + process_string_table_roots(scope, root_closure); + } + + if (young_gen_as_roots && + !_process_strong_tasks->is_task_claimed(GCH_PS_younger_gens)) { + root_closure->set_generation(young_gen()); + young_gen()->oop_iterate(root_closure); + root_closure->reset_generation(); + } + + _process_strong_tasks->all_tasks_completed(scope->n_threads()); +} + +void CMSHeap::gc_prologue(bool full) { + always_do_update_barrier = false; + GenCollectedHeap::gc_prologue(full); +}; + +void CMSHeap::gc_epilogue(bool full) { + GenCollectedHeap::gc_epilogue(full); + always_do_update_barrier = true; +}; diff --git a/src/hotspot/share/gc/cms/cmsHeap.hpp b/src/hotspot/share/gc/cms/cmsHeap.hpp new file mode 100644 index 00000000000..94a8037cbca --- /dev/null +++ b/src/hotspot/share/gc/cms/cmsHeap.hpp @@ -0,0 +1,115 @@ +/* + * Copyright (c) 2017, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + * + */ + +#ifndef SHARE_VM_GC_CMS_CMSHEAP_HPP +#define SHARE_VM_GC_CMS_CMSHEAP_HPP + +#include "gc/cms/concurrentMarkSweepGeneration.hpp" +#include "gc/shared/collectedHeap.hpp" +#include "gc/shared/gcCause.hpp" +#include "gc/shared/genCollectedHeap.hpp" + +class CLDClosure; +class GenCollectorPolicy; +class OopsInGenClosure; +class outputStream; +class StrongRootsScope; +class ThreadClosure; +class WorkGang; + +class CMSHeap : public GenCollectedHeap { +public: + CMSHeap(GenCollectorPolicy *policy); + + // Returns JNI_OK on success + virtual jint initialize(); + + virtual void check_gen_kinds(); + + // Convenience function to be used in situations where the heap type can be + // asserted to be this type. + static CMSHeap* heap(); + + virtual Name kind() const { + return CollectedHeap::CMSHeap; + } + + virtual const char* name() const { + return "Concurrent Mark Sweep"; + } + + WorkGang* workers() const { return _workers; } + + virtual void print_gc_threads_on(outputStream* st) const; + virtual void gc_threads_do(ThreadClosure* tc) const; + virtual void print_on_error(outputStream* st) const; + + // Perform a full collection of the heap; intended for use in implementing + // "System.gc". This implies as full a collection as the CollectedHeap + // supports. Caller does not hold the Heap_lock on entry. + void collect(GCCause::Cause cause); + + bool is_in_closed_subset(const void* p) const { + return is_in_reserved(p); + } + + bool card_mark_must_follow_store() const { + return true; + } + + void stop(); + + // If "young_gen_as_roots" is false, younger generations are + // not scanned as roots; in this case, the caller must be arranging to + // scan the younger generations itself. (For example, a generation might + // explicitly mark reachable objects in younger generations, to avoid + // excess storage retention.) + void cms_process_roots(StrongRootsScope* scope, + bool young_gen_as_roots, + ScanningOption so, + bool only_strong_roots, + OopsInGenClosure* root_closure, + CLDClosure* cld_closure); + +private: + WorkGang* _workers; + + virtual void gc_prologue(bool full); + virtual void gc_epilogue(bool full); + + // Accessor for memory state verification support + NOT_PRODUCT( + virtual size_t skip_header_HeapWords() { return CMSCollector::skip_header_HeapWords(); } + ) + + // Returns success or failure. + void create_cms_collector(); + + // In support of ExplicitGCInvokesConcurrent functionality + bool should_do_concurrent_full_gc(GCCause::Cause cause); + + void collect_mostly_concurrent(GCCause::Cause cause); +}; + +#endif // SHARE_VM_GC_CMS_CMSHEAP_HPP diff --git a/src/hotspot/share/gc/cms/compactibleFreeListSpace.cpp b/src/hotspot/share/gc/cms/compactibleFreeListSpace.cpp index 3653c4df24f..34116c60433 100644 --- a/src/hotspot/share/gc/cms/compactibleFreeListSpace.cpp +++ b/src/hotspot/share/gc/cms/compactibleFreeListSpace.cpp @@ -23,13 +23,13 @@ */ #include "precompiled.hpp" +#include "gc/cms/cmsHeap.hpp" #include "gc/cms/cmsLockVerifier.hpp" #include "gc/cms/compactibleFreeListSpace.hpp" #include "gc/cms/concurrentMarkSweepGeneration.inline.hpp" #include "gc/cms/concurrentMarkSweepThread.hpp" #include "gc/shared/blockOffsetTable.inline.hpp" #include "gc/shared/collectedHeap.inline.hpp" -#include "gc/shared/genCollectedHeap.hpp" #include "gc/shared/space.inline.hpp" #include "gc/shared/spaceDecorator.hpp" #include "logging/log.hpp" @@ -154,7 +154,7 @@ HeapWord* CompactibleFreeListSpace::forward(oop q, size_t size, cp->space->set_compaction_top(compact_top); cp->space = cp->space->next_compaction_space(); if (cp->space == NULL) { - cp->gen = GenCollectedHeap::heap()->young_gen(); + cp->gen = CMSHeap::heap()->young_gen(); assert(cp->gen != NULL, "compaction must succeed"); cp->space = cp->gen->first_compaction_space(); assert(cp->space != NULL, "generation must have a first compaction space"); @@ -2298,7 +2298,7 @@ void CompactibleFreeListSpace::verify() const { // Iterate over all oops in the heap. Uses the _no_header version // since we are not interested in following the klass pointers. - GenCollectedHeap::heap()->oop_iterate_no_header(&cl); + CMSHeap::heap()->oop_iterate_no_header(&cl); } if (VerifyObjectStartArray) { diff --git a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp index 59161a2baa6..0cbc0642a8b 100644 --- a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp +++ b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.cpp @@ -29,6 +29,7 @@ #include "classfile/systemDictionary.hpp" #include "code/codeCache.hpp" #include "gc/cms/cmsCollectorPolicy.hpp" +#include "gc/cms/cmsHeap.hpp" #include "gc/cms/cmsOopClosures.inline.hpp" #include "gc/cms/compactibleFreeListSpace.hpp" #include "gc/cms/concurrentMarkSweepGeneration.inline.hpp" @@ -298,14 +299,14 @@ void CMSCollector::ref_processor_init() { } AdaptiveSizePolicy* CMSCollector::size_policy() { - GenCollectedHeap* gch = GenCollectedHeap::heap(); - return gch->gen_policy()->size_policy(); + CMSHeap* heap = CMSHeap::heap(); + return heap->gen_policy()->size_policy(); } void ConcurrentMarkSweepGeneration::initialize_performance_counters() { const char* gen_name = "old"; - GenCollectorPolicy* gcp = GenCollectedHeap::heap()->gen_policy(); + GenCollectorPolicy* gcp = CMSHeap::heap()->gen_policy(); // Generation Counters - generation 1, 1 subspace _gen_counters = new GenerationCounters(gen_name, 1, 1, gcp->min_old_size(), gcp->max_old_size(), &_virtual_space); @@ -354,8 +355,8 @@ void CMSStats::adjust_cms_free_adjustment_factor(bool fail, size_t free) { // young generation collection. double CMSStats::time_until_cms_gen_full() const { size_t cms_free = _cms_gen->cmsSpace()->free(); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - size_t expected_promotion = MIN2(gch->young_gen()->capacity(), + CMSHeap* heap = CMSHeap::heap(); + size_t expected_promotion = MIN2(heap->young_gen()->capacity(), (size_t) _cms_gen->gc_stats()->avg_promoted()->padded_average()); if (cms_free > expected_promotion) { // Start a cms collection if there isn't enough space to promote @@ -595,12 +596,12 @@ CMSCollector::CMSCollector(ConcurrentMarkSweepGeneration* cmsGen, assert(CGC_lock != NULL, "Where's the CGC_lock?"); // Support for parallelizing young gen rescan - GenCollectedHeap* gch = GenCollectedHeap::heap(); - assert(gch->young_gen()->kind() == Generation::ParNew, "CMS can only be used with ParNew"); - _young_gen = (ParNewGeneration*)gch->young_gen(); - if (gch->supports_inline_contig_alloc()) { - _top_addr = gch->top_addr(); - _end_addr = gch->end_addr(); + CMSHeap* heap = CMSHeap::heap(); + assert(heap->young_gen()->kind() == Generation::ParNew, "CMS can only be used with ParNew"); + _young_gen = (ParNewGeneration*)heap->young_gen(); + if (heap->supports_inline_contig_alloc()) { + _top_addr = heap->top_addr(); + _end_addr = heap->end_addr(); assert(_young_gen != NULL, "no _young_gen"); _eden_chunk_index = 0; _eden_chunk_capacity = (_young_gen->max_capacity() + CMSSamplingGrain) / CMSSamplingGrain; @@ -762,9 +763,9 @@ void ConcurrentMarkSweepGeneration::compute_new_size_free_list() { log.trace(" Maximum free fraction %f", maximum_free_percentage); log.trace(" Capacity " SIZE_FORMAT, capacity() / 1000); log.trace(" Desired capacity " SIZE_FORMAT, desired_capacity / 1000); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - assert(gch->is_old_gen(this), "The CMS generation should always be the old generation"); - size_t young_size = gch->young_gen()->capacity(); + CMSHeap* heap = CMSHeap::heap(); + assert(heap->is_old_gen(this), "The CMS generation should always be the old generation"); + size_t young_size = heap->young_gen()->capacity(); log.trace(" Young gen size " SIZE_FORMAT, young_size / 1000); log.trace(" unsafe_max_alloc_nogc " SIZE_FORMAT, unsafe_max_alloc_nogc() / 1000); log.trace(" contiguous available " SIZE_FORMAT, contiguous_available() / 1000); @@ -923,7 +924,7 @@ oop ConcurrentMarkSweepGeneration::promote(oop obj, size_t obj_size) { assert_lock_strong(freelistLock()); #ifndef PRODUCT - if (GenCollectedHeap::heap()->promotion_should_fail()) { + if (CMSHeap::heap()->promotion_should_fail()) { return NULL; } #endif // #ifndef PRODUCT @@ -1000,7 +1001,7 @@ ConcurrentMarkSweepGeneration::par_promote(int thread_num, oop old, markOop m, size_t word_sz) { #ifndef PRODUCT - if (GenCollectedHeap::heap()->promotion_should_fail()) { + if (CMSHeap::heap()->promotion_should_fail()) { return NULL; } #endif // #ifndef PRODUCT @@ -1179,10 +1180,10 @@ bool CMSCollector::shouldConcurrentCollect() { // We start a collection if we believe an incremental collection may fail; // this is not likely to be productive in practice because it's probably too // late anyway. - GenCollectedHeap* gch = GenCollectedHeap::heap(); - assert(gch->collector_policy()->is_generation_policy(), + CMSHeap* heap = CMSHeap::heap(); + assert(heap->collector_policy()->is_generation_policy(), "You may want to check the correctness of the following"); - if (gch->incremental_collection_will_fail(true /* consult_young */)) { + if (heap->incremental_collection_will_fail(true /* consult_young */)) { log.print("CMSCollector: collect because incremental collection will fail "); return true; } @@ -1294,8 +1295,8 @@ void CMSCollector::collect(bool full, } void CMSCollector::request_full_gc(unsigned int full_gc_count, GCCause::Cause cause) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); - unsigned int gc_count = gch->total_full_collections(); + CMSHeap* heap = CMSHeap::heap(); + unsigned int gc_count = heap->total_full_collections(); if (gc_count == full_gc_count) { MutexLockerEx y(CGC_lock, Mutex::_no_safepoint_check_flag); _full_gc_requested = true; @@ -1307,7 +1308,7 @@ void CMSCollector::request_full_gc(unsigned int full_gc_count, GCCause::Cause ca } bool CMSCollector::is_external_interruption() { - GCCause::Cause cause = GenCollectedHeap::heap()->gc_cause(); + GCCause::Cause cause = CMSHeap::heap()->gc_cause(); return GCCause::is_user_requested_gc(cause) || GCCause::is_serviceability_requested_gc(cause); } @@ -1456,8 +1457,8 @@ void CMSCollector::acquire_control_and_collect(bool full, // Inform cms gen if this was due to partial collection failing. // The CMS gen may use this fact to determine its expansion policy. - GenCollectedHeap* gch = GenCollectedHeap::heap(); - if (gch->incremental_collection_will_fail(false /* don't consult_young */)) { + CMSHeap* heap = CMSHeap::heap(); + if (heap->incremental_collection_will_fail(false /* don't consult_young */)) { assert(!_cmsGen->incremental_collection_failed(), "Should have been noticed, reacted to and cleared"); _cmsGen->set_incremental_collection_failed(); @@ -1489,14 +1490,14 @@ void CMSCollector::acquire_control_and_collect(bool full, // Has the GC time limit been exceeded? size_t max_eden_size = _young_gen->max_eden_size(); - GCCause::Cause gc_cause = gch->gc_cause(); + GCCause::Cause gc_cause = heap->gc_cause(); size_policy()->check_gc_overhead_limit(_young_gen->used(), _young_gen->eden()->used(), _cmsGen->max_capacity(), max_eden_size, full, gc_cause, - gch->collector_policy()); + heap->collector_policy()); // Reset the expansion cause, now that we just completed // a collection cycle. @@ -1518,21 +1519,21 @@ void CMSCollector::compute_new_size() { // A work method used by the foreground collector to do // a mark-sweep-compact. void CMSCollector::do_compaction_work(bool clear_all_soft_refs) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); STWGCTimer* gc_timer = GenMarkSweep::gc_timer(); gc_timer->register_gc_start(); SerialOldTracer* gc_tracer = GenMarkSweep::gc_tracer(); - gc_tracer->report_gc_start(gch->gc_cause(), gc_timer->gc_start()); + gc_tracer->report_gc_start(heap->gc_cause(), gc_timer->gc_start()); - gch->pre_full_gc_dump(gc_timer); + heap->pre_full_gc_dump(gc_timer); GCTraceTime(Trace, gc, phases) t("CMS:MSC"); // Temporarily widen the span of the weak reference processing to // the entire heap. - MemRegion new_span(GenCollectedHeap::heap()->reserved_region()); + MemRegion new_span(CMSHeap::heap()->reserved_region()); ReferenceProcessorSpanMutator rp_mut_span(ref_processor(), new_span); // Temporarily, clear the "is_alive_non_header" field of the // reference processor. @@ -1608,7 +1609,7 @@ void CMSCollector::do_compaction_work(bool clear_all_soft_refs) { // No longer a need to do a concurrent collection for Metaspace. MetaspaceGC::set_should_concurrent_collect(false); - gch->post_full_gc_dump(gc_timer); + heap->post_full_gc_dump(gc_timer); gc_timer->register_gc_end(); @@ -1702,7 +1703,7 @@ void CMSCollector::collect_in_background(GCCause::Cause cause) { assert(Thread::current()->is_ConcurrentGC_thread(), "A CMS asynchronous collection is only allowed on a CMS thread."); - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); { bool safepoint_check = Mutex::_no_safepoint_check_flag; MutexLockerEx hl(Heap_lock, safepoint_check); @@ -1731,8 +1732,8 @@ void CMSCollector::collect_in_background(GCCause::Cause cause) { _full_gc_requested = false; // acks all outstanding full gc requests _full_gc_cause = GCCause::_no_gc; // Signal that we are about to start a collection - gch->increment_total_full_collections(); // ... starting a collection cycle - _collection_count_start = gch->total_full_collections(); + heap->increment_total_full_collections(); // ... starting a collection cycle + _collection_count_start = heap->total_full_collections(); } size_t prev_used = _cmsGen->used(); @@ -1925,9 +1926,9 @@ void CMSCollector::register_gc_end() { } void CMSCollector::save_heap_summary() { - GenCollectedHeap* gch = GenCollectedHeap::heap(); - _last_heap_summary = gch->create_heap_summary(); - _last_metaspace_summary = gch->create_metaspace_summary(); + CMSHeap* heap = CMSHeap::heap(); + _last_heap_summary = heap->create_heap_summary(); + _last_metaspace_summary = heap->create_metaspace_summary(); } void CMSCollector::report_heap_summary(GCWhen::Type when) { @@ -2303,10 +2304,10 @@ bool CMSCollector::verify_after_remark() { assert(verification_mark_stack()->isEmpty(), "markStack should be empty"); verify_work_stacks_empty(); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - gch->ensure_parsability(false); // fill TLABs, but no need to retire them + CMSHeap* heap = CMSHeap::heap(); + heap->ensure_parsability(false); // fill TLABs, but no need to retire them // Update the saved marks which may affect the root scans. - gch->save_marks(); + heap->save_marks(); if (CMSRemarkVerifyVariant == 1) { // In this first variant of verification, we complete @@ -2329,19 +2330,19 @@ bool CMSCollector::verify_after_remark() { void CMSCollector::verify_after_remark_work_1() { ResourceMark rm; HandleMark hm; - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); // Get a clear set of claim bits for the roots processing to work with. ClassLoaderDataGraph::clear_claimed_marks(); // Mark from roots one level into CMS MarkRefsIntoClosure notOlder(_span, verification_mark_bm()); - gch->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. + heap->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. { StrongRootsScope srs(1); - gch->cms_process_roots(&srs, + heap->cms_process_roots(&srs, true, // young gen as roots GenCollectedHeap::ScanningOption(roots_scanning_options()), should_unload_classes(), @@ -2376,7 +2377,7 @@ void CMSCollector::verify_after_remark_work_1() { log.error("Failed marking verification after remark"); ResourceMark rm; LogStream ls(log.error()); - gch->print_on(&ls); + heap->print_on(&ls); fatal("CMS: failed marking verification after remark"); } } @@ -2399,7 +2400,7 @@ class VerifyCLDOopsCLDClosure : public CLDClosure { void CMSCollector::verify_after_remark_work_2() { ResourceMark rm; HandleMark hm; - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); // Get a clear set of claim bits for the roots processing to work with. ClassLoaderDataGraph::clear_claimed_marks(); @@ -2409,12 +2410,12 @@ void CMSCollector::verify_after_remark_work_2() { markBitMap()); CLDToOopClosure cld_closure(¬Older, true); - gch->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. + heap->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. { StrongRootsScope srs(1); - gch->cms_process_roots(&srs, + heap->cms_process_roots(&srs, true, // young gen as roots GenCollectedHeap::ScanningOption(roots_scanning_options()), should_unload_classes(), @@ -2803,7 +2804,7 @@ class CMSParInitialMarkTask: public CMSParMarkTask { void CMSCollector::checkpointRootsInitial() { assert(_collectorState == InitialMarking, "Wrong collector state"); check_correct_thread_executing(); - TraceCMSMemoryManagerStats tms(_collectorState,GenCollectedHeap::heap()->gc_cause()); + TraceCMSMemoryManagerStats tms(_collectorState, CMSHeap::heap()->gc_cause()); save_heap_summary(); report_heap_summary(GCWhen::BeforeGC); @@ -2844,14 +2845,14 @@ void CMSCollector::checkpointRootsInitialWork() { HandleMark hm; MarkRefsIntoClosure notOlder(_span, &_markBitMap); - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); verify_work_stacks_empty(); verify_overflow_empty(); - gch->ensure_parsability(false); // fill TLABs, but no need to retire them + heap->ensure_parsability(false); // fill TLABs, but no need to retire them // Update the saved marks which may affect the root scans. - gch->save_marks(); + heap->save_marks(); // weak reference processing has not started yet. ref_processor()->set_enqueuing_is_done(false); @@ -2872,7 +2873,7 @@ void CMSCollector::checkpointRootsInitialWork() { #endif if (CMSParallelInitialMarkEnabled) { // The parallel version. - WorkGang* workers = gch->workers(); + WorkGang* workers = heap->workers(); assert(workers != NULL, "Need parallel worker threads."); uint n_workers = workers->active_workers(); @@ -2891,11 +2892,11 @@ void CMSCollector::checkpointRootsInitialWork() { } else { // The serial version. CLDToOopClosure cld_closure(¬Older, true); - gch->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. + heap->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. StrongRootsScope srs(1); - gch->cms_process_roots(&srs, + heap->cms_process_roots(&srs, true, // young gen as roots GenCollectedHeap::ScanningOption(roots_scanning_options()), should_unload_classes(), @@ -3800,7 +3801,7 @@ size_t CMSCollector::preclean_work(bool clean_refs, bool clean_survivor) { bitMapLock()); startTimer(); unsigned int before_count = - GenCollectedHeap::heap()->total_collections(); + CMSHeap::heap()->total_collections(); SurvivorSpacePrecleanClosure sss_cl(this, _span, &_markBitMap, &_markStack, &pam_cl, before_count, CMSYield); @@ -4103,7 +4104,7 @@ void CMSCollector::checkpointRootsFinal() { // world is stopped at this checkpoint assert(SafepointSynchronize::is_at_safepoint(), "world should be stopped"); - TraceCMSMemoryManagerStats tms(_collectorState,GenCollectedHeap::heap()->gc_cause()); + TraceCMSMemoryManagerStats tms(_collectorState, CMSHeap::heap()->gc_cause()); verify_work_stacks_empty(); verify_overflow_empty(); @@ -4112,16 +4113,16 @@ void CMSCollector::checkpointRootsFinal() { _young_gen->used() / K, _young_gen->capacity() / K); { if (CMSScavengeBeforeRemark) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); // Temporarily set flag to false, GCH->do_collection will // expect it to be false and set to true - FlagSetting fl(gch->_is_gc_active, false); + FlagSetting fl(heap->_is_gc_active, false); - gch->do_collection(true, // full (i.e. force, see below) - false, // !clear_all_soft_refs - 0, // size - false, // is_tlab - GenCollectedHeap::YoungGen // type + heap->do_collection(true, // full (i.e. force, see below) + false, // !clear_all_soft_refs + 0, // size + false, // is_tlab + GenCollectedHeap::YoungGen // type ); } FreelistLocker x(this); @@ -4142,7 +4143,7 @@ void CMSCollector::checkpointRootsFinalWork() { ResourceMark rm; HandleMark hm; - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); if (should_unload_classes()) { CodeCache::gc_prologue(); @@ -4162,9 +4163,9 @@ void CMSCollector::checkpointRootsFinalWork() { // or of an indication of whether the scavenge did indeed occur, // we cannot rely on TLAB's having been filled and must do // so here just in case a scavenge did not happen. - gch->ensure_parsability(false); // fill TLAB's, but no need to retire them + heap->ensure_parsability(false); // fill TLAB's, but no need to retire them // Update the saved marks which may affect the root scans. - gch->save_marks(); + heap->save_marks(); print_eden_and_survivor_chunk_arrays(); @@ -4240,7 +4241,7 @@ void CMSCollector::checkpointRootsFinalWork() { _markStack._failed_double = 0; if ((VerifyAfterGC || VerifyDuringGC) && - GenCollectedHeap::heap()->total_collections() >= VerifyGCStartAt) { + CMSHeap::heap()->total_collections() >= VerifyGCStartAt) { verify_after_remark(); } @@ -4262,7 +4263,7 @@ void CMSParInitialMarkTask::work(uint worker_id) { // ---------- scan from roots -------------- _timer.start(); - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); ParMarkRefsIntoClosure par_mri_cl(_collector->_span, &(_collector->_markBitMap)); // ---------- young gen roots -------------- @@ -4278,12 +4279,12 @@ void CMSParInitialMarkTask::work(uint worker_id) { CLDToOopClosure cld_closure(&par_mri_cl, true); - gch->cms_process_roots(_strong_roots_scope, - false, // yg was scanned above - GenCollectedHeap::ScanningOption(_collector->CMSCollector::roots_scanning_options()), - _collector->should_unload_classes(), - &par_mri_cl, - &cld_closure); + heap->cms_process_roots(_strong_roots_scope, + false, // yg was scanned above + GenCollectedHeap::ScanningOption(_collector->CMSCollector::roots_scanning_options()), + _collector->should_unload_classes(), + &par_mri_cl, + &cld_closure); assert(_collector->should_unload_classes() || (_collector->CMSCollector::roots_scanning_options() & GenCollectedHeap::SO_AllCodeCache), "if we didn't scan the code cache, we have to be ready to drop nmethods with expired weak oops"); @@ -4387,7 +4388,7 @@ void CMSParRemarkTask::work(uint worker_id) { // ---------- rescan from roots -------------- _timer.start(); - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); ParMarkRefsIntoAndScanClosure par_mrias_cl(_collector, _collector->_span, _collector->ref_processor(), &(_collector->_markBitMap), @@ -4407,12 +4408,12 @@ void CMSParRemarkTask::work(uint worker_id) { // ---------- remaining roots -------------- _timer.reset(); _timer.start(); - gch->cms_process_roots(_strong_roots_scope, - false, // yg was scanned above - GenCollectedHeap::ScanningOption(_collector->CMSCollector::roots_scanning_options()), - _collector->should_unload_classes(), - &par_mrias_cl, - NULL); // The dirty klasses will be handled below + heap->cms_process_roots(_strong_roots_scope, + false, // yg was scanned above + GenCollectedHeap::ScanningOption(_collector->CMSCollector::roots_scanning_options()), + _collector->should_unload_classes(), + &par_mrias_cl, + NULL); // The dirty klasses will be handled below assert(_collector->should_unload_classes() || (_collector->CMSCollector::roots_scanning_options() & GenCollectedHeap::SO_AllCodeCache), @@ -4839,8 +4840,8 @@ initialize_sequential_subtasks_for_young_gen_rescan(int n_threads) { // Parallel version of remark void CMSCollector::do_remark_parallel() { - GenCollectedHeap* gch = GenCollectedHeap::heap(); - WorkGang* workers = gch->workers(); + CMSHeap* heap = CMSHeap::heap(); + WorkGang* workers = heap->workers(); assert(workers != NULL, "Need parallel worker threads."); // Choose to use the number of GC workers most recently set // into "active_workers". @@ -4856,7 +4857,7 @@ void CMSCollector::do_remark_parallel() { // the younger_gen cards, so we shouldn't call the following else // the verification code as well as subsequent younger_refs_iterate // code would get confused. XXX - // gch->rem_set()->prepare_for_younger_refs_iterate(true); // parallel + // heap->rem_set()->prepare_for_younger_refs_iterate(true); // parallel // The young gen rescan work will not be done as part of // process_roots (which currently doesn't know how to @@ -4898,7 +4899,7 @@ void CMSCollector::do_remark_parallel() { void CMSCollector::do_remark_non_parallel() { ResourceMark rm; HandleMark hm; - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); ReferenceProcessorMTDiscoveryMutator mt(ref_processor(), false); MarkRefsIntoAndScanClosure @@ -4939,7 +4940,7 @@ void CMSCollector::do_remark_non_parallel() { } } if (VerifyDuringGC && - GenCollectedHeap::heap()->total_collections() >= VerifyGCStartAt) { + CMSHeap::heap()->total_collections() >= VerifyGCStartAt) { HandleMark hm; // Discard invalid handles created during verification Universe::verify(); } @@ -4948,15 +4949,15 @@ void CMSCollector::do_remark_non_parallel() { verify_work_stacks_empty(); - gch->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. + heap->rem_set()->prepare_for_younger_refs_iterate(false); // Not parallel. StrongRootsScope srs(1); - gch->cms_process_roots(&srs, - true, // young gen as roots - GenCollectedHeap::ScanningOption(roots_scanning_options()), - should_unload_classes(), - &mrias_cl, - NULL); // The dirty klasses will be handled below + heap->cms_process_roots(&srs, + true, // young gen as roots + GenCollectedHeap::ScanningOption(roots_scanning_options()), + should_unload_classes(), + &mrias_cl, + NULL); // The dirty klasses will be handled below assert(should_unload_classes() || (roots_scanning_options() & GenCollectedHeap::SO_AllCodeCache), @@ -5148,8 +5149,8 @@ void CMSRefProcTaskProxy::do_work_steal(int i, void CMSRefProcTaskExecutor::execute(ProcessTask& task) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); - WorkGang* workers = gch->workers(); + CMSHeap* heap = CMSHeap::heap(); + WorkGang* workers = heap->workers(); assert(workers != NULL, "Need parallel worker threads."); CMSRefProcTaskProxy rp_task(task, &_collector, _collector.ref_processor()->span(), @@ -5161,8 +5162,8 @@ void CMSRefProcTaskExecutor::execute(ProcessTask& task) void CMSRefProcTaskExecutor::execute(EnqueueTask& task) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); - WorkGang* workers = gch->workers(); + CMSHeap* heap = CMSHeap::heap(); + WorkGang* workers = heap->workers(); assert(workers != NULL, "Need parallel worker threads."); CMSRefEnqueueTaskProxy enq_task(task); workers->run_task(&enq_task); @@ -5195,9 +5196,9 @@ void CMSCollector::refProcessingWork() { // and a different number of discovered lists may have Ref objects. // That is OK as long as the Reference lists are balanced (see // balance_all_queues() and balance_queues()). - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); uint active_workers = ParallelGCThreads; - WorkGang* workers = gch->workers(); + WorkGang* workers = heap->workers(); if (workers != NULL) { active_workers = workers->active_workers(); // The expectation is that active_workers will have already @@ -5305,7 +5306,7 @@ void CMSCollector::sweep() { verify_work_stacks_empty(); verify_overflow_empty(); increment_sweep_count(); - TraceCMSMemoryManagerStats tms(_collectorState,GenCollectedHeap::heap()->gc_cause()); + TraceCMSMemoryManagerStats tms(_collectorState, CMSHeap::heap()->gc_cause()); _inter_sweep_timer.stop(); _inter_sweep_estimate.sample(_inter_sweep_timer.seconds()); @@ -5378,9 +5379,9 @@ void CMSCollector::sweep() { // this generation. If such a promotion may still fail, // the flag will be set again when a young collection is // attempted. - GenCollectedHeap* gch = GenCollectedHeap::heap(); - gch->clear_incremental_collection_failed(); // Worth retrying as fresh space may have been freed up - gch->update_full_collections_completed(_collection_count_start); + CMSHeap* heap = CMSHeap::heap(); + heap->clear_incremental_collection_failed(); // Worth retrying as fresh space may have been freed up + heap->update_full_collections_completed(_collection_count_start); } // FIX ME!!! Looks like this belongs in CFLSpace, with @@ -5415,7 +5416,7 @@ void ConcurrentMarkSweepGeneration::update_gc_stats(Generation* current_generati bool full) { // If the young generation has been collected, gather any statistics // that are of interest at this point. - bool current_is_young = GenCollectedHeap::heap()->is_young_gen(current_generation); + bool current_is_young = CMSHeap::heap()->is_young_gen(current_generation); if (!full && current_is_young) { // Gather statistics on the young generation collection. collector()->stats().record_gc0_end(used()); @@ -6188,7 +6189,7 @@ size_t SurvivorSpacePrecleanClosure::do_object_careful(oop p) { do_yield_check(); } unsigned int after_count = - GenCollectedHeap::heap()->total_collections(); + CMSHeap::heap()->total_collections(); bool abort = (_before_count != after_count) || _collector->should_abort_preclean(); return abort ? 0 : size; diff --git a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.inline.hpp b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.inline.hpp index 503ef69eff0..ca61c8fd45c 100644 --- a/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.inline.hpp +++ b/src/hotspot/share/gc/cms/concurrentMarkSweepGeneration.inline.hpp @@ -25,13 +25,13 @@ #ifndef SHARE_VM_GC_CMS_CONCURRENTMARKSWEEPGENERATION_INLINE_HPP #define SHARE_VM_GC_CMS_CONCURRENTMARKSWEEPGENERATION_INLINE_HPP +#include "gc/cms/cmsHeap.hpp" #include "gc/cms/cmsLockVerifier.hpp" #include "gc/cms/compactibleFreeListSpace.hpp" #include "gc/cms/concurrentMarkSweepGeneration.hpp" #include "gc/cms/concurrentMarkSweepThread.hpp" #include "gc/cms/parNewGeneration.hpp" #include "gc/shared/gcUtil.hpp" -#include "gc/shared/genCollectedHeap.hpp" #include "utilities/align.hpp" #include "utilities/bitMap.inline.hpp" @@ -256,7 +256,7 @@ inline bool CMSCollector::should_abort_preclean() const { // scavenge is done or foreground GC wants to take over collection return _collectorState == AbortablePreclean && (_abort_preclean || _foregroundGCIsActive || - GenCollectedHeap::heap()->incremental_collection_will_fail(true /* consult_young */)); + CMSHeap::heap()->incremental_collection_will_fail(true /* consult_young */)); } inline size_t CMSCollector::get_eden_used() const { diff --git a/src/hotspot/share/gc/cms/concurrentMarkSweepThread.cpp b/src/hotspot/share/gc/cms/concurrentMarkSweepThread.cpp index 43a32e913e8..a4de148bc1a 100644 --- a/src/hotspot/share/gc/cms/concurrentMarkSweepThread.cpp +++ b/src/hotspot/share/gc/cms/concurrentMarkSweepThread.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2001, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2001, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -24,10 +24,10 @@ #include "precompiled.hpp" #include "classfile/systemDictionary.hpp" +#include "gc/cms/cmsHeap.hpp" #include "gc/cms/concurrentMarkSweepGeneration.inline.hpp" #include "gc/cms/concurrentMarkSweepThread.hpp" #include "gc/shared/gcId.hpp" -#include "gc/shared/genCollectedHeap.hpp" #include "oops/oop.inline.hpp" #include "runtime/init.hpp" #include "runtime/interfaceSupport.hpp" @@ -225,7 +225,7 @@ void ConcurrentMarkSweepThread::wait_on_cms_lock_for_scavenge(long t_millis) { // Wait time in millis or 0 value representing infinite wait for a scavenge assert(t_millis >= 0, "Wait time for scavenge should be 0 or positive"); - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); double start_time_secs = os::elapsedTime(); double end_time_secs = start_time_secs + (t_millis / ((double) MILLIUNITS)); @@ -233,7 +233,7 @@ void ConcurrentMarkSweepThread::wait_on_cms_lock_for_scavenge(long t_millis) { unsigned int before_count; { MutexLockerEx hl(Heap_lock, Mutex::_no_safepoint_check_flag); - before_count = gch->total_collections(); + before_count = heap->total_collections(); } unsigned int loop_count = 0; @@ -279,7 +279,7 @@ void ConcurrentMarkSweepThread::wait_on_cms_lock_for_scavenge(long t_millis) { unsigned int after_count; { MutexLockerEx hl(Heap_lock, Mutex::_no_safepoint_check_flag); - after_count = gch->total_collections(); + after_count = heap->total_collections(); } if(before_count != after_count) { diff --git a/src/hotspot/share/gc/cms/parCardTableModRefBS.cpp b/src/hotspot/share/gc/cms/parCardTableModRefBS.cpp index 4456fe6fc7d..085b94cb388 100644 --- a/src/hotspot/share/gc/cms/parCardTableModRefBS.cpp +++ b/src/hotspot/share/gc/cms/parCardTableModRefBS.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2007, 2015, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2007, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -23,10 +23,10 @@ */ #include "precompiled.hpp" +#include "gc/cms/cmsHeap.hpp" #include "gc/shared/cardTableModRefBS.hpp" #include "gc/shared/cardTableRS.hpp" #include "gc/shared/collectedHeap.hpp" -#include "gc/shared/genCollectedHeap.hpp" #include "gc/shared/space.inline.hpp" #include "memory/allocation.inline.hpp" #include "memory/virtualspace.hpp" @@ -394,7 +394,7 @@ get_LNC_array_for_space(Space* sp, // Do a dirty read here. If we pass the conditional then take the rare // event lock and do the read again in case some other thread had already // succeeded and done the resize. - int cur_collection = GenCollectedHeap::heap()->total_collections(); + int cur_collection = CMSHeap::heap()->total_collections(); // Updated _last_LNC_resizing_collection[i] must not be visible before // _lowest_non_clean and friends are visible. Therefore use acquire/release // to guarantee this on non TSO architecures. diff --git a/src/hotspot/share/gc/cms/parNewGeneration.cpp b/src/hotspot/share/gc/cms/parNewGeneration.cpp index b8bdd04af0a..a8c13d0e514 100644 --- a/src/hotspot/share/gc/cms/parNewGeneration.cpp +++ b/src/hotspot/share/gc/cms/parNewGeneration.cpp @@ -23,6 +23,7 @@ */ #include "precompiled.hpp" +#include "gc/cms/cmsHeap.hpp" #include "gc/cms/compactibleFreeListSpace.hpp" #include "gc/cms/concurrentMarkSweepGeneration.hpp" #include "gc/cms/parNewGeneration.inline.hpp" @@ -124,7 +125,7 @@ bool ParScanThreadState::should_be_partially_scanned(oop new_obj, oop old_obj) c void ParScanThreadState::scan_partial_array_and_push_remainder(oop old) { assert(old->is_objArray(), "must be obj array"); assert(old->is_forwarded(), "must be forwarded"); - assert(GenCollectedHeap::heap()->is_in_reserved(old), "must be in heap."); + assert(CMSHeap::heap()->is_in_reserved(old), "must be in heap."); assert(!old_gen()->is_in(old), "must be in young generation."); objArrayOop obj = objArrayOop(old->forwardee()); @@ -205,9 +206,9 @@ bool ParScanThreadState::take_from_overflow_stack() { for (size_t i = 0; i != num_take_elems; i++) { oop cur = of_stack->pop(); oop obj_to_push = cur->forwardee(); - assert(GenCollectedHeap::heap()->is_in_reserved(cur), "Should be in heap"); + assert(CMSHeap::heap()->is_in_reserved(cur), "Should be in heap"); assert(!old_gen()->is_in_reserved(cur), "Should be in young gen"); - assert(GenCollectedHeap::heap()->is_in_reserved(obj_to_push), "Should be in heap"); + assert(CMSHeap::heap()->is_in_reserved(obj_to_push), "Should be in heap"); if (should_be_partially_scanned(obj_to_push, cur)) { assert(arrayOop(cur)->length() == 0, "entire array remaining to be scanned"); obj_to_push = cur; @@ -590,7 +591,7 @@ ParNewGenTask::ParNewGenTask(ParNewGeneration* young_gen, {} void ParNewGenTask::work(uint worker_id) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); // Since this is being done in a separate thread, need new resource // and handle marks. ResourceMark rm; @@ -602,10 +603,10 @@ void ParNewGenTask::work(uint worker_id) { par_scan_state.set_young_old_boundary(_young_old_boundary); CLDScanClosure cld_scan_closure(&par_scan_state.to_space_root_closure(), - gch->rem_set()->cld_rem_set()->accumulate_modified_oops()); + heap->rem_set()->cld_rem_set()->accumulate_modified_oops()); par_scan_state.start_strong_roots(); - gch->young_process_roots(_strong_roots_scope, + heap->young_process_roots(_strong_roots_scope, &par_scan_state.to_space_root_closure(), &par_scan_state.older_gen_closure(), &cld_scan_closure); @@ -687,7 +688,7 @@ void /*ParNewGeneration::*/ParKeepAliveClosure::do_oop_work(T* p) { _par_cl->do_oop_nv(p); - if (GenCollectedHeap::heap()->is_in_reserved(p)) { + if (CMSHeap::heap()->is_in_reserved(p)) { oop obj = oopDesc::load_decode_heap_oop_not_null(p); _rs->write_ref_field_gc_par(p, obj); } @@ -714,7 +715,7 @@ void /*ParNewGeneration::*/KeepAliveClosure::do_oop_work(T* p) { _cl->do_oop_nv(p); - if (GenCollectedHeap::heap()->is_in_reserved(p)) { + if (CMSHeap::heap()->is_in_reserved(p)) { oop obj = oopDesc::load_decode_heap_oop_not_null(p); _rs->write_ref_field_gc_par(p, obj); } @@ -804,7 +805,7 @@ public: }; void ParNewRefProcTaskExecutor::execute(ProcessTask& task) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* gch = CMSHeap::heap(); WorkGang* workers = gch->workers(); assert(workers != NULL, "Need parallel worker threads."); _state_set.reset(workers->active_workers(), _young_gen.promotion_failed()); @@ -816,7 +817,7 @@ void ParNewRefProcTaskExecutor::execute(ProcessTask& task) { } void ParNewRefProcTaskExecutor::execute(EnqueueTask& task) { - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* gch = CMSHeap::heap(); WorkGang* workers = gch->workers(); assert(workers != NULL, "Need parallel worker threads."); ParNewRefEnqueueTaskProxy enq_task(task); @@ -825,8 +826,8 @@ void ParNewRefProcTaskExecutor::execute(EnqueueTask& task) { void ParNewRefProcTaskExecutor::set_single_threaded_mode() { _state_set.flush(); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - gch->save_marks(); + CMSHeap* heap = CMSHeap::heap(); + heap->save_marks(); } ScanClosureWithParBarrier:: @@ -835,10 +836,10 @@ ScanClosureWithParBarrier(ParNewGeneration* g, bool gc_barrier) : { } EvacuateFollowersClosureGeneral:: -EvacuateFollowersClosureGeneral(GenCollectedHeap* gch, +EvacuateFollowersClosureGeneral(CMSHeap* heap, OopsInGenClosure* cur, OopsInGenClosure* older) : - _gch(gch), + _heap(heap), _scan_cur_or_nonheap(cur), _scan_older(older) { } @@ -846,15 +847,15 @@ void EvacuateFollowersClosureGeneral::do_void() { do { // Beware: this call will lead to closure applications via virtual // calls. - _gch->oop_since_save_marks_iterate(GenCollectedHeap::YoungGen, - _scan_cur_or_nonheap, - _scan_older); - } while (!_gch->no_allocs_since_save_marks()); + _heap->oop_since_save_marks_iterate(GenCollectedHeap::YoungGen, + _scan_cur_or_nonheap, + _scan_older); + } while (!_heap->no_allocs_since_save_marks()); } // A Generation that does parallel young-gen collection. -void ParNewGeneration::handle_promotion_failed(GenCollectedHeap* gch, ParScanThreadStateSet& thread_state_set) { +void ParNewGeneration::handle_promotion_failed(CMSHeap* gch, ParScanThreadStateSet& thread_state_set) { assert(_promo_failure_scan_stack.is_empty(), "post condition"); _promo_failure_scan_stack.clear(true); // Clear cached segments. @@ -883,7 +884,7 @@ void ParNewGeneration::collect(bool full, bool is_tlab) { assert(full || size > 0, "otherwise we don't want to collect"); - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* gch = CMSHeap::heap(); _gc_timer->register_gc_start(); @@ -1064,7 +1065,7 @@ void ParNewGeneration::collect(bool full, } size_t ParNewGeneration::desired_plab_sz() { - return _plab_stats.desired_plab_sz(GenCollectedHeap::heap()->workers()->active_workers()); + return _plab_stats.desired_plab_sz(CMSHeap::heap()->workers()->active_workers()); } static int sum; @@ -1168,7 +1169,7 @@ oop ParNewGeneration::copy_to_survivor_space(ParScanThreadState* par_scan_state, } else { // Is in to-space; do copying ourselves. Copy::aligned_disjoint_words((HeapWord*)old, (HeapWord*)new_obj, sz); - assert(GenCollectedHeap::heap()->is_in_reserved(new_obj), "illegal forwarding pointer value."); + assert(CMSHeap::heap()->is_in_reserved(new_obj), "illegal forwarding pointer value."); forward_ptr = old->forward_to_atomic(new_obj); // Restore the mark word copied above. new_obj->set_mark(m); @@ -1475,3 +1476,9 @@ void ParNewGeneration::ref_processor_init() { const char* ParNewGeneration::name() const { return "par new generation"; } + +void ParNewGeneration::restore_preserved_marks() { + SharedRestorePreservedMarksTaskExecutor task_executor(CMSHeap::heap()->workers()); + _preserved_marks_set.restore(&task_executor); +} + diff --git a/src/hotspot/share/gc/cms/parNewGeneration.hpp b/src/hotspot/share/gc/cms/parNewGeneration.hpp index 0576e05cebd..a27c7c36c43 100644 --- a/src/hotspot/share/gc/cms/parNewGeneration.hpp +++ b/src/hotspot/share/gc/cms/parNewGeneration.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2001, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2001, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -35,6 +35,7 @@ #include "memory/padded.hpp" class ChunkArray; +class CMSHeap; class ParScanWithoutBarrierClosure; class ParScanWithBarrierClosure; class ParRootScanWithoutBarrierClosure; @@ -259,11 +260,11 @@ class KeepAliveClosure: public DefNewGeneration::KeepAliveClosure { class EvacuateFollowersClosureGeneral: public VoidClosure { private: - GenCollectedHeap* _gch; + CMSHeap* _heap; OopsInGenClosure* _scan_cur_or_nonheap; OopsInGenClosure* _scan_older; public: - EvacuateFollowersClosureGeneral(GenCollectedHeap* gch, + EvacuateFollowersClosureGeneral(CMSHeap* heap, OopsInGenClosure* cur, OopsInGenClosure* older); virtual void do_void(); @@ -336,7 +337,7 @@ class ParNewGeneration: public DefNewGeneration { static oop real_forwardee_slow(oop obj); static void waste_some_time(); - void handle_promotion_failed(GenCollectedHeap* gch, ParScanThreadStateSet& thread_state_set); + void handle_promotion_failed(CMSHeap* gch, ParScanThreadStateSet& thread_state_set); protected: @@ -345,6 +346,8 @@ class ParNewGeneration: public DefNewGeneration { bool survivor_overflow() { return _survivor_overflow; } void set_survivor_overflow(bool v) { _survivor_overflow = v; } + void restore_preserved_marks(); + public: ParNewGeneration(ReservedSpace rs, size_t initial_byte_size); diff --git a/src/hotspot/share/gc/cms/parOopClosures.inline.hpp b/src/hotspot/share/gc/cms/parOopClosures.inline.hpp index eb4dea537e4..a24f004d45a 100644 --- a/src/hotspot/share/gc/cms/parOopClosures.inline.hpp +++ b/src/hotspot/share/gc/cms/parOopClosures.inline.hpp @@ -25,10 +25,10 @@ #ifndef SHARE_VM_GC_CMS_PAROOPCLOSURES_INLINE_HPP #define SHARE_VM_GC_CMS_PAROOPCLOSURES_INLINE_HPP +#include "gc/cms/cmsHeap.hpp" #include "gc/cms/parNewGeneration.hpp" #include "gc/cms/parOopClosures.hpp" #include "gc/shared/cardTableRS.hpp" -#include "gc/shared/genCollectedHeap.hpp" #include "gc/shared/genOopClosures.inline.hpp" #include "logging/log.hpp" #include "logging/logStream.hpp" @@ -72,9 +72,9 @@ template inline void ParScanClosure::do_oop_work(T* p, bool gc_barrier, bool root_scan) { - assert((!GenCollectedHeap::heap()->is_in_reserved(p) || + assert((!CMSHeap::heap()->is_in_reserved(p) || generation()->is_in_reserved(p)) - && (GenCollectedHeap::heap()->is_young_gen(generation()) || gc_barrier), + && (CMSHeap::heap()->is_young_gen(generation()) || gc_barrier), "The gen must be right, and we must be doing the barrier " "in older generations."); T heap_oop = oopDesc::load_heap_oop(p); @@ -85,8 +85,8 @@ inline void ParScanClosure::do_oop_work(T* p, if (_g->to()->is_in_reserved(obj)) { Log(gc) log; log.error("Scanning field (" PTR_FORMAT ") twice?", p2i(p)); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - Space* sp = gch->space_containing(p); + CMSHeap* heap = CMSHeap::heap(); + Space* sp = heap->space_containing(p); oop obj = oop(sp->block_start(p)); assert((HeapWord*)obj < (HeapWord*)p, "Error"); log.error("Object: " PTR_FORMAT, p2i((void *)obj)); @@ -96,7 +96,7 @@ inline void ParScanClosure::do_oop_work(T* p, log.error("-----"); log.error("Heap:"); log.error("-----"); - gch->print_on(&ls); + heap->print_on(&ls); ShouldNotReachHere(); } #endif diff --git a/src/hotspot/share/gc/cms/vmCMSOperations.cpp b/src/hotspot/share/gc/cms/vmCMSOperations.cpp index 3aa8a0ccd6b..1c2e6a51d10 100644 --- a/src/hotspot/share/gc/cms/vmCMSOperations.cpp +++ b/src/hotspot/share/gc/cms/vmCMSOperations.cpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2005, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2005, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -23,6 +23,7 @@ */ #include "precompiled.hpp" +#include "gc/cms/cmsHeap.hpp" #include "gc/cms/concurrentMarkSweepGeneration.inline.hpp" #include "gc/cms/concurrentMarkSweepThread.hpp" #include "gc/cms/vmCMSOperations.hpp" @@ -39,19 +40,19 @@ ////////////////////////////////////////////////////////// void VM_CMS_Operation::verify_before_gc() { if (VerifyBeforeGC && - GenCollectedHeap::heap()->total_collections() >= VerifyGCStartAt) { + CMSHeap::heap()->total_collections() >= VerifyGCStartAt) { GCTraceTime(Info, gc, phases, verify) tm("Verify Before", _collector->_gc_timer_cm); HandleMark hm; FreelistLocker x(_collector); MutexLockerEx y(_collector->bitMapLock(), Mutex::_no_safepoint_check_flag); - GenCollectedHeap::heap()->prepare_for_verify(); + CMSHeap::heap()->prepare_for_verify(); Universe::verify(); } } void VM_CMS_Operation::verify_after_gc() { if (VerifyAfterGC && - GenCollectedHeap::heap()->total_collections() >= VerifyGCStartAt) { + CMSHeap::heap()->total_collections() >= VerifyGCStartAt) { GCTraceTime(Info, gc, phases, verify) tm("Verify After", _collector->_gc_timer_cm); HandleMark hm; FreelistLocker x(_collector); @@ -112,13 +113,13 @@ void VM_CMS_Initial_Mark::doit() { _collector->_gc_timer_cm->register_gc_pause_start("Initial Mark"); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - GCCauseSetter gccs(gch, GCCause::_cms_initial_mark); + CMSHeap* heap = CMSHeap::heap(); + GCCauseSetter gccs(heap, GCCause::_cms_initial_mark); VM_CMS_Operation::verify_before_gc(); IsGCActiveMark x; // stop-world GC active - _collector->do_CMS_operation(CMSCollector::CMS_op_checkpointRootsInitial, gch->gc_cause()); + _collector->do_CMS_operation(CMSCollector::CMS_op_checkpointRootsInitial, heap->gc_cause()); VM_CMS_Operation::verify_after_gc(); @@ -140,13 +141,13 @@ void VM_CMS_Final_Remark::doit() { _collector->_gc_timer_cm->register_gc_pause_start("Final Mark"); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - GCCauseSetter gccs(gch, GCCause::_cms_final_remark); + CMSHeap* heap = CMSHeap::heap(); + GCCauseSetter gccs(heap, GCCause::_cms_final_remark); VM_CMS_Operation::verify_before_gc(); IsGCActiveMark x; // stop-world GC active - _collector->do_CMS_operation(CMSCollector::CMS_op_checkpointRootsFinal, gch->gc_cause()); + _collector->do_CMS_operation(CMSCollector::CMS_op_checkpointRootsFinal, heap->gc_cause()); VM_CMS_Operation::verify_after_gc(); @@ -162,8 +163,8 @@ void VM_GenCollectFullConcurrent::doit() { assert(Thread::current()->is_VM_thread(), "Should be VM thread"); assert(GCLockerInvokesConcurrent || ExplicitGCInvokesConcurrent, "Unexpected"); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - if (_gc_count_before == gch->total_collections()) { + CMSHeap* heap = CMSHeap::heap(); + if (_gc_count_before == heap->total_collections()) { // The "full" of do_full_collection call below "forces" // a collection; the second arg, 0, below ensures that // only the young gen is collected. XXX In the future, @@ -173,21 +174,21 @@ void VM_GenCollectFullConcurrent::doit() { // for the future. assert(SafepointSynchronize::is_at_safepoint(), "We can only be executing this arm of if at a safepoint"); - GCCauseSetter gccs(gch, _gc_cause); - gch->do_full_collection(gch->must_clear_all_soft_refs(), GenCollectedHeap::YoungGen); + GCCauseSetter gccs(heap, _gc_cause); + heap->do_full_collection(heap->must_clear_all_soft_refs(), GenCollectedHeap::YoungGen); } // Else no need for a foreground young gc - assert((_gc_count_before < gch->total_collections()) || + assert((_gc_count_before < heap->total_collections()) || (GCLocker::is_active() /* gc may have been skipped */ - && (_gc_count_before == gch->total_collections())), + && (_gc_count_before == heap->total_collections())), "total_collections() should be monotonically increasing"); MutexLockerEx x(FullGCCount_lock, Mutex::_no_safepoint_check_flag); - assert(_full_gc_count_before <= gch->total_full_collections(), "Error"); - if (gch->total_full_collections() == _full_gc_count_before) { + assert(_full_gc_count_before <= heap->total_full_collections(), "Error"); + if (heap->total_full_collections() == _full_gc_count_before) { // Nudge the CMS thread to start a concurrent collection. CMSCollector::request_full_gc(_full_gc_count_before, _gc_cause); } else { - assert(_full_gc_count_before < gch->total_full_collections(), "Error"); + assert(_full_gc_count_before < heap->total_full_collections(), "Error"); FullGCCount_lock->notify_all(); // Inform the Java thread its work is done } } @@ -197,11 +198,11 @@ bool VM_GenCollectFullConcurrent::evaluate_at_safepoint() const { assert(thr != NULL, "Unexpected tid"); if (!thr->is_Java_thread()) { assert(thr->is_VM_thread(), "Expected to be evaluated by VM thread"); - GenCollectedHeap* gch = GenCollectedHeap::heap(); - if (_gc_count_before != gch->total_collections()) { + CMSHeap* heap = CMSHeap::heap(); + if (_gc_count_before != heap->total_collections()) { // No need to do a young gc, we'll just nudge the CMS thread // in the doit() method above, to be executed soon. - assert(_gc_count_before < gch->total_collections(), + assert(_gc_count_before < heap->total_collections(), "total_collections() should be monotonically increasing"); return false; // no need for foreground young gc } @@ -227,9 +228,9 @@ void VM_GenCollectFullConcurrent::doit_epilogue() { // count overflows and wraps around. XXX fix me !!! // e.g. at the rate of 1 full gc per ms, this could // overflow in about 1000 years. - GenCollectedHeap* gch = GenCollectedHeap::heap(); + CMSHeap* heap = CMSHeap::heap(); if (_gc_cause != GCCause::_gc_locker && - gch->total_full_collections_completed() <= _full_gc_count_before) { + heap->total_full_collections_completed() <= _full_gc_count_before) { // maybe we should change the condition to test _gc_cause == // GCCause::_java_lang_system_gc or GCCause::_dcmd_gc_run, // instead of _gc_cause != GCCause::_gc_locker @@ -245,7 +246,7 @@ void VM_GenCollectFullConcurrent::doit_epilogue() { MutexLockerEx ml(FullGCCount_lock, Mutex::_no_safepoint_check_flag); // Either a concurrent or a stop-world full gc is sufficient // witness to our request. - while (gch->total_full_collections_completed() <= _full_gc_count_before) { + while (heap->total_full_collections_completed() <= _full_gc_count_before) { FullGCCount_lock->wait(Mutex::_no_safepoint_check_flag); } } diff --git a/src/hotspot/share/gc/serial/defNewGeneration.cpp b/src/hotspot/share/gc/serial/defNewGeneration.cpp index e65d12a469c..f92660cb232 100644 --- a/src/hotspot/share/gc/serial/defNewGeneration.cpp +++ b/src/hotspot/share/gc/serial/defNewGeneration.cpp @@ -734,8 +734,11 @@ void DefNewGeneration::remove_forwarding_pointers() { RemoveForwardedPointerClosure rspc; eden()->object_iterate(&rspc); from()->object_iterate(&rspc); + restore_preserved_marks(); +} - SharedRestorePreservedMarksTaskExecutor task_executor(GenCollectedHeap::heap()->workers()); +void DefNewGeneration::restore_preserved_marks() { + SharedRestorePreservedMarksTaskExecutor task_executor(NULL); _preserved_marks_set.restore(&task_executor); } diff --git a/src/hotspot/share/gc/serial/defNewGeneration.hpp b/src/hotspot/share/gc/serial/defNewGeneration.hpp index e2ff971ddda..19ca2ac4707 100644 --- a/src/hotspot/share/gc/serial/defNewGeneration.hpp +++ b/src/hotspot/share/gc/serial/defNewGeneration.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2001, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2001, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -89,6 +89,8 @@ protected: // therefore we must remove their forwarding pointers. void remove_forwarding_pointers(); + virtual void restore_preserved_marks(); + // Preserved marks PreservedMarksSet _preserved_marks_set; diff --git a/src/hotspot/share/gc/shared/collectedHeap.hpp b/src/hotspot/share/gc/shared/collectedHeap.hpp index 10b9fb302e2..6dc88de6921 100644 --- a/src/hotspot/share/gc/shared/collectedHeap.hpp +++ b/src/hotspot/share/gc/shared/collectedHeap.hpp @@ -83,6 +83,7 @@ class GCHeapLog : public EventLogBase { // GenCollectedHeap // G1CollectedHeap // ParallelScavengeHeap +// CMSHeap // class CollectedHeap : public CHeapObj { friend class VMStructs; @@ -194,7 +195,8 @@ class CollectedHeap : public CHeapObj { enum Name { GenCollectedHeap, ParallelScavengeHeap, - G1CollectedHeap + G1CollectedHeap, + CMSHeap }; static inline size_t filler_array_max_size() { diff --git a/src/hotspot/share/gc/shared/genCollectedHeap.cpp b/src/hotspot/share/gc/shared/genCollectedHeap.cpp index 139fc32f2a6..ea9afb1ec4a 100644 --- a/src/hotspot/share/gc/shared/genCollectedHeap.cpp +++ b/src/hotspot/share/gc/shared/genCollectedHeap.cpp @@ -58,28 +58,6 @@ #include "utilities/macros.hpp" #include "utilities/stack.inline.hpp" #include "utilities/vmError.hpp" -#if INCLUDE_ALL_GCS -#include "gc/cms/concurrentMarkSweepThread.hpp" -#include "gc/cms/vmCMSOperations.hpp" -#endif // INCLUDE_ALL_GCS - -NOT_PRODUCT(size_t GenCollectedHeap::_skip_header_HeapWords = 0;) - -// The set of potentially parallel tasks in root scanning. -enum GCH_strong_roots_tasks { - GCH_PS_Universe_oops_do, - GCH_PS_JNIHandles_oops_do, - GCH_PS_ObjectSynchronizer_oops_do, - GCH_PS_Management_oops_do, - GCH_PS_SystemDictionary_oops_do, - GCH_PS_ClassLoaderDataGraph_oops_do, - GCH_PS_jvmti_oops_do, - GCH_PS_CodeCache_oops_do, - GCH_PS_aot_oops_do, - GCH_PS_younger_gens, - // Leave this one last. - GCH_PS_NumElements -}; GenCollectedHeap::GenCollectedHeap(GenCollectorPolicy *policy) : CollectedHeap(), @@ -89,15 +67,6 @@ GenCollectedHeap::GenCollectedHeap(GenCollectorPolicy *policy) : _full_collections_completed(0) { assert(policy != NULL, "Sanity check"); - if (UseConcMarkSweepGC) { - _workers = new WorkGang("GC Thread", ParallelGCThreads, - /* are_GC_task_threads */true, - /* are_ConcurrentGC_threads */false); - _workers->initialize_workers(); - } else { - // Serial GC does not use workers. - _workers = NULL; - } } jint GenCollectedHeap::initialize() { @@ -138,15 +107,6 @@ jint GenCollectedHeap::initialize() { _old_gen = gen_policy()->old_gen_spec()->init(old_rs, rem_set()); clear_incremental_collection_failed(); -#if INCLUDE_ALL_GCS - // If we are running CMS, create the collector responsible - // for collecting the CMS generations. - if (collector_policy()->is_concurrent_mark_sweep_policy()) { - bool success = create_cms_collector(); - if (!success) return JNI_ENOMEM; - } -#endif // INCLUDE_ALL_GCS - return JNI_OK; } @@ -183,21 +143,22 @@ char* GenCollectedHeap::allocate(size_t alignment, void GenCollectedHeap::post_initialize() { ref_processing_init(); - assert((_young_gen->kind() == Generation::DefNew) || - (_young_gen->kind() == Generation::ParNew), - "Wrong youngest generation type"); + check_gen_kinds(); DefNewGeneration* def_new_gen = (DefNewGeneration*)_young_gen; - assert(_old_gen->kind() == Generation::ConcurrentMarkSweep || - _old_gen->kind() == Generation::MarkSweepCompact, - "Wrong generation kind"); - _gen_policy->initialize_size_policy(def_new_gen->eden()->capacity(), _old_gen->capacity(), def_new_gen->from()->capacity()); _gen_policy->initialize_gc_policy_counters(); } +void GenCollectedHeap::check_gen_kinds() { + assert(young_gen()->kind() == Generation::DefNew, + "Wrong youngest generation type"); + assert(old_gen()->kind() == Generation::MarkSweepCompact, + "Wrong generation kind"); +} + void GenCollectedHeap::ref_processing_init() { _young_gen->ref_processor_init(); _old_gen->ref_processor_init(); @@ -309,19 +270,6 @@ bool GenCollectedHeap::must_clear_all_soft_refs() { _gc_cause == GCCause::_wb_full_gc; } -bool GenCollectedHeap::should_do_concurrent_full_gc(GCCause::Cause cause) { - if (!UseConcMarkSweepGC) { - return false; - } - - switch (cause) { - case GCCause::_gc_locker: return GCLockerInvokesConcurrent; - case GCCause::_java_lang_system_gc: - case GCCause::_dcmd_gc_run: return ExplicitGCInvokesConcurrent; - default: return false; - } -} - void GenCollectedHeap::collect_generation(Generation* gen, bool full, size_t size, bool is_tlab, bool run_verification, bool clear_soft_refs, bool restore_marks_for_biased_locking) { @@ -674,31 +622,6 @@ void GenCollectedHeap::young_process_roots(StrongRootsScope* scope, _process_strong_tasks->all_tasks_completed(scope->n_threads()); } -void GenCollectedHeap::cms_process_roots(StrongRootsScope* scope, - bool young_gen_as_roots, - ScanningOption so, - bool only_strong_roots, - OopsInGenClosure* root_closure, - CLDClosure* cld_closure) { - MarkingCodeBlobClosure mark_code_closure(root_closure, !CodeBlobToOopClosure::FixRelocations); - OopsInGenClosure* weak_roots = only_strong_roots ? NULL : root_closure; - CLDClosure* weak_cld_closure = only_strong_roots ? NULL : cld_closure; - - process_roots(scope, so, root_closure, weak_roots, cld_closure, weak_cld_closure, &mark_code_closure); - if (!only_strong_roots) { - process_string_table_roots(scope, root_closure); - } - - if (young_gen_as_roots && - !_process_strong_tasks->is_task_claimed(GCH_PS_younger_gens)) { - root_closure->set_generation(_young_gen); - _young_gen->oop_iterate(root_closure); - root_closure->reset_generation(); - } - - _process_strong_tasks->all_tasks_completed(scope->n_threads()); -} - void GenCollectedHeap::full_process_roots(StrongRootsScope* scope, bool is_adjust_phase, ScanningOption so, @@ -763,14 +686,7 @@ HeapWord** GenCollectedHeap::end_addr() const { // public collection interfaces void GenCollectedHeap::collect(GCCause::Cause cause) { - if (should_do_concurrent_full_gc(cause)) { -#if INCLUDE_ALL_GCS - // Mostly concurrent full collection. - collect_mostly_concurrent(cause); -#else // INCLUDE_ALL_GCS - ShouldNotReachHere(); -#endif // INCLUDE_ALL_GCS - } else if (cause == GCCause::_wb_young_gc) { + if (cause == GCCause::_wb_young_gc) { // Young collection for the WhiteBox API. collect(cause, YoungGen); } else { @@ -817,44 +733,6 @@ void GenCollectedHeap::collect_locked(GCCause::Cause cause, GenerationType max_g } } -#if INCLUDE_ALL_GCS -bool GenCollectedHeap::create_cms_collector() { - - assert(_old_gen->kind() == Generation::ConcurrentMarkSweep, - "Unexpected generation kinds"); - // Skip two header words in the block content verification - NOT_PRODUCT(_skip_header_HeapWords = CMSCollector::skip_header_HeapWords();) - assert(_gen_policy->is_concurrent_mark_sweep_policy(), "Unexpected policy type"); - CMSCollector* collector = - new CMSCollector((ConcurrentMarkSweepGeneration*)_old_gen, - _rem_set, - _gen_policy->as_concurrent_mark_sweep_policy()); - - if (collector == NULL || !collector->completed_initialization()) { - if (collector) { - delete collector; // Be nice in embedded situation - } - vm_shutdown_during_initialization("Could not create CMS collector"); - return false; - } - return true; // success -} - -void GenCollectedHeap::collect_mostly_concurrent(GCCause::Cause cause) { - assert(!Heap_lock->owned_by_self(), "Should not own Heap_lock"); - - MutexLocker ml(Heap_lock); - // Read the GC counts while holding the Heap_lock - unsigned int full_gc_count_before = total_full_collections(); - unsigned int gc_count_before = total_collections(); - { - MutexUnlocker mu(Heap_lock); - VM_GenCollectFullConcurrent op(gc_count_before, full_gc_count_before, cause); - VMThread::execute(&op); - } -} -#endif // INCLUDE_ALL_GCS - void GenCollectedHeap::do_full_collection(bool clear_all_soft_refs) { do_full_collection(clear_all_soft_refs, OldGen); } @@ -1097,8 +975,9 @@ void GenCollectedHeap::save_marks() { GenCollectedHeap* GenCollectedHeap::heap() { CollectedHeap* heap = Universe::heap(); assert(heap != NULL, "Uninitialized access to GenCollectedHeap::heap()"); - assert(heap->kind() == CollectedHeap::GenCollectedHeap, "Not a GenCollectedHeap"); - return (GenCollectedHeap*)heap; + assert(heap->kind() == CollectedHeap::GenCollectedHeap || + heap->kind() == CollectedHeap::CMSHeap, "Not a GenCollectedHeap"); + return (GenCollectedHeap*) heap; } void GenCollectedHeap::prepare_for_compaction() { @@ -1126,34 +1005,9 @@ void GenCollectedHeap::print_on(outputStream* st) const { } void GenCollectedHeap::gc_threads_do(ThreadClosure* tc) const { - if (workers() != NULL) { - workers()->threads_do(tc); - } -#if INCLUDE_ALL_GCS - if (UseConcMarkSweepGC) { - ConcurrentMarkSweepThread::threads_do(tc); - } -#endif // INCLUDE_ALL_GCS } void GenCollectedHeap::print_gc_threads_on(outputStream* st) const { -#if INCLUDE_ALL_GCS - if (UseConcMarkSweepGC) { - workers()->print_worker_threads_on(st); - ConcurrentMarkSweepThread::print_all_on(st); - } -#endif // INCLUDE_ALL_GCS -} - -void GenCollectedHeap::print_on_error(outputStream* st) const { - this->CollectedHeap::print_on_error(st); - -#if INCLUDE_ALL_GCS - if (UseConcMarkSweepGC) { - st->cr(); - CMSCollector::print_on_error(st); - } -#endif // INCLUDE_ALL_GCS } void GenCollectedHeap::print_tracing_info() const { @@ -1184,7 +1038,6 @@ class GenGCPrologueClosure: public GenCollectedHeap::GenClosure { void GenCollectedHeap::gc_prologue(bool full) { assert(InlineCacheBuffer::is_empty(), "should have cleaned up ICBuffer"); - always_do_update_barrier = false; // Fill TLAB's and such CollectedHeap::accumulate_statistics_all_tlabs(); ensure_parsability(true); // retire TLABs @@ -1222,8 +1075,6 @@ void GenCollectedHeap::gc_epilogue(bool full) { MetaspaceCounters::update_performance_counters(); CompressedClassSpaceCounters::update_performance_counters(); - - always_do_update_barrier = UseConcMarkSweepGC; }; #ifndef PRODUCT @@ -1304,11 +1155,3 @@ jlong GenCollectedHeap::millis_since_last_gc() { } return retVal; } - -void GenCollectedHeap::stop() { -#if INCLUDE_ALL_GCS - if (UseConcMarkSweepGC) { - ConcurrentMarkSweepThread::cmst()->stop(); - } -#endif -} diff --git a/src/hotspot/share/gc/shared/genCollectedHeap.hpp b/src/hotspot/share/gc/shared/genCollectedHeap.hpp index 4d9087341d4..48b2371227d 100644 --- a/src/hotspot/share/gc/shared/genCollectedHeap.hpp +++ b/src/hotspot/share/gc/shared/genCollectedHeap.hpp @@ -1,5 +1,5 @@ /* - * Copyright (c) 2000, 2016, Oracle and/or its affiliates. All rights reserved. + * Copyright (c) 2000, 2017, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it @@ -78,21 +78,34 @@ private: // In support of ExplicitGCInvokesConcurrent functionality unsigned int _full_collections_completed; - // Data structure for claiming the (potentially) parallel tasks in - // (gen-specific) roots processing. - SubTasksDone* _process_strong_tasks; - // Collects the given generation. void collect_generation(Generation* gen, bool full, size_t size, bool is_tlab, bool run_verification, bool clear_soft_refs, bool restore_marks_for_biased_locking); - // In block contents verification, the number of header words to skip - NOT_PRODUCT(static size_t _skip_header_HeapWords;) - - WorkGang* _workers; - protected: + + // The set of potentially parallel tasks in root scanning. + enum GCH_strong_roots_tasks { + GCH_PS_Universe_oops_do, + GCH_PS_JNIHandles_oops_do, + GCH_PS_ObjectSynchronizer_oops_do, + GCH_PS_FlatProfiler_oops_do, + GCH_PS_Management_oops_do, + GCH_PS_SystemDictionary_oops_do, + GCH_PS_ClassLoaderDataGraph_oops_do, + GCH_PS_jvmti_oops_do, + GCH_PS_CodeCache_oops_do, + GCH_PS_aot_oops_do, + GCH_PS_younger_gens, + // Leave this one last. + GCH_PS_NumElements + }; + + // Data structure for claiming the (potentially) parallel tasks in + // (gen-specific) roots processing. + SubTasksDone* _process_strong_tasks; + // Helper functions for allocation HeapWord* attempt_allocation(size_t size, bool is_tlab, @@ -124,8 +137,6 @@ protected: public: GenCollectedHeap(GenCollectorPolicy *policy); - WorkGang* workers() const { return _workers; } - // Returns JNI_OK on success virtual jint initialize(); @@ -135,6 +146,8 @@ public: // Does operations required after initialization has been done. void post_initialize(); + virtual void check_gen_kinds(); + // Initialize ("weak") refs processing support virtual void ref_processing_init(); @@ -143,11 +156,7 @@ public: } virtual const char* name() const { - if (UseConcMarkSweepGC) { - return "Concurrent Mark Sweep"; - } else { - return "Serial"; - } + return "Serial"; } Generation* young_gen() const { return _young_gen; } @@ -190,7 +199,7 @@ public: // Perform a full collection of the heap; intended for use in implementing // "System.gc". This implies as full a collection as the CollectedHeap // supports. Caller does not hold the Heap_lock on entry. - void collect(GCCause::Cause cause); + virtual void collect(GCCause::Cause cause); // The same as above but assume that the caller holds the Heap_lock. void collect_locked(GCCause::Cause cause); @@ -207,12 +216,8 @@ public: bool is_in(const void* p) const; // override - bool is_in_closed_subset(const void* p) const { - if (UseConcMarkSweepGC) { - return is_in_reserved(p); - } else { - return is_in(p); - } + virtual bool is_in_closed_subset(const void* p) const { + return is_in(p); } // Returns true if the reference is to an object in the reserved space @@ -278,7 +283,7 @@ public: } virtual bool card_mark_must_follow_store() const { - return UseConcMarkSweepGC; + return false; } // We don't need barriers for stores to objects in the @@ -344,7 +349,6 @@ public: virtual void print_gc_threads_on(outputStream* st) const; virtual void gc_threads_do(ThreadClosure* tc) const; virtual void print_tracing_info() const; - virtual void print_on_error(outputStream* st) const; void print_heap_change(size_t young_prev_used, size_t old_prev_used) const; @@ -383,7 +387,7 @@ public: SO_ScavengeCodeCache = 0x10 }; - private: + protected: void process_roots(StrongRootsScope* scope, ScanningOption so, OopClosure* strong_roots, @@ -395,24 +399,20 @@ public: void process_string_table_roots(StrongRootsScope* scope, OopClosure* root_closure); + // Accessor for memory state verification support + NOT_PRODUCT( + virtual size_t skip_header_HeapWords() { return 0; } + ) + + virtual void gc_prologue(bool full); + virtual void gc_epilogue(bool full); + public: void young_process_roots(StrongRootsScope* scope, OopsInGenClosure* root_closure, OopsInGenClosure* old_gen_closure, CLDClosure* cld_closure); - // If "young_gen_as_roots" is false, younger generations are - // not scanned as roots; in this case, the caller must be arranging to - // scan the younger generations itself. (For example, a generation might - // explicitly mark reachable objects in younger generations, to avoid - // excess storage retention.) - void cms_process_roots(StrongRootsScope* scope, - bool young_gen_as_roots, - ScanningOption so, - bool only_strong_roots, - OopsInGenClosure* root_closure, - CLDClosure* cld_closure); - void full_process_roots(StrongRootsScope* scope, bool is_adjust_phase, ScanningOption so, @@ -479,12 +479,8 @@ public: oop obj, size_t obj_size); -private: - // Accessor for memory state verification support - NOT_PRODUCT( - static size_t skip_header_HeapWords() { return _skip_header_HeapWords; } - ) +private: // Override void check_for_non_bad_heap_word_value(HeapWord* addr, size_t size) PRODUCT_RETURN; @@ -499,22 +495,8 @@ private: // collect() and collect_locked(). Caller holds the Heap_lock on entry. void collect_locked(GCCause::Cause cause, GenerationType max_generation); - // Returns success or failure. - bool create_cms_collector(); - - // In support of ExplicitGCInvokesConcurrent functionality - bool should_do_concurrent_full_gc(GCCause::Cause cause); - void collect_mostly_concurrent(GCCause::Cause cause); - // Save the tops of the spaces in all generations void record_gen_tops_before_GC() PRODUCT_RETURN; - -protected: - void gc_prologue(bool full); - void gc_epilogue(bool full); - -public: - void stop(); }; #endif // SHARE_VM_GC_SHARED_GENCOLLECTEDHEAP_HPP diff --git a/src/hotspot/share/memory/universe.cpp b/src/hotspot/share/memory/universe.cpp index 335df28fe79..852c058b756 100644 --- a/src/hotspot/share/memory/universe.cpp +++ b/src/hotspot/share/memory/universe.cpp @@ -84,6 +84,7 @@ #include "utilities/preserveException.hpp" #if INCLUDE_ALL_GCS #include "gc/cms/cmsCollectorPolicy.hpp" +#include "gc/cms/cmsHeap.hpp" #include "gc/g1/g1CollectedHeap.inline.hpp" #include "gc/g1/g1CollectorPolicy.hpp" #include "gc/parallel/parallelScavengeHeap.hpp" @@ -758,7 +759,7 @@ CollectedHeap* Universe::create_heap() { } else if (UseG1GC) { return Universe::create_heap_with_policy(); } else if (UseConcMarkSweepGC) { - return Universe::create_heap_with_policy(); + return Universe::create_heap_with_policy(); #endif } else if (UseSerialGC) { return Universe::create_heap_with_policy(); diff --git a/src/hotspot/share/services/memoryService.cpp b/src/hotspot/share/services/memoryService.cpp index aed39e9451b..31a32b4bdd6 100644 --- a/src/hotspot/share/services/memoryService.cpp +++ b/src/hotspot/share/services/memoryService.cpp @@ -86,7 +86,8 @@ void GcThreadCountClosure::do_thread(Thread* thread) { void MemoryService::set_universe_heap(CollectedHeap* heap) { CollectedHeap::Name kind = heap->kind(); switch (kind) { - case CollectedHeap::GenCollectedHeap : { + case CollectedHeap::GenCollectedHeap : + case CollectedHeap::CMSHeap : { add_gen_collected_heap_info(GenCollectedHeap::heap()); break; } From 34622112b6c2026f2863f923b6538e392d7231f3 Mon Sep 17 00:00:00 2001 From: Tobias Hartmann Date: Fri, 13 Oct 2017 14:02:01 +0200 Subject: [PATCH 78/80] 8189067: SuperWord optimization crashes with "assert(out == prev || prev == __null) failed: no branches off of store slice" Only move the store if the LCA of all users is outside of the loop. Re-enable UseSubwordForMaxVector. Reviewed-by: kvn, roland --- src/hotspot/share/opto/c2_globals.hpp | 2 +- src/hotspot/share/opto/loopopts.cpp | 47 ++++++------------- .../loopopts/TestMoveStoresOutOfLoops.java | 24 +++++++++- 3 files changed, 38 insertions(+), 35 deletions(-) diff --git a/src/hotspot/share/opto/c2_globals.hpp b/src/hotspot/share/opto/c2_globals.hpp index febeb5f56f9..e1c859c3af9 100644 --- a/src/hotspot/share/opto/c2_globals.hpp +++ b/src/hotspot/share/opto/c2_globals.hpp @@ -192,7 +192,7 @@ "of rounds of unroll,optimize,..") \ range(0, max_jint) \ \ - product(bool, UseSubwordForMaxVector, false, \ + product(bool, UseSubwordForMaxVector, true, \ "Use Subword Analysis to set maximum vector size") \ \ develop(intx, UnrollLimitForProfileCheck, 1, \ diff --git a/src/hotspot/share/opto/loopopts.cpp b/src/hotspot/share/opto/loopopts.cpp index 8bbb2c45e8d..45acc2fcae2 100644 --- a/src/hotspot/share/opto/loopopts.cpp +++ b/src/hotspot/share/opto/loopopts.cpp @@ -826,45 +826,26 @@ void PhaseIdealLoop::try_move_store_after_loop(Node* n) { } } if (mem_ok) { - // Move the Store out of the loop creating clones along - // all paths out of the loop that observe the stored value + // Move the store out of the loop if the LCA of all + // users (except for the phi) is outside the loop. + Node* hook = new Node(1); _igvn.rehash_node_delayed(phi); - int count = phi->replace_edge(n, n->in(MemNode::Memory)); + int count = phi->replace_edge(n, hook); assert(count > 0, "inconsistent phi"); - for (DUIterator_Fast imax, i = n->fast_outs(imax); i < imax; i++) { - Node* u = n->fast_out(i); - Node* c = get_ctrl(u); - if (u->is_Phi()) { - c = u->in(0)->in(u->find_edge(n)); - } - IdealLoopTree *u_loop = get_loop(c); - assert (!n_loop->is_member(u_loop), "only the phi should have been a use in the loop"); - while(true) { - Node* next_c = find_non_split_ctrl(idom(c)); - if (n_loop->is_member(get_loop(next_c))) { - break; - } - c = next_c; - } - - Node* st = n->clone(); - st->set_req(0, c); - _igvn.register_new_node_with_optimizer(st); - - set_ctrl(st, c); - IdealLoopTree* new_loop = get_loop(c); - assert(new_loop != n_loop, "should be moved out of loop"); - if (new_loop->_child == NULL) new_loop->_body.push(st); - - _igvn.replace_input_of(u, u->find_edge(n), st); - --imax; - --i; + // Compute latest point this store can go + Node* lca = get_late_ctrl(n, get_ctrl(n)); + if (n_loop->is_member(get_loop(lca))) { + // LCA is in the loop - bail out + _igvn.replace_node(hook, n); + return; } + // Move store out of the loop + _igvn.replace_node(hook, n->in(MemNode::Memory)); + _igvn.replace_input_of(n, 0, lca); + set_ctrl_and_loop(n, lca); - assert(n->outcnt() == 0, "all uses should be gone"); - _igvn.replace_input_of(n, MemNode::Memory, C->top()); // Disconnect the phi now. An empty phi can confuse other // optimizations in this pass of loop opts.. if (phi->in(LoopNode::LoopBackControl) == phi) { diff --git a/test/hotspot/jtreg/compiler/loopopts/TestMoveStoresOutOfLoops.java b/test/hotspot/jtreg/compiler/loopopts/TestMoveStoresOutOfLoops.java index ed86d36c338..38ce019db08 100644 --- a/test/hotspot/jtreg/compiler/loopopts/TestMoveStoresOutOfLoops.java +++ b/test/hotspot/jtreg/compiler/loopopts/TestMoveStoresOutOfLoops.java @@ -23,7 +23,7 @@ /** * @test - * @bug 8080289 + * @bug 8080289 8189067 * @summary Move stores out of loops if possible * * @run main/othervm -XX:-UseOnStackReplacement -XX:-BackgroundCompilation @@ -43,6 +43,7 @@ public class TestMoveStoresOutOfLoops { private static long[] array = new long[10]; private static long[] array2 = new long[10]; private static boolean[] array3 = new boolean[1000]; + private static int[] array4 = new int[1000]; private static byte[] byte_array = new byte[10]; // Array store should be moved out of the loop, value stored @@ -108,6 +109,15 @@ public class TestMoveStoresOutOfLoops { } } + // Array store can be moved out of the inner loop + static void test_after_7(int idx) { + for (int i = 0; i < 1000; i++) { + for (int j = 0; j <= 42; j++) { + array4[i] = j; + } + } + } + // Optimize out redundant stores static void test_stores_1(int ignored) { array[0] = 0; @@ -285,6 +295,17 @@ public class TestMoveStoresOutOfLoops { return success; } + static boolean array_check5(String name) { + boolean success = true; + for (int i = 0; i < 1000; i++) { + if (array4[i] != 42) { + success = false; + System.out.println(name + " failed: array[" + i + "] = " + array4[i]); + } + } + return success; + } + static public void main(String[] args) throws Exception { TestMoveStoresOutOfLoops test = new TestMoveStoresOutOfLoops(); test.doTest("test_after_1", TestMoveStoresOutOfLoops::array_init, TestMoveStoresOutOfLoops::array_check); @@ -295,6 +316,7 @@ public class TestMoveStoresOutOfLoops { test.doTest("test_after_6", TestMoveStoresOutOfLoops::array_init, TestMoveStoresOutOfLoops::array_check); array3[999] = true; test.doTest("test_after_6", TestMoveStoresOutOfLoops::array_init, TestMoveStoresOutOfLoops::array_check); + test.doTest("test_after_7", TestMoveStoresOutOfLoops::array_init, TestMoveStoresOutOfLoops::array_check5); test.doTest("test_stores_1", TestMoveStoresOutOfLoops::array_init3, TestMoveStoresOutOfLoops::array_check3); test.doTest("test_stores_2", TestMoveStoresOutOfLoops::array_init3, TestMoveStoresOutOfLoops::array_check3); From ebf1633bd21e58d0c86a7054ccb461529915573e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Erik=20=C3=96sterlund?= Date: Fri, 13 Oct 2017 15:08:56 +0200 Subject: [PATCH 79/80] 8185141: Generalize scavengeable nmethod root handling Reviewed-by: tschatzl, pliden, rkennke --- src/hotspot/share/c1/c1_Runtime1.cpp | 5 --- src/hotspot/share/code/codeCache.cpp | 45 +++++++------------ src/hotspot/share/code/codeCache.hpp | 4 ++ src/hotspot/share/code/nmethod.cpp | 23 +++------- src/hotspot/share/gc/g1/g1CollectedHeap.cpp | 18 +++----- src/hotspot/share/gc/g1/g1CollectedHeap.hpp | 5 ++- .../gc/parallel/parallelScavengeHeap.cpp | 17 +++++-- .../gc/parallel/parallelScavengeHeap.hpp | 4 +- src/hotspot/share/gc/shared/collectedHeap.cpp | 8 ---- src/hotspot/share/gc/shared/collectedHeap.hpp | 12 ++--- .../share/gc/shared/genCollectedHeap.cpp | 8 ++++ .../share/gc/shared/genCollectedHeap.hpp | 8 +++- src/hotspot/share/oops/oop.inline.hpp | 2 +- 13 files changed, 73 insertions(+), 86 deletions(-) diff --git a/src/hotspot/share/c1/c1_Runtime1.cpp b/src/hotspot/share/c1/c1_Runtime1.cpp index c66a69dd689..78987c99b48 100644 --- a/src/hotspot/share/c1/c1_Runtime1.cpp +++ b/src/hotspot/share/c1/c1_Runtime1.cpp @@ -1221,11 +1221,6 @@ JRT_ENTRY(void, Runtime1::patch_code(JavaThread* thread, Runtime1::StubID stub_i MutexLockerEx ml_code (CodeCache_lock, Mutex::_no_safepoint_check_flag); nmethod* nm = CodeCache::find_nmethod(caller_frame.pc()); guarantee(nm != NULL, "only nmethods can contain non-perm oops"); - if (!nm->on_scavenge_root_list() && - ((mirror.not_null() && mirror()->is_scavengable()) || - (appendix.not_null() && appendix->is_scavengable()))) { - CodeCache::add_scavenge_root_nmethod(nm); - } // Since we've patched some oops in the nmethod, // (re)register it with the heap. diff --git a/src/hotspot/share/code/codeCache.cpp b/src/hotspot/share/code/codeCache.cpp index 56c230e3bbf..5caf167c55b 100644 --- a/src/hotspot/share/code/codeCache.cpp +++ b/src/hotspot/share/code/codeCache.cpp @@ -683,22 +683,19 @@ void CodeCache::blobs_do(CodeBlobClosure* f) { if (cb->is_alive()) { f->do_code_blob(cb); #ifdef ASSERT - if (cb->is_nmethod()) - ((nmethod*)cb)->verify_scavenge_root_oops(); + if (cb->is_nmethod()) { + Universe::heap()->verify_nmethod((nmethod*)cb); + } #endif //ASSERT } } } } -// Walk the list of methods which might contain non-perm oops. +// Walk the list of methods which might contain oops to the java heap. void CodeCache::scavenge_root_nmethods_do(CodeBlobToOopClosure* f) { assert_locked_or_safepoint(CodeCache_lock); - if (UseG1GC) { - return; - } - const bool fix_relocations = f->fix_relocations(); debug_only(mark_scavenge_root_nmethods()); @@ -735,13 +732,20 @@ void CodeCache::scavenge_root_nmethods_do(CodeBlobToOopClosure* f) { debug_only(verify_perm_nmethods(NULL)); } +void CodeCache::register_scavenge_root_nmethod(nmethod* nm) { + assert_locked_or_safepoint(CodeCache_lock); + if (!nm->on_scavenge_root_list() && nm->detect_scavenge_root_oops()) { + add_scavenge_root_nmethod(nm); + } +} + +void CodeCache::verify_scavenge_root_nmethod(nmethod* nm) { + nm->verify_scavenge_root_oops(); +} + void CodeCache::add_scavenge_root_nmethod(nmethod* nm) { assert_locked_or_safepoint(CodeCache_lock); - if (UseG1GC) { - return; - } - nm->set_on_scavenge_root_list(); nm->set_scavenge_root_link(_scavenge_root_nmethods); set_scavenge_root_nmethods(nm); @@ -754,8 +758,6 @@ void CodeCache::unlink_scavenge_root_nmethod(nmethod* nm, nmethod* prev) { assert((prev == NULL && scavenge_root_nmethods() == nm) || (prev != NULL && prev->scavenge_root_link() == nm), "precondition"); - assert(!UseG1GC, "G1 does not use the scavenge_root_nmethods list"); - print_trace("unlink_scavenge_root", nm); if (prev == NULL) { set_scavenge_root_nmethods(nm->scavenge_root_link()); @@ -769,10 +771,6 @@ void CodeCache::unlink_scavenge_root_nmethod(nmethod* nm, nmethod* prev) { void CodeCache::drop_scavenge_root_nmethod(nmethod* nm) { assert_locked_or_safepoint(CodeCache_lock); - if (UseG1GC) { - return; - } - print_trace("drop_scavenge_root", nm); nmethod* prev = NULL; for (nmethod* cur = scavenge_root_nmethods(); cur != NULL; cur = cur->scavenge_root_link()) { @@ -788,10 +786,6 @@ void CodeCache::drop_scavenge_root_nmethod(nmethod* nm) { void CodeCache::prune_scavenge_root_nmethods() { assert_locked_or_safepoint(CodeCache_lock); - if (UseG1GC) { - return; - } - debug_only(mark_scavenge_root_nmethods()); nmethod* last = NULL; @@ -820,10 +814,6 @@ void CodeCache::prune_scavenge_root_nmethods() { #ifndef PRODUCT void CodeCache::asserted_non_scavengable_nmethods_do(CodeBlobClosure* f) { - if (UseG1GC) { - return; - } - // While we are here, verify the integrity of the list. mark_scavenge_root_nmethods(); for (nmethod* cur = scavenge_root_nmethods(); cur != NULL; cur = cur->scavenge_root_link()) { @@ -833,7 +823,7 @@ void CodeCache::asserted_non_scavengable_nmethods_do(CodeBlobClosure* f) { verify_perm_nmethods(f); } -// Temporarily mark nmethods that are claimed to be on the non-perm list. +// Temporarily mark nmethods that are claimed to be on the scavenge list. void CodeCache::mark_scavenge_root_nmethods() { NMethodIterator iter; while(iter.next_alive()) { @@ -854,7 +844,7 @@ void CodeCache::verify_perm_nmethods(CodeBlobClosure* f_or_null) { assert(nm->scavenge_root_not_marked(), "must be already processed"); if (nm->on_scavenge_root_list()) call_f = false; // don't show this one to the client - nm->verify_scavenge_root_oops(); + Universe::heap()->verify_nmethod(nm); if (call_f) f_or_null->do_code_blob(nm); } } @@ -1640,4 +1630,3 @@ void CodeCache::log_state(outputStream* st) { blob_count(), nmethod_count(), adapter_count(), unallocated_capacity()); } - diff --git a/src/hotspot/share/code/codeCache.hpp b/src/hotspot/share/code/codeCache.hpp index 37e63e7089c..03c0f5c3f0d 100644 --- a/src/hotspot/share/code/codeCache.hpp +++ b/src/hotspot/share/code/codeCache.hpp @@ -181,6 +181,10 @@ class CodeCache : AllStatic { static void scavenge_root_nmethods_do(CodeBlobToOopClosure* f); static nmethod* scavenge_root_nmethods() { return _scavenge_root_nmethods; } + // register_scavenge_root_nmethod() conditionally adds the nmethod to the list + // if it is not already on the list and has a scavengeable root + static void register_scavenge_root_nmethod(nmethod* nm); + static void verify_scavenge_root_nmethod(nmethod* nm); static void add_scavenge_root_nmethod(nmethod* nm); static void drop_scavenge_root_nmethod(nmethod* nm); diff --git a/src/hotspot/share/code/nmethod.cpp b/src/hotspot/share/code/nmethod.cpp index 1772feedde1..b1a6c481555 100644 --- a/src/hotspot/share/code/nmethod.cpp +++ b/src/hotspot/share/code/nmethod.cpp @@ -411,11 +411,8 @@ void nmethod::init_defaults() { _oops_do_mark_link = NULL; _jmethod_id = NULL; _osr_link = NULL; - if (UseG1GC) { - _unloading_next = NULL; - } else { - _scavenge_root_link = NULL; - } + _unloading_next = NULL; + _scavenge_root_link = NULL; _scavenge_root_state = 0; #if INCLUDE_RTM_OPT _rtm_state = NoRTM; @@ -599,12 +596,9 @@ nmethod::nmethod( code_buffer->copy_code_and_locs_to(this); code_buffer->copy_values_to(this); if (ScavengeRootsInCode) { - if (detect_scavenge_root_oops()) { - CodeCache::add_scavenge_root_nmethod(this); - } Universe::heap()->register_nmethod(this); } - debug_only(verify_scavenge_root_oops()); + debug_only(Universe::heap()->verify_nmethod(this)); CodeCache::commit(this); } @@ -754,12 +748,9 @@ nmethod::nmethod( debug_info->copy_to(this); dependencies->copy_to(this); if (ScavengeRootsInCode) { - if (detect_scavenge_root_oops()) { - CodeCache::add_scavenge_root_nmethod(this); - } Universe::heap()->register_nmethod(this); } - debug_only(verify_scavenge_root_oops()); + debug_only(Universe::heap()->verify_nmethod(this)); CodeCache::commit(this); @@ -2137,7 +2128,7 @@ void nmethod::verify() { VerifyOopsClosure voc(this); oops_do(&voc); assert(voc.ok(), "embedded oops must be OK"); - verify_scavenge_root_oops(); + Universe::heap()->verify_nmethod(this); verify_scopes(); } @@ -2230,10 +2221,6 @@ public: }; void nmethod::verify_scavenge_root_oops() { - if (UseG1GC) { - return; - } - if (!on_scavenge_root_list()) { // Actually look inside, to verify the claim that it's clean. DebugScavengeRoot debug_scavenge_root(this); diff --git a/src/hotspot/share/gc/g1/g1CollectedHeap.cpp b/src/hotspot/share/gc/g1/g1CollectedHeap.cpp index 19e2998a50d..f57caa841bd 100644 --- a/src/hotspot/share/gc/g1/g1CollectedHeap.cpp +++ b/src/hotspot/share/gc/g1/g1CollectedHeap.cpp @@ -141,13 +141,6 @@ void G1RegionMappingChangedListener::on_commit(uint start_idx, size_t num_region reset_from_card_cache(start_idx, num_regions); } -// Returns true if the reference points to an object that -// can move in an incremental collection. -bool G1CollectedHeap::is_scavengable(const void* p) { - HeapRegion* hr = heap_region_containing(p); - return !hr->is_pinned(); -} - // Private methods. HeapRegion* @@ -5323,17 +5316,20 @@ public: void do_oop(narrowOop* p) { do_oop_work(p); } }; -void G1CollectedHeap::register_nmethod(nmethod* nm) { - CollectedHeap::register_nmethod(nm); +// Returns true if the reference points to an object that +// can move in an incremental collection. +bool G1CollectedHeap::is_scavengable(oop obj) { + HeapRegion* hr = heap_region_containing(obj); + return !hr->is_pinned(); +} +void G1CollectedHeap::register_nmethod(nmethod* nm) { guarantee(nm != NULL, "sanity"); RegisterNMethodOopClosure reg_cl(this, nm); nm->oops_do(®_cl); } void G1CollectedHeap::unregister_nmethod(nmethod* nm) { - CollectedHeap::unregister_nmethod(nm); - guarantee(nm != NULL, "sanity"); UnregisterNMethodOopClosure reg_cl(this, nm); nm->oops_do(®_cl, true); diff --git a/src/hotspot/share/gc/g1/g1CollectedHeap.hpp b/src/hotspot/share/gc/g1/g1CollectedHeap.hpp index 266fffa2d02..6c25f60b089 100644 --- a/src/hotspot/share/gc/g1/g1CollectedHeap.hpp +++ b/src/hotspot/share/gc/g1/g1CollectedHeap.hpp @@ -1282,8 +1282,6 @@ public: inline bool is_in_young(const oop obj); - virtual bool is_scavengable(const void* addr); - // We don't need barriers for initializing stores to objects // in the young gen: for the SATB pre-barrier, there is no // pre-value that needs to be remembered; for the remembered-set @@ -1395,6 +1393,9 @@ public: // Optimized nmethod scanning support routines + // Is an oop scavengeable + virtual bool is_scavengable(oop obj); + // Register the given nmethod with the G1 heap. virtual void register_nmethod(nmethod* nm); diff --git a/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp b/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp index d3f960dfaae..27fcf5c1adc 100644 --- a/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp +++ b/src/hotspot/share/gc/parallel/parallelScavengeHeap.cpp @@ -23,6 +23,7 @@ */ #include "precompiled.hpp" +#include "code/codeCache.hpp" #include "gc/parallel/adjoiningGenerations.hpp" #include "gc/parallel/adjoiningVirtualSpaces.hpp" #include "gc/parallel/cardTableExtension.hpp" @@ -169,10 +170,6 @@ bool ParallelScavengeHeap::is_in_reserved(const void* p) const { return young_gen()->is_in_reserved(p) || old_gen()->is_in_reserved(p); } -bool ParallelScavengeHeap::is_scavengable(const void* addr) { - return is_in_young((oop)addr); -} - // There are two levels of allocation policy here. // // When an allocation request fails, the requesting thread must invoke a VM @@ -665,3 +662,15 @@ void ParallelScavengeHeap::gen_mangle_unused_area() { } } #endif + +bool ParallelScavengeHeap::is_scavengable(oop obj) { + return is_in_young(obj); +} + +void ParallelScavengeHeap::register_nmethod(nmethod* nm) { + CodeCache::register_scavenge_root_nmethod(nm); +} + +void ParallelScavengeHeap::verify_nmethod(nmethod* nm) { + CodeCache::verify_scavenge_root_nmethod(nm); +} diff --git a/src/hotspot/share/gc/parallel/parallelScavengeHeap.hpp b/src/hotspot/share/gc/parallel/parallelScavengeHeap.hpp index e83cb3e5f2f..bfdc55f07f7 100644 --- a/src/hotspot/share/gc/parallel/parallelScavengeHeap.hpp +++ b/src/hotspot/share/gc/parallel/parallelScavengeHeap.hpp @@ -134,7 +134,9 @@ class ParallelScavengeHeap : public CollectedHeap { // can be moved in a partial collection. For currently implemented // generational collectors that means during a collection of // the young gen. - virtual bool is_scavengable(const void* addr); + virtual bool is_scavengable(oop obj); + virtual void register_nmethod(nmethod* nm); + virtual void verify_nmethod(nmethod* nmethod); size_t max_capacity() const; diff --git a/src/hotspot/share/gc/shared/collectedHeap.cpp b/src/hotspot/share/gc/shared/collectedHeap.cpp index deb9da3cbd8..ed5b4a6b66a 100644 --- a/src/hotspot/share/gc/shared/collectedHeap.cpp +++ b/src/hotspot/share/gc/shared/collectedHeap.cpp @@ -135,14 +135,6 @@ void CollectedHeap::print_on_error(outputStream* st) const { _barrier_set->print_on(st); } -void CollectedHeap::register_nmethod(nmethod* nm) { - assert_locked_or_safepoint(CodeCache_lock); -} - -void CollectedHeap::unregister_nmethod(nmethod* nm) { - assert_locked_or_safepoint(CodeCache_lock); -} - void CollectedHeap::trace_heap(GCWhen::Type when, const GCTracer* gc_tracer) { const GCHeapSummary& heap_summary = create_heap_summary(); gc_tracer->report_gc_heap_summary(when, heap_summary); diff --git a/src/hotspot/share/gc/shared/collectedHeap.hpp b/src/hotspot/share/gc/shared/collectedHeap.hpp index 6dc88de6921..0f72c8c1f6b 100644 --- a/src/hotspot/share/gc/shared/collectedHeap.hpp +++ b/src/hotspot/share/gc/shared/collectedHeap.hpp @@ -289,10 +289,6 @@ class CollectedHeap : public CHeapObj { return p == NULL || is_in_closed_subset(p); } - // An object is scavengable if its location may move during a scavenge. - // (A scavenge is a GC which is not a full GC.) - virtual bool is_scavengable(const void *p) = 0; - void set_gc_cause(GCCause::Cause v) { if (UsePerfData) { _gc_lastcause = _gc_cause; @@ -570,10 +566,14 @@ class CollectedHeap : public CHeapObj { void print_heap_before_gc(); void print_heap_after_gc(); + // An object is scavengable if its location may move during a scavenge. + // (A scavenge is a GC which is not a full GC.) + virtual bool is_scavengable(oop obj) = 0; // Registering and unregistering an nmethod (compiled code) with the heap. // Override with specific mechanism for each specialized heap type. - virtual void register_nmethod(nmethod* nm); - virtual void unregister_nmethod(nmethod* nm); + virtual void register_nmethod(nmethod* nm) {} + virtual void unregister_nmethod(nmethod* nm) {} + virtual void verify_nmethod(nmethod* nmethod) {} void trace_heap_before_gc(const GCTracer* gc_tracer); void trace_heap_after_gc(const GCTracer* gc_tracer); diff --git a/src/hotspot/share/gc/shared/genCollectedHeap.cpp b/src/hotspot/share/gc/shared/genCollectedHeap.cpp index ea9afb1ec4a..95e6e34789b 100644 --- a/src/hotspot/share/gc/shared/genCollectedHeap.cpp +++ b/src/hotspot/share/gc/shared/genCollectedHeap.cpp @@ -501,6 +501,14 @@ void GenCollectedHeap::do_collection(bool full, #endif } +void GenCollectedHeap::register_nmethod(nmethod* nm) { + CodeCache::register_scavenge_root_nmethod(nm); +} + +void GenCollectedHeap::verify_nmethod(nmethod* nm) { + CodeCache::verify_scavenge_root_nmethod(nm); +} + HeapWord* GenCollectedHeap::satisfy_failed_allocation(size_t size, bool is_tlab) { return gen_policy()->satisfy_failed_allocation(size, is_tlab); } diff --git a/src/hotspot/share/gc/shared/genCollectedHeap.hpp b/src/hotspot/share/gc/shared/genCollectedHeap.hpp index 48b2371227d..4b51f679623 100644 --- a/src/hotspot/share/gc/shared/genCollectedHeap.hpp +++ b/src/hotspot/share/gc/shared/genCollectedHeap.hpp @@ -229,10 +229,14 @@ public: bool is_in_partial_collection(const void* p); #endif - virtual bool is_scavengable(const void* addr) { - return is_in_young((oop)addr); + virtual bool is_scavengable(oop obj) { + return is_in_young(obj); } + // Optimized nmethod scanning support routines + virtual void register_nmethod(nmethod* nm); + virtual void verify_nmethod(nmethod* nmethod); + // Iteration functions. void oop_iterate_no_header(OopClosure* cl); void oop_iterate(ExtendedOopClosure* cl); diff --git a/src/hotspot/share/oops/oop.inline.hpp b/src/hotspot/share/oops/oop.inline.hpp index 83c5b564b85..88ae9950ead 100644 --- a/src/hotspot/share/oops/oop.inline.hpp +++ b/src/hotspot/share/oops/oop.inline.hpp @@ -539,7 +539,7 @@ bool oopDesc::is_gc_marked() const { } bool oopDesc::is_scavengable() const { - return Universe::heap()->is_scavengable(this); + return Universe::heap()->is_scavengable(oop(const_cast(this))); } // Used by scavengers From 9d33d6f6bb12c359d71bc32c6aa3ad0b22200d7e Mon Sep 17 00:00:00 2001 From: Dean Long Date: Fri, 13 Oct 2017 12:29:45 -0700 Subject: [PATCH 80/80] 8189244: x86: eliminate frame::adjust_unextended_sp() overhead Reviewed-by: kvn --- src/hotspot/cpu/x86/frame_x86.cpp | 4 +++- src/hotspot/cpu/x86/frame_x86.hpp | 2 +- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/src/hotspot/cpu/x86/frame_x86.cpp b/src/hotspot/cpu/x86/frame_x86.cpp index a64ceb2a2ed..918a413adee 100644 --- a/src/hotspot/cpu/x86/frame_x86.cpp +++ b/src/hotspot/cpu/x86/frame_x86.cpp @@ -383,6 +383,7 @@ void frame::verify_deopt_original_pc(CompiledMethod* nm, intptr_t* unextended_sp //------------------------------------------------------------------------------ // frame::adjust_unextended_sp +#ifdef ASSERT void frame::adjust_unextended_sp() { // On x86, sites calling method handle intrinsics and lambda forms are treated // as any other call site. Therefore, no special action is needed when we are @@ -394,11 +395,12 @@ void frame::adjust_unextended_sp() { // If the sender PC is a deoptimization point, get the original PC. if (sender_cm->is_deopt_entry(_pc) || sender_cm->is_deopt_mh_entry(_pc)) { - DEBUG_ONLY(verify_deopt_original_pc(sender_cm, _unextended_sp)); + verify_deopt_original_pc(sender_cm, _unextended_sp); } } } } +#endif //------------------------------------------------------------------------------ // frame::update_map_with_saved_link diff --git a/src/hotspot/cpu/x86/frame_x86.hpp b/src/hotspot/cpu/x86/frame_x86.hpp index dbfcaf70dc3..db8d5dc71ea 100644 --- a/src/hotspot/cpu/x86/frame_x86.hpp +++ b/src/hotspot/cpu/x86/frame_x86.hpp @@ -117,7 +117,7 @@ // original sp we use that convention. intptr_t* _unextended_sp; - void adjust_unextended_sp(); + void adjust_unextended_sp() NOT_DEBUG_RETURN; intptr_t* ptr_at_addr(int offset) const { return (intptr_t*) addr_at(offset);