1 /*
2  * Copyright (c) 2009, 2020, Oracle and/or its affiliates. All rights reserved.
3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4  *
5  * This code is free software; you can redistribute it and/or modify it
6  * under the terms of the GNU General Public License version 2 only, as
7  * published by the Free Software Foundation.
8  *
9  * This code is distributed in the hope that it will be useful, but WITHOUT
10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12  * version 2 for more details (a copy is included in the LICENSE file that
13  * accompanied this code).
14  *
15  * You should have received a copy of the GNU General Public License version
16  * 2 along with this work; if not, write to the Free Software Foundation,
17  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18  *
19  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20  * or visit www.oracle.com if you need additional information or have any
21  * questions.
22  *
23  */
24 
25 #include "precompiled.hpp"
26 #include "compiler/compileLog.hpp"
27 #include "opto/addnode.hpp"
28 #include "opto/callGenerator.hpp"
29 #include "opto/callnode.hpp"
30 #include "opto/divnode.hpp"
31 #include "opto/graphKit.hpp"
32 #include "opto/idealKit.hpp"
33 #include "opto/rootnode.hpp"
34 #include "opto/runtime.hpp"
35 #include "opto/stringopts.hpp"
36 #include "opto/subnode.hpp"
37 #include "runtime/sharedRuntime.hpp"
38 
39 #define __ kit.
40 
41 class StringConcat : public ResourceObj {
42  private:
43   PhaseStringOpts*    _stringopts;
44   Node*               _string_alloc;
45   AllocateNode*       _begin;          // The allocation the begins the pattern
46   CallStaticJavaNode* _end;            // The final call of the pattern.  Will either be
47                                        // SB.toString or or String.<init>(SB.toString)
48   bool                _multiple;       // indicates this is a fusion of two or more
49                                        // separate StringBuilders
50 
51   Node*               _arguments;      // The list of arguments to be concatenated
52   GrowableArray<int>  _mode;           // into a String along with a mode flag
53                                        // indicating how to treat the value.
54   Node_List           _constructors;   // List of constructors (many in case of stacked concat)
55   Node_List           _control;        // List of control nodes that will be deleted
56   Node_List           _uncommon_traps; // Uncommon traps that needs to be rewritten
57                                        // to restart at the initial JVMState.
58 
59  public:
60   // Mode for converting arguments to Strings
61   enum {
62     StringMode,
63     IntMode,
64     CharMode,
65     StringNullCheckMode
66   };
67 
StringConcat(PhaseStringOpts * stringopts,CallStaticJavaNode * end)68   StringConcat(PhaseStringOpts* stringopts, CallStaticJavaNode* end):
69     _stringopts(stringopts),
70     _string_alloc(NULL),
71     _begin(NULL),
72     _end(end),
73     _multiple(false) {
74     _arguments = new Node(1);
75     _arguments->del_req(0);
76   }
77 
78   bool validate_mem_flow();
79   bool validate_control_flow();
80 
merge_add()81   void merge_add() {
82 #if 0
83     // XXX This is place holder code for reusing an existing String
84     // allocation but the logic for checking the state safety is
85     // probably inadequate at the moment.
86     CallProjections endprojs;
87     sc->end()->extract_projections(&endprojs, false);
88     if (endprojs.resproj != NULL) {
89       for (SimpleDUIterator i(endprojs.resproj); i.has_next(); i.next()) {
90         CallStaticJavaNode *use = i.get()->isa_CallStaticJava();
91         if (use != NULL && use->method() != NULL &&
92             use->method()->intrinsic_id() == vmIntrinsics::_String_String &&
93             use->in(TypeFunc::Parms + 1) == endprojs.resproj) {
94           // Found useless new String(sb.toString()) so reuse the newly allocated String
95           // when creating the result instead of allocating a new one.
96           sc->set_string_alloc(use->in(TypeFunc::Parms));
97           sc->set_end(use);
98         }
99       }
100     }
101 #endif
102   }
103 
104   StringConcat* merge(StringConcat* other, Node* arg);
105 
set_allocation(AllocateNode * alloc)106   void set_allocation(AllocateNode* alloc) {
107     _begin = alloc;
108   }
109 
append(Node * value,int mode)110   void append(Node* value, int mode) {
111     _arguments->add_req(value);
112     _mode.append(mode);
113   }
push(Node * value,int mode)114   void push(Node* value, int mode) {
115     _arguments->ins_req(0, value);
116     _mode.insert_before(0, mode);
117   }
118 
push_string(Node * value)119   void push_string(Node* value) {
120     push(value, StringMode);
121   }
push_string_null_check(Node * value)122   void push_string_null_check(Node* value) {
123     push(value, StringNullCheckMode);
124   }
push_int(Node * value)125   void push_int(Node* value) {
126     push(value, IntMode);
127   }
push_char(Node * value)128   void push_char(Node* value) {
129     push(value, CharMode);
130   }
131 
is_SB_toString(Node * call)132   static bool is_SB_toString(Node* call) {
133     if (call->is_CallStaticJava()) {
134       CallStaticJavaNode* csj = call->as_CallStaticJava();
135       ciMethod* m = csj->method();
136       if (m != NULL &&
137           (m->intrinsic_id() == vmIntrinsics::_StringBuilder_toString ||
138            m->intrinsic_id() == vmIntrinsics::_StringBuffer_toString)) {
139         return true;
140       }
141     }
142     return false;
143   }
144 
skip_string_null_check(Node * value)145   static Node* skip_string_null_check(Node* value) {
146     // Look for a diamond shaped Null check of toString() result
147     // (could be code from String.valueOf()):
148     // (Proj == NULL) ? "null":"CastPP(Proj)#NotNULL
149     if (value->is_Phi()) {
150       int true_path = value->as_Phi()->is_diamond_phi();
151       if (true_path != 0) {
152         // phi->region->if_proj->ifnode->bool
153         BoolNode* b = value->in(0)->in(1)->in(0)->in(1)->as_Bool();
154         Node* cmp = b->in(1);
155         Node* v1 = cmp->in(1);
156         Node* v2 = cmp->in(2);
157         // Null check of the return of toString which can simply be skipped.
158         if (b->_test._test == BoolTest::ne &&
159             v2->bottom_type() == TypePtr::NULL_PTR &&
160             value->in(true_path)->Opcode() == Op_CastPP &&
161             value->in(true_path)->in(1) == v1 &&
162             v1->is_Proj() && is_SB_toString(v1->in(0))) {
163           return v1;
164         }
165       }
166     }
167     return value;
168   }
169 
argument(int i)170   Node* argument(int i) {
171     return _arguments->in(i);
172   }
argument_uncast(int i)173   Node* argument_uncast(int i) {
174     Node* arg = argument(i);
175     int amode = mode(i);
176     if (amode == StringConcat::StringMode ||
177         amode == StringConcat::StringNullCheckMode) {
178       arg = skip_string_null_check(arg);
179     }
180     return arg;
181   }
set_argument(int i,Node * value)182   void set_argument(int i, Node* value) {
183     _arguments->set_req(i, value);
184   }
num_arguments()185   int num_arguments() {
186     return _mode.length();
187   }
mode(int i)188   int mode(int i) {
189     return _mode.at(i);
190   }
add_control(Node * ctrl)191   void add_control(Node* ctrl) {
192     assert(!_control.contains(ctrl), "only push once");
193     _control.push(ctrl);
194   }
add_constructor(Node * init)195   void add_constructor(Node* init) {
196     assert(!_constructors.contains(init), "only push once");
197     _constructors.push(init);
198   }
end()199   CallStaticJavaNode* end() { return _end; }
begin()200   AllocateNode* begin() { return _begin; }
string_alloc()201   Node* string_alloc() { return _string_alloc; }
202 
203   void eliminate_unneeded_control();
204   void eliminate_initialize(InitializeNode* init);
205   void eliminate_call(CallNode* call);
206 
maybe_log_transform()207   void maybe_log_transform() {
208     CompileLog* log = _stringopts->C->log();
209     if (log != NULL) {
210       log->head("replace_string_concat arguments='%d' string_alloc='%d' multiple='%d'",
211                 num_arguments(),
212                 _string_alloc != NULL,
213                 _multiple);
214       JVMState* p = _begin->jvms();
215       while (p != NULL) {
216         log->elem("jvms bci='%d' method='%d'", p->bci(), log->identify(p->method()));
217         p = p->caller();
218       }
219       log->tail("replace_string_concat");
220     }
221   }
222 
convert_uncommon_traps(GraphKit & kit,const JVMState * jvms)223   void convert_uncommon_traps(GraphKit& kit, const JVMState* jvms) {
224     for (uint u = 0; u < _uncommon_traps.size(); u++) {
225       Node* uct = _uncommon_traps.at(u);
226 
227       // Build a new call using the jvms state of the allocate
228       address call_addr = SharedRuntime::uncommon_trap_blob()->entry_point();
229       const TypeFunc* call_type = OptoRuntime::uncommon_trap_Type();
230       const TypePtr* no_memory_effects = NULL;
231       Compile* C = _stringopts->C;
232       CallStaticJavaNode* call = new CallStaticJavaNode(call_type, call_addr, "uncommon_trap",
233                                                         jvms->bci(), no_memory_effects);
234       for (int e = 0; e < TypeFunc::Parms; e++) {
235         call->init_req(e, uct->in(e));
236       }
237       // Set the trap request to record intrinsic failure if this trap
238       // is taken too many times.  Ideally we would handle then traps by
239       // doing the original bookkeeping in the MDO so that if it caused
240       // the code to be thrown out we could still recompile and use the
241       // optimization.  Failing the uncommon traps doesn't really mean
242       // that the optimization is a bad idea but there's no other way to
243       // do the MDO updates currently.
244       int trap_request = Deoptimization::make_trap_request(Deoptimization::Reason_intrinsic,
245                                                            Deoptimization::Action_make_not_entrant);
246       call->init_req(TypeFunc::Parms, __ intcon(trap_request));
247       kit.add_safepoint_edges(call);
248 
249       _stringopts->gvn()->transform(call);
250       C->gvn_replace_by(uct, call);
251       uct->disconnect_inputs(NULL, C);
252     }
253   }
254 
cleanup()255   void cleanup() {
256     // disconnect the hook node
257     _arguments->disconnect_inputs(NULL, _stringopts->C);
258   }
259 };
260 
261 
eliminate_unneeded_control()262 void StringConcat::eliminate_unneeded_control() {
263   for (uint i = 0; i < _control.size(); i++) {
264     Node* n = _control.at(i);
265     if (n->is_Allocate()) {
266       eliminate_initialize(n->as_Allocate()->initialization());
267     }
268     if (n->is_Call()) {
269       if (n != _end) {
270         eliminate_call(n->as_Call());
271       }
272     } else if (n->is_IfTrue()) {
273       Compile* C = _stringopts->C;
274       C->gvn_replace_by(n, n->in(0)->in(0));
275       // get rid of the other projection
276       C->gvn_replace_by(n->in(0)->as_If()->proj_out(false), C->top());
277     }
278   }
279 }
280 
281 
merge(StringConcat * other,Node * arg)282 StringConcat* StringConcat::merge(StringConcat* other, Node* arg) {
283   StringConcat* result = new StringConcat(_stringopts, _end);
284   for (uint x = 0; x < _control.size(); x++) {
285     Node* n = _control.at(x);
286     if (n->is_Call()) {
287       result->_control.push(n);
288     }
289   }
290   for (uint x = 0; x < other->_control.size(); x++) {
291     Node* n = other->_control.at(x);
292     if (n->is_Call()) {
293       result->_control.push(n);
294     }
295   }
296   assert(result->_control.contains(other->_end), "what?");
297   assert(result->_control.contains(_begin), "what?");
298   for (int x = 0; x < num_arguments(); x++) {
299     Node* argx = argument_uncast(x);
300     if (argx == arg) {
301       // replace the toString result with the all the arguments that
302       // made up the other StringConcat
303       for (int y = 0; y < other->num_arguments(); y++) {
304         result->append(other->argument(y), other->mode(y));
305       }
306     } else {
307       result->append(argx, mode(x));
308     }
309   }
310   result->set_allocation(other->_begin);
311   for (uint i = 0; i < _constructors.size(); i++) {
312     result->add_constructor(_constructors.at(i));
313   }
314   for (uint i = 0; i < other->_constructors.size(); i++) {
315     result->add_constructor(other->_constructors.at(i));
316   }
317   result->_multiple = true;
318   return result;
319 }
320 
321 
eliminate_call(CallNode * call)322 void StringConcat::eliminate_call(CallNode* call) {
323   Compile* C = _stringopts->C;
324   CallProjections projs;
325   call->extract_projections(&projs, false);
326   if (projs.fallthrough_catchproj != NULL) {
327     C->gvn_replace_by(projs.fallthrough_catchproj, call->in(TypeFunc::Control));
328   }
329   if (projs.fallthrough_memproj != NULL) {
330     C->gvn_replace_by(projs.fallthrough_memproj, call->in(TypeFunc::Memory));
331   }
332   if (projs.catchall_memproj != NULL) {
333     C->gvn_replace_by(projs.catchall_memproj, C->top());
334   }
335   if (projs.fallthrough_ioproj != NULL) {
336     C->gvn_replace_by(projs.fallthrough_ioproj, call->in(TypeFunc::I_O));
337   }
338   if (projs.catchall_ioproj != NULL) {
339     C->gvn_replace_by(projs.catchall_ioproj, C->top());
340   }
341   if (projs.catchall_catchproj != NULL) {
342     // EA can't cope with the partially collapsed graph this
343     // creates so put it on the worklist to be collapsed later.
344     for (SimpleDUIterator i(projs.catchall_catchproj); i.has_next(); i.next()) {
345       Node *use = i.get();
346       int opc = use->Opcode();
347       if (opc == Op_CreateEx || opc == Op_Region) {
348         _stringopts->record_dead_node(use);
349       }
350     }
351     C->gvn_replace_by(projs.catchall_catchproj, C->top());
352   }
353   if (projs.resproj != NULL) {
354     C->gvn_replace_by(projs.resproj, C->top());
355   }
356   C->gvn_replace_by(call, C->top());
357 }
358 
eliminate_initialize(InitializeNode * init)359 void StringConcat::eliminate_initialize(InitializeNode* init) {
360   Compile* C = _stringopts->C;
361 
362   // Eliminate Initialize node.
363   assert(init->outcnt() <= 2, "only a control and memory projection expected");
364   assert(init->req() <= InitializeNode::RawStores, "no pending inits");
365   Node *ctrl_proj = init->proj_out_or_null(TypeFunc::Control);
366   if (ctrl_proj != NULL) {
367     C->gvn_replace_by(ctrl_proj, init->in(TypeFunc::Control));
368   }
369   Node *mem_proj = init->proj_out_or_null(TypeFunc::Memory);
370   if (mem_proj != NULL) {
371     Node *mem = init->in(TypeFunc::Memory);
372     C->gvn_replace_by(mem_proj, mem);
373   }
374   C->gvn_replace_by(init, C->top());
375   init->disconnect_inputs(NULL, C);
376 }
377 
collect_toString_calls()378 Node_List PhaseStringOpts::collect_toString_calls() {
379   Node_List string_calls;
380   Node_List worklist;
381 
382   _visited.clear();
383 
384   // Prime the worklist
385   for (uint i = 1; i < C->root()->len(); i++) {
386     Node* n = C->root()->in(i);
387     if (n != NULL && !_visited.test_set(n->_idx)) {
388       worklist.push(n);
389     }
390   }
391 
392   while (worklist.size() > 0) {
393     Node* ctrl = worklist.pop();
394     if (StringConcat::is_SB_toString(ctrl)) {
395       CallStaticJavaNode* csj = ctrl->as_CallStaticJava();
396       string_calls.push(csj);
397     }
398     if (ctrl->in(0) != NULL && !_visited.test_set(ctrl->in(0)->_idx)) {
399       worklist.push(ctrl->in(0));
400     }
401     if (ctrl->is_Region()) {
402       for (uint i = 1; i < ctrl->len(); i++) {
403         if (ctrl->in(i) != NULL && !_visited.test_set(ctrl->in(i)->_idx)) {
404           worklist.push(ctrl->in(i));
405         }
406       }
407     }
408   }
409   return string_calls;
410 }
411 
412 
build_candidate(CallStaticJavaNode * call)413 StringConcat* PhaseStringOpts::build_candidate(CallStaticJavaNode* call) {
414   ciMethod* m = call->method();
415   ciSymbol* string_sig;
416   ciSymbol* int_sig;
417   ciSymbol* char_sig;
418   if (m->holder() == C->env()->StringBuilder_klass()) {
419     string_sig = ciSymbol::String_StringBuilder_signature();
420     int_sig = ciSymbol::int_StringBuilder_signature();
421     char_sig = ciSymbol::char_StringBuilder_signature();
422   } else if (m->holder() == C->env()->StringBuffer_klass()) {
423     string_sig = ciSymbol::String_StringBuffer_signature();
424     int_sig = ciSymbol::int_StringBuffer_signature();
425     char_sig = ciSymbol::char_StringBuffer_signature();
426   } else {
427     return NULL;
428   }
429 #ifndef PRODUCT
430   if (PrintOptimizeStringConcat) {
431     tty->print("considering toString call in ");
432     call->jvms()->dump_spec(tty); tty->cr();
433   }
434 #endif
435 
436   StringConcat* sc = new StringConcat(this, call);
437 
438   AllocateNode* alloc = NULL;
439   InitializeNode* init = NULL;
440 
441   // possible opportunity for StringBuilder fusion
442   CallStaticJavaNode* cnode = call;
443   while (cnode) {
444     Node* recv = cnode->in(TypeFunc::Parms)->uncast();
445     if (recv->is_Proj()) {
446       recv = recv->in(0);
447     }
448     cnode = recv->isa_CallStaticJava();
449     if (cnode == NULL) {
450       alloc = recv->isa_Allocate();
451       if (alloc == NULL) {
452         break;
453       }
454       // Find the constructor call
455       Node* result = alloc->result_cast();
456       if (result == NULL || !result->is_CheckCastPP() || alloc->in(TypeFunc::Memory)->is_top()) {
457         // strange looking allocation
458 #ifndef PRODUCT
459         if (PrintOptimizeStringConcat) {
460           tty->print("giving up because allocation looks strange ");
461           alloc->jvms()->dump_spec(tty); tty->cr();
462         }
463 #endif
464         break;
465       }
466       Node* constructor = NULL;
467       for (SimpleDUIterator i(result); i.has_next(); i.next()) {
468         CallStaticJavaNode *use = i.get()->isa_CallStaticJava();
469         if (use != NULL &&
470             use->method() != NULL &&
471             !use->method()->is_static() &&
472             use->method()->name() == ciSymbol::object_initializer_name() &&
473             use->method()->holder() == m->holder()) {
474           // Matched the constructor.
475           ciSymbol* sig = use->method()->signature()->as_symbol();
476           if (sig == ciSymbol::void_method_signature() ||
477               sig == ciSymbol::int_void_signature() ||
478               sig == ciSymbol::string_void_signature()) {
479             if (sig == ciSymbol::string_void_signature()) {
480               // StringBuilder(String) so pick this up as the first argument
481               assert(use->in(TypeFunc::Parms + 1) != NULL, "what?");
482               const Type* type = _gvn->type(use->in(TypeFunc::Parms + 1));
483               if (type == TypePtr::NULL_PTR) {
484                 // StringBuilder(null) throws exception.
485 #ifndef PRODUCT
486                 if (PrintOptimizeStringConcat) {
487                   tty->print("giving up because StringBuilder(null) throws exception");
488                   alloc->jvms()->dump_spec(tty); tty->cr();
489                 }
490 #endif
491                 return NULL;
492               }
493               // StringBuilder(str) argument needs null check.
494               sc->push_string_null_check(use->in(TypeFunc::Parms + 1));
495             }
496             // The int variant takes an initial size for the backing
497             // array so just treat it like the void version.
498             constructor = use;
499           } else {
500 #ifndef PRODUCT
501             if (PrintOptimizeStringConcat) {
502               tty->print("unexpected constructor signature: %s", sig->as_utf8());
503             }
504 #endif
505           }
506           break;
507         }
508       }
509       if (constructor == NULL) {
510         // couldn't find constructor
511 #ifndef PRODUCT
512         if (PrintOptimizeStringConcat) {
513           tty->print("giving up because couldn't find constructor ");
514           alloc->jvms()->dump_spec(tty); tty->cr();
515         }
516 #endif
517         break;
518       }
519 
520       // Walked all the way back and found the constructor call so see
521       // if this call converted into a direct string concatenation.
522       sc->add_control(call);
523       sc->add_control(constructor);
524       sc->add_control(alloc);
525       sc->set_allocation(alloc);
526       sc->add_constructor(constructor);
527       if (sc->validate_control_flow() && sc->validate_mem_flow()) {
528         return sc;
529       } else {
530         return NULL;
531       }
532     } else if (cnode->method() == NULL) {
533       break;
534     } else if (!cnode->method()->is_static() &&
535                cnode->method()->holder() == m->holder() &&
536                cnode->method()->name() == ciSymbol::append_name() &&
537                (cnode->method()->signature()->as_symbol() == string_sig ||
538                 cnode->method()->signature()->as_symbol() == char_sig ||
539                 cnode->method()->signature()->as_symbol() == int_sig)) {
540       sc->add_control(cnode);
541       Node* arg = cnode->in(TypeFunc::Parms + 1);
542       if (arg == NULL || arg->is_top()) {
543 #ifndef PRODUCT
544         if (PrintOptimizeStringConcat) {
545           tty->print("giving up because the call is effectively dead");
546           cnode->jvms()->dump_spec(tty); tty->cr();
547         }
548 #endif
549         break;
550       }
551       if (cnode->method()->signature()->as_symbol() == int_sig) {
552         sc->push_int(arg);
553       } else if (cnode->method()->signature()->as_symbol() == char_sig) {
554         sc->push_char(arg);
555       } else {
556         if (arg->is_Proj() && arg->in(0)->is_CallStaticJava()) {
557           CallStaticJavaNode* csj = arg->in(0)->as_CallStaticJava();
558           if (csj->method() != NULL &&
559               csj->method()->intrinsic_id() == vmIntrinsics::_Integer_toString &&
560               arg->outcnt() == 1) {
561             // _control is the list of StringBuilder calls nodes which
562             // will be replaced by new String code after this optimization.
563             // Integer::toString() call is not part of StringBuilder calls
564             // chain. It could be eliminated only if its result is used
565             // only by this SB calls chain.
566             // Another limitation: it should be used only once because
567             // it is unknown that it is used only by this SB calls chain
568             // until all related SB calls nodes are collected.
569             assert(arg->unique_out() == cnode, "sanity");
570             sc->add_control(csj);
571             sc->push_int(csj->in(TypeFunc::Parms));
572             continue;
573           }
574         }
575         sc->push_string(arg);
576       }
577       continue;
578     } else {
579       // some unhandled signature
580 #ifndef PRODUCT
581       if (PrintOptimizeStringConcat) {
582         tty->print("giving up because encountered unexpected signature ");
583         cnode->tf()->dump(); tty->cr();
584         cnode->in(TypeFunc::Parms + 1)->dump();
585       }
586 #endif
587       break;
588     }
589   }
590   return NULL;
591 }
592 
593 
PhaseStringOpts(PhaseGVN * gvn,Unique_Node_List *)594 PhaseStringOpts::PhaseStringOpts(PhaseGVN* gvn, Unique_Node_List*):
595   Phase(StringOpts),
596   _gvn(gvn),
597   _visited(Thread::current()->resource_area()) {
598 
599   assert(OptimizeStringConcat, "shouldn't be here");
600 
601   size_table_field = C->env()->Integer_klass()->get_field_by_name(ciSymbol::make("sizeTable"),
602                                                                   ciSymbol::make("[I"), true);
603   if (size_table_field == NULL) {
604     // Something wrong so give up.
605     assert(false, "why can't we find Integer.sizeTable?");
606     return;
607   }
608 
609   // Collect the types needed to talk about the various slices of memory
610   byte_adr_idx = C->get_alias_index(TypeAryPtr::BYTES);
611 
612   // For each locally allocated StringBuffer see if the usages can be
613   // collapsed into a single String construction.
614 
615   // Run through the list of allocation looking for SB.toString to see
616   // if it's possible to fuse the usage of the SB into a single String
617   // construction.
618   GrowableArray<StringConcat*> concats;
619   Node_List toStrings = collect_toString_calls();
620   while (toStrings.size() > 0) {
621     StringConcat* sc = build_candidate(toStrings.pop()->as_CallStaticJava());
622     if (sc != NULL) {
623       concats.push(sc);
624     }
625   }
626 
627   // try to coalesce separate concats
628  restart:
629   for (int c = 0; c < concats.length(); c++) {
630     StringConcat* sc = concats.at(c);
631     for (int i = 0; i < sc->num_arguments(); i++) {
632       Node* arg = sc->argument_uncast(i);
633       if (arg->is_Proj() && StringConcat::is_SB_toString(arg->in(0))) {
634         CallStaticJavaNode* csj = arg->in(0)->as_CallStaticJava();
635         for (int o = 0; o < concats.length(); o++) {
636           if (c == o) continue;
637           StringConcat* other = concats.at(o);
638           if (other->end() == csj) {
639 #ifndef PRODUCT
640             if (PrintOptimizeStringConcat) {
641               tty->print_cr("considering stacked concats");
642             }
643 #endif
644 
645             StringConcat* merged = sc->merge(other, arg);
646             if (merged->validate_control_flow() && merged->validate_mem_flow()) {
647 #ifndef PRODUCT
648               if (PrintOptimizeStringConcat) {
649                 tty->print_cr("stacking would succeed");
650               }
651 #endif
652               if (c < o) {
653                 concats.remove_at(o);
654                 concats.at_put(c, merged);
655               } else {
656                 concats.remove_at(c);
657                 concats.at_put(o, merged);
658               }
659               goto restart;
660             } else {
661 #ifndef PRODUCT
662               if (PrintOptimizeStringConcat) {
663                 tty->print_cr("stacking would fail");
664               }
665 #endif
666             }
667           }
668         }
669       }
670     }
671   }
672 
673 
674   for (int c = 0; c < concats.length(); c++) {
675     StringConcat* sc = concats.at(c);
676     replace_string_concat(sc);
677   }
678 
679   remove_dead_nodes();
680 }
681 
record_dead_node(Node * dead)682 void PhaseStringOpts::record_dead_node(Node* dead) {
683   dead_worklist.push(dead);
684 }
685 
remove_dead_nodes()686 void PhaseStringOpts::remove_dead_nodes() {
687   // Delete any dead nodes to make things clean enough that escape
688   // analysis doesn't get unhappy.
689   while (dead_worklist.size() > 0) {
690     Node* use = dead_worklist.pop();
691     int opc = use->Opcode();
692     switch (opc) {
693       case Op_Region: {
694         uint i = 1;
695         for (i = 1; i < use->req(); i++) {
696           if (use->in(i) != C->top()) {
697             break;
698           }
699         }
700         if (i >= use->req()) {
701           for (SimpleDUIterator i(use); i.has_next(); i.next()) {
702             Node* m = i.get();
703             if (m->is_Phi()) {
704               dead_worklist.push(m);
705             }
706           }
707           C->gvn_replace_by(use, C->top());
708         }
709         break;
710       }
711       case Op_AddP:
712       case Op_CreateEx: {
713         // Recurisvely clean up references to CreateEx so EA doesn't
714         // get unhappy about the partially collapsed graph.
715         for (SimpleDUIterator i(use); i.has_next(); i.next()) {
716           Node* m = i.get();
717           if (m->is_AddP()) {
718             dead_worklist.push(m);
719           }
720         }
721         C->gvn_replace_by(use, C->top());
722         break;
723       }
724       case Op_Phi:
725         if (use->in(0) == C->top()) {
726           C->gvn_replace_by(use, C->top());
727         }
728         break;
729     }
730   }
731 }
732 
733 
validate_mem_flow()734 bool StringConcat::validate_mem_flow() {
735   Compile* C = _stringopts->C;
736 
737   for (uint i = 0; i < _control.size(); i++) {
738 #ifndef PRODUCT
739     Node_List path;
740 #endif
741     Node* curr = _control.at(i);
742     if (curr->is_Call() && curr != _begin) { // For all calls except the first allocation
743       // Now here's the main invariant in our case:
744       // For memory between the constructor, and appends, and toString we should only see bottom memory,
745       // produced by the previous call we know about.
746       if (!_constructors.contains(curr)) {
747         NOT_PRODUCT(path.push(curr);)
748         Node* mem = curr->in(TypeFunc::Memory);
749         assert(mem != NULL, "calls should have memory edge");
750         assert(!mem->is_Phi(), "should be handled by control flow validation");
751         NOT_PRODUCT(path.push(mem);)
752         while (mem->is_MergeMem()) {
753           for (uint i = 1; i < mem->req(); i++) {
754             if (i != Compile::AliasIdxBot && mem->in(i) != C->top()) {
755 #ifndef PRODUCT
756               if (PrintOptimizeStringConcat) {
757                 tty->print("fusion has incorrect memory flow (side effects) for ");
758                 _begin->jvms()->dump_spec(tty); tty->cr();
759                 path.dump();
760               }
761 #endif
762               return false;
763             }
764           }
765           // skip through a potential MergeMem chain, linked through Bot
766           mem = mem->in(Compile::AliasIdxBot);
767           NOT_PRODUCT(path.push(mem);)
768         }
769         // now let it fall through, and see if we have a projection
770         if (mem->is_Proj()) {
771           // Should point to a previous known call
772           Node *prev = mem->in(0);
773           NOT_PRODUCT(path.push(prev);)
774           if (!prev->is_Call() || !_control.contains(prev)) {
775 #ifndef PRODUCT
776             if (PrintOptimizeStringConcat) {
777               tty->print("fusion has incorrect memory flow (unknown call) for ");
778               _begin->jvms()->dump_spec(tty); tty->cr();
779               path.dump();
780             }
781 #endif
782             return false;
783           }
784         } else {
785           assert(mem->is_Store() || mem->is_LoadStore(), "unexpected node type: %s", mem->Name());
786 #ifndef PRODUCT
787           if (PrintOptimizeStringConcat) {
788             tty->print("fusion has incorrect memory flow (unexpected source) for ");
789             _begin->jvms()->dump_spec(tty); tty->cr();
790             path.dump();
791           }
792 #endif
793           return false;
794         }
795       } else {
796         // For memory that feeds into constructors it's more complicated.
797         // However the advantage is that any side effect that happens between the Allocate/Initialize and
798         // the constructor will have to be control-dependent on Initialize.
799         // So we actually don't have to do anything, since it's going to be caught by the control flow
800         // analysis.
801 #ifdef ASSERT
802         // Do a quick verification of the control pattern between the constructor and the initialize node
803         assert(curr->is_Call(), "constructor should be a call");
804         // Go up the control starting from the constructor call
805         Node* ctrl = curr->in(0);
806         IfNode* iff = NULL;
807         RegionNode* copy = NULL;
808 
809         while (true) {
810           // skip known check patterns
811           if (ctrl->is_Region()) {
812             if (ctrl->as_Region()->is_copy()) {
813               copy = ctrl->as_Region();
814               ctrl = copy->is_copy();
815             } else { // a cast
816               assert(ctrl->req() == 3 &&
817                      ctrl->in(1) != NULL && ctrl->in(1)->is_Proj() &&
818                      ctrl->in(2) != NULL && ctrl->in(2)->is_Proj() &&
819                      ctrl->in(1)->in(0) == ctrl->in(2)->in(0) &&
820                      ctrl->in(1)->in(0) != NULL && ctrl->in(1)->in(0)->is_If(),
821                      "must be a simple diamond");
822               Node* true_proj = ctrl->in(1)->is_IfTrue() ? ctrl->in(1) : ctrl->in(2);
823               for (SimpleDUIterator i(true_proj); i.has_next(); i.next()) {
824                 Node* use = i.get();
825                 assert(use == ctrl || use->is_ConstraintCast(),
826                        "unexpected user: %s", use->Name());
827               }
828 
829               iff = ctrl->in(1)->in(0)->as_If();
830               ctrl = iff->in(0);
831             }
832           } else if (ctrl->is_IfTrue()) { // null checks, class checks
833             iff = ctrl->in(0)->as_If();
834             // Verify that the other arm is an uncommon trap
835             Node* otherproj = iff->proj_out(1 - ctrl->as_Proj()->_con);
836             CallStaticJavaNode* call = otherproj->unique_out()->isa_CallStaticJava();
837             assert(strcmp(call->_name, "uncommon_trap") == 0, "must be uncommon trap");
838             ctrl = iff->in(0);
839           } else {
840             break;
841           }
842         }
843 
844         assert(ctrl->is_Proj(), "must be a projection");
845         assert(ctrl->in(0)->is_Initialize(), "should be initialize");
846         for (SimpleDUIterator i(ctrl); i.has_next(); i.next()) {
847           Node* use = i.get();
848           assert(use == copy || use == iff || use == curr || use->is_CheckCastPP() || use->is_Load(),
849                  "unexpected user: %s", use->Name());
850         }
851 #endif // ASSERT
852       }
853     }
854   }
855 
856 #ifndef PRODUCT
857   if (PrintOptimizeStringConcat) {
858     tty->print("fusion has correct memory flow for ");
859     _begin->jvms()->dump_spec(tty); tty->cr();
860     tty->cr();
861   }
862 #endif
863   return true;
864 }
865 
validate_control_flow()866 bool StringConcat::validate_control_flow() {
867   // We found all the calls and arguments now lets see if it's
868   // safe to transform the graph as we would expect.
869 
870   // Check to see if this resulted in too many uncommon traps previously
871   if (Compile::current()->too_many_traps(_begin->jvms()->method(), _begin->jvms()->bci(),
872                         Deoptimization::Reason_intrinsic)) {
873     return false;
874   }
875 
876   // Walk backwards over the control flow from toString to the
877   // allocation and make sure all the control flow is ok.  This
878   // means it's either going to be eliminated once the calls are
879   // removed or it can safely be transformed into an uncommon
880   // trap.
881 
882   int null_check_count = 0;
883   Unique_Node_List ctrl_path;
884 
885   assert(_control.contains(_begin), "missing");
886   assert(_control.contains(_end), "missing");
887 
888   // Collect the nodes that we know about and will eliminate into ctrl_path
889   for (uint i = 0; i < _control.size(); i++) {
890     // Push the call and it's control projection
891     Node* n = _control.at(i);
892     if (n->is_Allocate()) {
893       AllocateNode* an = n->as_Allocate();
894       InitializeNode* init = an->initialization();
895       ctrl_path.push(init);
896       ctrl_path.push(init->as_Multi()->proj_out(0));
897     }
898     if (n->is_Call()) {
899       CallNode* cn = n->as_Call();
900       ctrl_path.push(cn);
901       ctrl_path.push(cn->proj_out(0));
902       ctrl_path.push(cn->proj_out(0)->unique_out());
903       Node* catchproj = cn->proj_out(0)->unique_out()->as_Catch()->proj_out_or_null(0);
904       if (catchproj != NULL) {
905         ctrl_path.push(catchproj);
906       }
907     } else {
908       ShouldNotReachHere();
909     }
910   }
911 
912   // Skip backwards through the control checking for unexpected control flow
913   Node* ptr = _end;
914   bool fail = false;
915   while (ptr != _begin) {
916     if (ptr->is_Call() && ctrl_path.member(ptr)) {
917       ptr = ptr->in(0);
918     } else if (ptr->is_CatchProj() && ctrl_path.member(ptr)) {
919       ptr = ptr->in(0)->in(0)->in(0);
920       assert(ctrl_path.member(ptr), "should be a known piece of control");
921     } else if (ptr->is_IfTrue()) {
922       IfNode* iff = ptr->in(0)->as_If();
923       BoolNode* b = iff->in(1)->isa_Bool();
924 
925       if (b == NULL) {
926 #ifndef PRODUCT
927         if (PrintOptimizeStringConcat) {
928           tty->print_cr("unexpected input to IfNode");
929           iff->in(1)->dump();
930           tty->cr();
931         }
932 #endif
933         fail = true;
934         break;
935       }
936 
937       Node* cmp = b->in(1);
938       Node* v1 = cmp->in(1);
939       Node* v2 = cmp->in(2);
940       Node* otherproj = iff->proj_out(1 - ptr->as_Proj()->_con);
941 
942       // Null check of the return of append which can simply be eliminated
943       if (b->_test._test == BoolTest::ne &&
944           v2->bottom_type() == TypePtr::NULL_PTR &&
945           v1->is_Proj() && ctrl_path.member(v1->in(0))) {
946         // NULL check of the return value of the append
947         null_check_count++;
948         if (otherproj->outcnt() == 1) {
949           CallStaticJavaNode* call = otherproj->unique_out()->isa_CallStaticJava();
950           if (call != NULL && call->_name != NULL && strcmp(call->_name, "uncommon_trap") == 0) {
951             ctrl_path.push(call);
952           }
953         }
954         _control.push(ptr);
955         ptr = ptr->in(0)->in(0);
956         continue;
957       }
958 
959       // A test which leads to an uncommon trap which should be safe.
960       // Later this trap will be converted into a trap that restarts
961       // at the beginning.
962       if (otherproj->outcnt() == 1) {
963         CallStaticJavaNode* call = otherproj->unique_out()->isa_CallStaticJava();
964         if (call != NULL && call->_name != NULL && strcmp(call->_name, "uncommon_trap") == 0) {
965           // control flow leads to uct so should be ok
966           _uncommon_traps.push(call);
967           ctrl_path.push(call);
968           ptr = ptr->in(0)->in(0);
969           continue;
970         }
971       }
972 
973 #ifndef PRODUCT
974       // Some unexpected control flow we don't know how to handle.
975       if (PrintOptimizeStringConcat) {
976         tty->print_cr("failing with unknown test");
977         b->dump();
978         cmp->dump();
979         v1->dump();
980         v2->dump();
981         tty->cr();
982       }
983 #endif
984       fail = true;
985       break;
986     } else if (ptr->is_Proj() && ptr->in(0)->is_Initialize()) {
987       ptr = ptr->in(0)->in(0);
988     } else if (ptr->is_Region()) {
989       Node* copy = ptr->as_Region()->is_copy();
990       if (copy != NULL) {
991         ptr = copy;
992         continue;
993       }
994       if (ptr->req() == 3 &&
995           ptr->in(1) != NULL && ptr->in(1)->is_Proj() &&
996           ptr->in(2) != NULL && ptr->in(2)->is_Proj() &&
997           ptr->in(1)->in(0) == ptr->in(2)->in(0) &&
998           ptr->in(1)->in(0) != NULL && ptr->in(1)->in(0)->is_If()) {
999         // Simple diamond.
1000         // XXX should check for possibly merging stores.  simple data merges are ok.
1001         // The IGVN will make this simple diamond go away when it
1002         // transforms the Region. Make sure it sees it.
1003         Compile::current()->record_for_igvn(ptr);
1004         ptr = ptr->in(1)->in(0)->in(0);
1005         continue;
1006       }
1007 #ifndef PRODUCT
1008       if (PrintOptimizeStringConcat) {
1009         tty->print_cr("fusion would fail for region");
1010         _begin->dump();
1011         ptr->dump(2);
1012       }
1013 #endif
1014       fail = true;
1015       break;
1016     } else {
1017       // other unknown control
1018       if (!fail) {
1019 #ifndef PRODUCT
1020         if (PrintOptimizeStringConcat) {
1021           tty->print_cr("fusion would fail for");
1022           _begin->dump();
1023         }
1024 #endif
1025         fail = true;
1026       }
1027 #ifndef PRODUCT
1028       if (PrintOptimizeStringConcat) {
1029         ptr->dump();
1030       }
1031 #endif
1032       ptr = ptr->in(0);
1033     }
1034   }
1035 #ifndef PRODUCT
1036   if (PrintOptimizeStringConcat && fail) {
1037     tty->cr();
1038   }
1039 #endif
1040   if (fail) return !fail;
1041 
1042   // Validate that all these results produced are contained within
1043   // this cluster of objects.  First collect all the results produced
1044   // by calls in the region.
1045   _stringopts->_visited.clear();
1046   Node_List worklist;
1047   Node* final_result = _end->proj_out_or_null(TypeFunc::Parms);
1048   for (uint i = 0; i < _control.size(); i++) {
1049     CallNode* cnode = _control.at(i)->isa_Call();
1050     if (cnode != NULL) {
1051       _stringopts->_visited.test_set(cnode->_idx);
1052     }
1053     Node* result = cnode != NULL ? cnode->proj_out_or_null(TypeFunc::Parms) : NULL;
1054     if (result != NULL && result != final_result) {
1055       worklist.push(result);
1056     }
1057   }
1058 
1059   Node* last_result = NULL;
1060   while (worklist.size() > 0) {
1061     Node* result = worklist.pop();
1062     if (_stringopts->_visited.test_set(result->_idx))
1063       continue;
1064     for (SimpleDUIterator i(result); i.has_next(); i.next()) {
1065       Node *use = i.get();
1066       if (ctrl_path.member(use)) {
1067         // already checked this
1068         continue;
1069       }
1070       int opc = use->Opcode();
1071       if (opc == Op_CmpP || opc == Op_Node) {
1072         ctrl_path.push(use);
1073         continue;
1074       }
1075       if (opc == Op_CastPP || opc == Op_CheckCastPP) {
1076         for (SimpleDUIterator j(use); j.has_next(); j.next()) {
1077           worklist.push(j.get());
1078         }
1079         worklist.push(use->in(1));
1080         ctrl_path.push(use);
1081         continue;
1082       }
1083 #ifndef PRODUCT
1084       if (PrintOptimizeStringConcat) {
1085         if (result != last_result) {
1086           last_result = result;
1087           tty->print_cr("extra uses for result:");
1088           last_result->dump();
1089         }
1090         use->dump();
1091       }
1092 #endif
1093       fail = true;
1094       break;
1095     }
1096   }
1097 
1098 #ifndef PRODUCT
1099   if (PrintOptimizeStringConcat && !fail) {
1100     ttyLocker ttyl;
1101     tty->cr();
1102     tty->print("fusion has correct control flow (%d %d) for ", null_check_count, _uncommon_traps.size());
1103     _begin->jvms()->dump_spec(tty); tty->cr();
1104     for (int i = 0; i < num_arguments(); i++) {
1105       argument(i)->dump();
1106     }
1107     _control.dump();
1108     tty->cr();
1109   }
1110 #endif
1111 
1112   return !fail;
1113 }
1114 
fetch_static_field(GraphKit & kit,ciField * field)1115 Node* PhaseStringOpts::fetch_static_field(GraphKit& kit, ciField* field) {
1116   const TypeInstPtr* mirror_type = TypeInstPtr::make(field->holder()->java_mirror());
1117   Node* klass_node = __ makecon(mirror_type);
1118   BasicType bt = field->layout_type();
1119   ciType* field_klass = field->type();
1120 
1121   const Type *type;
1122   if( bt == T_OBJECT ) {
1123     if (!field->type()->is_loaded()) {
1124       type = TypeInstPtr::BOTTOM;
1125     } else if (field->is_static_constant()) {
1126       // This can happen if the constant oop is non-perm.
1127       ciObject* con = field->constant_value().as_object();
1128       // Do not "join" in the previous type; it doesn't add value,
1129       // and may yield a vacuous result if the field is of interface type.
1130       type = TypeOopPtr::make_from_constant(con, true)->isa_oopptr();
1131       assert(type != NULL, "field singleton type must be consistent");
1132       return __ makecon(type);
1133     } else {
1134       type = TypeOopPtr::make_from_klass(field_klass->as_klass());
1135     }
1136   } else {
1137     type = Type::get_const_basic_type(bt);
1138   }
1139 
1140   return kit.make_load(NULL, kit.basic_plus_adr(klass_node, field->offset_in_bytes()),
1141                        type, T_OBJECT,
1142                        C->get_alias_index(mirror_type->add_offset(field->offset_in_bytes())),
1143                        MemNode::unordered);
1144 }
1145 
int_stringSize(GraphKit & kit,Node * arg)1146 Node* PhaseStringOpts::int_stringSize(GraphKit& kit, Node* arg) {
1147   if (arg->is_Con()) {
1148     // Constant integer. Compute constant length using Integer.sizeTable
1149     int arg_val = arg->get_int();
1150     int count = 1;
1151     if (arg_val < 0) {
1152       arg_val = -arg_val;
1153       count++;
1154     }
1155 
1156     ciArray* size_table = (ciArray*)size_table_field->constant_value().as_object();
1157     for (int i = 0; i < size_table->length(); i++) {
1158       if (arg_val <= size_table->element_value(i).as_int()) {
1159         count += i;
1160         break;
1161       }
1162     }
1163     return __ intcon(count);
1164   }
1165 
1166   RegionNode *final_merge = new RegionNode(3);
1167   kit.gvn().set_type(final_merge, Type::CONTROL);
1168   Node* final_size = new PhiNode(final_merge, TypeInt::INT);
1169   kit.gvn().set_type(final_size, TypeInt::INT);
1170 
1171   IfNode* iff = kit.create_and_map_if(kit.control(),
1172                                       __ Bool(__ CmpI(arg, __ intcon(0x80000000)), BoolTest::ne),
1173                                       PROB_FAIR, COUNT_UNKNOWN);
1174   Node* is_min = __ IfFalse(iff);
1175   final_merge->init_req(1, is_min);
1176   final_size->init_req(1, __ intcon(11));
1177 
1178   kit.set_control(__ IfTrue(iff));
1179   if (kit.stopped()) {
1180     final_merge->init_req(2, C->top());
1181     final_size->init_req(2, C->top());
1182   } else {
1183 
1184     // int size = (i < 0) ? stringSize(-i) + 1 : stringSize(i);
1185     RegionNode *r = new RegionNode(3);
1186     kit.gvn().set_type(r, Type::CONTROL);
1187     Node *phi = new PhiNode(r, TypeInt::INT);
1188     kit.gvn().set_type(phi, TypeInt::INT);
1189     Node *size = new PhiNode(r, TypeInt::INT);
1190     kit.gvn().set_type(size, TypeInt::INT);
1191     Node* chk = __ CmpI(arg, __ intcon(0));
1192     Node* p = __ Bool(chk, BoolTest::lt);
1193     IfNode* iff = kit.create_and_map_if(kit.control(), p, PROB_FAIR, COUNT_UNKNOWN);
1194     Node* lessthan = __ IfTrue(iff);
1195     Node* greaterequal = __ IfFalse(iff);
1196     r->init_req(1, lessthan);
1197     phi->init_req(1, __ SubI(__ intcon(0), arg));
1198     size->init_req(1, __ intcon(1));
1199     r->init_req(2, greaterequal);
1200     phi->init_req(2, arg);
1201     size->init_req(2, __ intcon(0));
1202     kit.set_control(r);
1203     C->record_for_igvn(r);
1204     C->record_for_igvn(phi);
1205     C->record_for_igvn(size);
1206 
1207     // for (int i=0; ; i++)
1208     //   if (x <= sizeTable[i])
1209     //     return i+1;
1210 
1211     // Add loop predicate first.
1212     kit.add_empty_predicates();
1213 
1214     RegionNode *loop = new RegionNode(3);
1215     loop->init_req(1, kit.control());
1216     kit.gvn().set_type(loop, Type::CONTROL);
1217 
1218     Node *index = new PhiNode(loop, TypeInt::INT);
1219     index->init_req(1, __ intcon(0));
1220     kit.gvn().set_type(index, TypeInt::INT);
1221     kit.set_control(loop);
1222     Node* sizeTable = fetch_static_field(kit, size_table_field);
1223 
1224     Node* value = kit.load_array_element(NULL, sizeTable, index, TypeAryPtr::INTS);
1225     C->record_for_igvn(value);
1226     Node* limit = __ CmpI(phi, value);
1227     Node* limitb = __ Bool(limit, BoolTest::le);
1228     IfNode* iff2 = kit.create_and_map_if(kit.control(), limitb, PROB_MIN, COUNT_UNKNOWN);
1229     Node* lessEqual = __ IfTrue(iff2);
1230     Node* greater = __ IfFalse(iff2);
1231 
1232     loop->init_req(2, greater);
1233     index->init_req(2, __ AddI(index, __ intcon(1)));
1234 
1235     kit.set_control(lessEqual);
1236     C->record_for_igvn(loop);
1237     C->record_for_igvn(index);
1238 
1239     final_merge->init_req(2, kit.control());
1240     final_size->init_req(2, __ AddI(__ AddI(index, size), __ intcon(1)));
1241   }
1242 
1243   kit.set_control(final_merge);
1244   C->record_for_igvn(final_merge);
1245   C->record_for_igvn(final_size);
1246 
1247   return final_size;
1248 }
1249 
1250 // Simplified version of Integer.getChars
getChars(GraphKit & kit,Node * arg,Node * dst_array,BasicType bt,Node * end,Node * final_merge,Node * final_mem,int merge_index)1251 void PhaseStringOpts::getChars(GraphKit& kit, Node* arg, Node* dst_array, BasicType bt, Node* end, Node* final_merge, Node* final_mem, int merge_index) {
1252   // if (i < 0) {
1253   //     sign = '-';
1254   //     i = -i;
1255   // }
1256   IfNode* iff = kit.create_and_map_if(kit.control(), __ Bool(__ CmpI(arg, __ intcon(0)), BoolTest::lt),
1257                                       PROB_FAIR, COUNT_UNKNOWN);
1258 
1259   RegionNode* merge = new RegionNode(3);
1260   kit.gvn().set_type(merge, Type::CONTROL);
1261   Node* i = new PhiNode(merge, TypeInt::INT);
1262   kit.gvn().set_type(i, TypeInt::INT);
1263   Node* sign = new PhiNode(merge, TypeInt::INT);
1264   kit.gvn().set_type(sign, TypeInt::INT);
1265 
1266   merge->init_req(1, __ IfTrue(iff));
1267   i->init_req(1, __ SubI(__ intcon(0), arg));
1268   sign->init_req(1, __ intcon('-'));
1269   merge->init_req(2, __ IfFalse(iff));
1270   i->init_req(2, arg);
1271   sign->init_req(2, __ intcon(0));
1272 
1273   kit.set_control(merge);
1274 
1275   C->record_for_igvn(merge);
1276   C->record_for_igvn(i);
1277   C->record_for_igvn(sign);
1278 
1279   // for (;;) {
1280   //     q = i / 10;
1281   //     r = i - ((q << 3) + (q << 1));  // r = i-(q*10) ...
1282   //     buf [--charPos] = digits [r];
1283   //     i = q;
1284   //     if (i == 0) break;
1285   // }
1286 
1287   // Add loop predicate first.
1288   kit.add_empty_predicates();
1289 
1290   RegionNode* head = new RegionNode(3);
1291   head->init_req(1, kit.control());
1292 
1293   kit.gvn().set_type(head, Type::CONTROL);
1294   Node* i_phi = new PhiNode(head, TypeInt::INT);
1295   i_phi->init_req(1, i);
1296   kit.gvn().set_type(i_phi, TypeInt::INT);
1297   Node* charPos = new PhiNode(head, TypeInt::INT);
1298   charPos->init_req(1, end);
1299   kit.gvn().set_type(charPos, TypeInt::INT);
1300   Node* mem = PhiNode::make(head, kit.memory(byte_adr_idx), Type::MEMORY, TypeAryPtr::BYTES);
1301   kit.gvn().set_type(mem, Type::MEMORY);
1302 
1303   kit.set_control(head);
1304   kit.set_memory(mem, byte_adr_idx);
1305 
1306   Node* q = __ DivI(kit.null(), i_phi, __ intcon(10));
1307   Node* r = __ SubI(i_phi, __ AddI(__ LShiftI(q, __ intcon(3)),
1308                                    __ LShiftI(q, __ intcon(1))));
1309   Node* index = __ SubI(charPos, __ intcon((bt == T_BYTE) ? 1 : 2));
1310   Node* ch = __ AddI(r, __ intcon('0'));
1311   Node* st = __ store_to_memory(kit.control(), kit.array_element_address(dst_array, index, T_BYTE),
1312                                 ch, bt, byte_adr_idx, MemNode::unordered, (bt != T_BYTE) /* mismatched */);
1313 
1314   iff = kit.create_and_map_if(head, __ Bool(__ CmpI(q, __ intcon(0)), BoolTest::ne),
1315                               PROB_FAIR, COUNT_UNKNOWN);
1316   Node* ne = __ IfTrue(iff);
1317   Node* eq = __ IfFalse(iff);
1318 
1319   head->init_req(2, ne);
1320   mem->init_req(2, st);
1321 
1322   i_phi->init_req(2, q);
1323   charPos->init_req(2, index);
1324   charPos = index;
1325 
1326   kit.set_control(eq);
1327   kit.set_memory(st, byte_adr_idx);
1328 
1329   C->record_for_igvn(head);
1330   C->record_for_igvn(mem);
1331   C->record_for_igvn(i_phi);
1332   C->record_for_igvn(charPos);
1333 
1334   // if (sign != 0) {
1335   //     buf [--charPos] = sign;
1336   // }
1337   iff = kit.create_and_map_if(kit.control(), __ Bool(__ CmpI(sign, __ intcon(0)), BoolTest::ne),
1338                               PROB_FAIR, COUNT_UNKNOWN);
1339 
1340   final_merge->init_req(merge_index + 2, __ IfFalse(iff));
1341   final_mem->init_req(merge_index + 2, kit.memory(byte_adr_idx));
1342 
1343   kit.set_control(__ IfTrue(iff));
1344   if (kit.stopped()) {
1345     final_merge->init_req(merge_index + 1, C->top());
1346     final_mem->init_req(merge_index + 1, C->top());
1347   } else {
1348     Node* index = __ SubI(charPos, __ intcon((bt == T_BYTE) ? 1 : 2));
1349     st = __ store_to_memory(kit.control(), kit.array_element_address(dst_array, index, T_BYTE),
1350                             sign, bt, byte_adr_idx, MemNode::unordered, (bt != T_BYTE) /* mismatched */);
1351 
1352     final_merge->init_req(merge_index + 1, kit.control());
1353     final_mem->init_req(merge_index + 1, st);
1354   }
1355 }
1356 
1357 // Copy the characters representing arg into dst_array starting at start
int_getChars(GraphKit & kit,Node * arg,Node * dst_array,Node * dst_coder,Node * start,Node * size)1358 Node* PhaseStringOpts::int_getChars(GraphKit& kit, Node* arg, Node* dst_array, Node* dst_coder, Node* start, Node* size) {
1359   bool dcon = dst_coder->is_Con();
1360   bool dbyte = dcon ? (dst_coder->get_int() == java_lang_String::CODER_LATIN1) : false;
1361   Node* end = __ AddI(start, __ LShiftI(size, dst_coder));
1362 
1363   // The final_merge node has 4 entries in case the encoding is known:
1364   // (0) Control, (1) result w/ sign, (2) result w/o sign, (3) result for Integer.min_value
1365   // or 6 entries in case the encoding is not known:
1366   // (0) Control, (1) Latin1 w/ sign, (2) Latin1 w/o sign, (3) min_value, (4) UTF16 w/ sign, (5) UTF16 w/o sign
1367   RegionNode* final_merge = new RegionNode(dcon ? 4 : 6);
1368   kit.gvn().set_type(final_merge, Type::CONTROL);
1369 
1370   Node* final_mem = PhiNode::make(final_merge, kit.memory(byte_adr_idx), Type::MEMORY, TypeAryPtr::BYTES);
1371   kit.gvn().set_type(final_mem, Type::MEMORY);
1372 
1373   // need to handle arg == Integer.MIN_VALUE specially because negating doesn't make it positive
1374   IfNode* iff = kit.create_and_map_if(kit.control(), __ Bool(__ CmpI(arg, __ intcon(0x80000000)), BoolTest::ne),
1375                                       PROB_FAIR, COUNT_UNKNOWN);
1376 
1377   Node* old_mem = kit.memory(byte_adr_idx);
1378 
1379   kit.set_control(__ IfFalse(iff));
1380   if (kit.stopped()) {
1381     // Statically not equal to MIN_VALUE so this path is dead
1382     final_merge->init_req(3, kit.control());
1383   } else {
1384     copy_string(kit, __ makecon(TypeInstPtr::make(C->env()->the_min_jint_string())),
1385                 dst_array, dst_coder, start);
1386     final_merge->init_req(3, kit.control());
1387     final_mem->init_req(3, kit.memory(byte_adr_idx));
1388   }
1389 
1390   kit.set_control(__ IfTrue(iff));
1391   kit.set_memory(old_mem, byte_adr_idx);
1392 
1393   if (!dcon) {
1394     // Check encoding of destination
1395     iff = kit.create_and_map_if(kit.control(), __ Bool(__ CmpI(dst_coder, __ intcon(0)), BoolTest::eq),
1396                                 PROB_FAIR, COUNT_UNKNOWN);
1397     old_mem = kit.memory(byte_adr_idx);
1398   }
1399   if (!dcon || dbyte) {
1400     // Destination is Latin1,
1401     if (!dcon) {
1402       kit.set_control(__ IfTrue(iff));
1403     }
1404     getChars(kit, arg, dst_array, T_BYTE, end, final_merge, final_mem);
1405   }
1406   if (!dcon || !dbyte) {
1407     // Destination is UTF16
1408     int merge_index = 0;
1409     if (!dcon) {
1410       kit.set_control(__ IfFalse(iff));
1411       kit.set_memory(old_mem, byte_adr_idx);
1412       merge_index = 3; // Account for Latin1 case
1413     }
1414     getChars(kit, arg, dst_array, T_CHAR, end, final_merge, final_mem, merge_index);
1415   }
1416 
1417   // Final merge point for Latin1 and UTF16 case
1418   kit.set_control(final_merge);
1419   kit.set_memory(final_mem, byte_adr_idx);
1420 
1421   C->record_for_igvn(final_merge);
1422   C->record_for_igvn(final_mem);
1423   return end;
1424 }
1425 
1426 // Copy 'count' bytes/chars from src_array to dst_array starting at index start
arraycopy(GraphKit & kit,IdealKit & ideal,Node * src_array,Node * dst_array,BasicType elembt,Node * start,Node * count)1427 void PhaseStringOpts::arraycopy(GraphKit& kit, IdealKit& ideal, Node* src_array, Node* dst_array, BasicType elembt, Node* start, Node* count) {
1428   assert(elembt == T_BYTE || elembt == T_CHAR, "Invalid type for arraycopy");
1429 
1430   if (elembt == T_CHAR) {
1431     // Get number of chars
1432     count = __ RShiftI(count, __ intcon(1));
1433   }
1434 
1435   Node* extra = NULL;
1436 #ifdef _LP64
1437   count = __ ConvI2L(count);
1438   extra = C->top();
1439 #endif
1440 
1441   Node* src_ptr = __ array_element_address(src_array, __ intcon(0), T_BYTE);
1442   Node* dst_ptr = __ array_element_address(dst_array, start, T_BYTE);
1443   // Check if destination address is aligned to HeapWordSize
1444   const TypeInt* tdst = __ gvn().type(start)->is_int();
1445   bool aligned = tdst->is_con() && ((tdst->get_con() * type2aelembytes(T_BYTE)) % HeapWordSize == 0);
1446   // Figure out which arraycopy runtime method to call (disjoint, uninitialized).
1447   const char* copyfunc_name = "arraycopy";
1448   address     copyfunc_addr = StubRoutines::select_arraycopy_function(elembt, aligned, true, copyfunc_name, true);
1449   ideal.make_leaf_call_no_fp(OptoRuntime::fast_arraycopy_Type(), copyfunc_addr, copyfunc_name,
1450                              TypeAryPtr::BYTES, src_ptr, dst_ptr, count, extra);
1451 }
1452 
1453 #undef __
1454 #define __ ideal.
1455 
1456 // Copy contents of a Latin1 encoded string from src_array to dst_array
copy_latin1_string(GraphKit & kit,IdealKit & ideal,Node * src_array,IdealVariable & count,Node * dst_array,Node * dst_coder,Node * start)1457 void PhaseStringOpts::copy_latin1_string(GraphKit& kit, IdealKit& ideal, Node* src_array, IdealVariable& count,
1458                                          Node* dst_array, Node* dst_coder, Node* start) {
1459   bool dcon = dst_coder->is_Con();
1460   bool dbyte = dcon ? (dst_coder->get_int() == java_lang_String::CODER_LATIN1) : false;
1461 
1462   if (!dcon) {
1463     __ if_then(dst_coder, BoolTest::eq, __ ConI(java_lang_String::CODER_LATIN1));
1464   }
1465   if (!dcon || dbyte) {
1466     // Destination is Latin1. Simply emit a byte arraycopy.
1467     arraycopy(kit, ideal, src_array, dst_array, T_BYTE, start, __ value(count));
1468   }
1469   if (!dcon) {
1470     __ else_();
1471   }
1472   if (!dcon || !dbyte) {
1473     // Destination is UTF16. Inflate src_array into dst_array.
1474     kit.sync_kit(ideal);
1475     if (Matcher::match_rule_supported(Op_StrInflatedCopy)) {
1476       // Use fast intrinsic
1477       Node* src = kit.array_element_address(src_array, kit.intcon(0), T_BYTE);
1478       Node* dst = kit.array_element_address(dst_array, start, T_BYTE);
1479       kit.inflate_string(src, dst, TypeAryPtr::BYTES, __ value(count));
1480     } else {
1481       // No intrinsic available, use slow method
1482       kit.inflate_string_slow(src_array, dst_array, start, __ value(count));
1483     }
1484     ideal.sync_kit(&kit);
1485     // Multiply count by two since we now need two bytes per char
1486     __ set(count, __ LShiftI(__ value(count), __ ConI(1)));
1487   }
1488   if (!dcon) {
1489     __ end_if();
1490   }
1491 }
1492 
1493 // Read two bytes from index and index+1 and convert them to a char
readChar(ciTypeArray * array,int index)1494 static jchar readChar(ciTypeArray* array, int index) {
1495   int shift_high, shift_low;
1496 #ifdef VM_LITTLE_ENDIAN
1497     shift_high = 0;
1498     shift_low = 8;
1499 #else
1500     shift_high = 8;
1501     shift_low = 0;
1502 #endif
1503 
1504   jchar b1 = ((jchar) array->byte_at(index)) & 0xff;
1505   jchar b2 = ((jchar) array->byte_at(index+1)) & 0xff;
1506   return (b1 << shift_high) | (b2 << shift_low);
1507 }
1508 
1509 // Copy contents of constant src_array to dst_array by emitting individual stores
copy_constant_string(GraphKit & kit,IdealKit & ideal,ciTypeArray * src_array,IdealVariable & count,bool src_is_byte,Node * dst_array,Node * dst_coder,Node * start)1510 void PhaseStringOpts::copy_constant_string(GraphKit& kit, IdealKit& ideal, ciTypeArray* src_array, IdealVariable& count,
1511                                            bool src_is_byte, Node* dst_array, Node* dst_coder, Node* start) {
1512   bool dcon = dst_coder->is_Con();
1513   bool dbyte = dcon ? (dst_coder->get_int() == java_lang_String::CODER_LATIN1) : false;
1514   int length = src_array->length();
1515 
1516   if (!dcon) {
1517     __ if_then(dst_coder, BoolTest::eq, __ ConI(java_lang_String::CODER_LATIN1));
1518   }
1519   if (!dcon || dbyte) {
1520     // Destination is Latin1. Copy each byte of src_array into dst_array.
1521     Node* index = start;
1522     for (int i = 0; i < length; i++) {
1523       Node* adr = kit.array_element_address(dst_array, index, T_BYTE);
1524       Node* val = __ ConI(src_array->byte_at(i));
1525       __ store(__ ctrl(), adr, val, T_BYTE, byte_adr_idx, MemNode::unordered);
1526       index = __ AddI(index, __ ConI(1));
1527     }
1528   }
1529   if (!dcon) {
1530     __ else_();
1531   }
1532   if (!dcon || !dbyte) {
1533     // Destination is UTF16. Copy each char of src_array into dst_array.
1534     Node* index = start;
1535     for (int i = 0; i < length; i++) {
1536       Node* adr = kit.array_element_address(dst_array, index, T_BYTE);
1537       jchar val;
1538       if (src_is_byte) {
1539         val = src_array->byte_at(i) & 0xff;
1540       } else {
1541         val = readChar(src_array, i++);
1542       }
1543       __ store(__ ctrl(), adr, __ ConI(val), T_CHAR, byte_adr_idx, MemNode::unordered, true /* mismatched */);
1544       index = __ AddI(index, __ ConI(2));
1545     }
1546     if (src_is_byte) {
1547       // Multiply count by two since we now need two bytes per char
1548       __ set(count, __ ConI(2 * length));
1549     }
1550   }
1551   if (!dcon) {
1552     __ end_if();
1553   }
1554 }
1555 
1556 // Compress copy contents of the byte/char String str into dst_array starting at index start.
copy_string(GraphKit & kit,Node * str,Node * dst_array,Node * dst_coder,Node * start)1557 Node* PhaseStringOpts::copy_string(GraphKit& kit, Node* str, Node* dst_array, Node* dst_coder, Node* start) {
1558   Node* src_array = kit.load_String_value(str, true);
1559 
1560   IdealKit ideal(&kit, true, true);
1561   IdealVariable count(ideal); __ declarations_done();
1562 
1563   if (str->is_Con()) {
1564     // Constant source string
1565     ciTypeArray* src_array_type = get_constant_value(kit, str);
1566 
1567     // Check encoding of constant string
1568     bool src_is_byte = (get_constant_coder(kit, str) == java_lang_String::CODER_LATIN1);
1569 
1570     // For small constant strings just emit individual stores.
1571     // A length of 6 seems like a good space/speed tradeof.
1572     __ set(count, __ ConI(src_array_type->length()));
1573     int src_len = src_array_type->length() / (src_is_byte ? 1 : 2);
1574     if (src_len < unroll_string_copy_length) {
1575       // Small constant string
1576       copy_constant_string(kit, ideal, src_array_type, count, src_is_byte, dst_array, dst_coder, start);
1577     } else if (src_is_byte) {
1578       // Source is Latin1
1579       copy_latin1_string(kit, ideal, src_array, count, dst_array, dst_coder, start);
1580     } else {
1581       // Source is UTF16 (destination too). Simply emit a char arraycopy.
1582       arraycopy(kit, ideal, src_array, dst_array, T_CHAR, start, __ value(count));
1583     }
1584   } else {
1585     Node* size = kit.load_array_length(src_array);
1586     __ set(count, size);
1587     // Non-constant source string
1588     if (CompactStrings) {
1589       // Emit runtime check for coder
1590       Node* coder = kit.load_String_coder(str, true);
1591       __ if_then(coder, BoolTest::eq, __ ConI(java_lang_String::CODER_LATIN1)); {
1592         // Source is Latin1
1593         copy_latin1_string(kit, ideal, src_array, count, dst_array, dst_coder, start);
1594       } __ else_();
1595     }
1596     // Source is UTF16 (destination too). Simply emit a char arraycopy.
1597     arraycopy(kit, ideal, src_array, dst_array, T_CHAR, start, __ value(count));
1598 
1599     if (CompactStrings) {
1600       __ end_if();
1601     }
1602   }
1603 
1604   // Finally sync IdealKit and GraphKit.
1605   kit.sync_kit(ideal);
1606   return __ AddI(start, __ value(count));
1607 }
1608 
1609 // Compress copy the char into dst_array at index start.
copy_char(GraphKit & kit,Node * val,Node * dst_array,Node * dst_coder,Node * start)1610 Node* PhaseStringOpts::copy_char(GraphKit& kit, Node* val, Node* dst_array, Node* dst_coder, Node* start) {
1611   bool dcon = (dst_coder != NULL) && dst_coder->is_Con();
1612   bool dbyte = dcon ? (dst_coder->get_int() == java_lang_String::CODER_LATIN1) : false;
1613 
1614   IdealKit ideal(&kit, true, true);
1615   IdealVariable end(ideal); __ declarations_done();
1616   Node* adr = kit.array_element_address(dst_array, start, T_BYTE);
1617   if (!dcon){
1618     __ if_then(dst_coder, BoolTest::eq, __ ConI(java_lang_String::CODER_LATIN1));
1619   }
1620   if (!dcon || dbyte) {
1621     // Destination is Latin1. Store a byte.
1622     __ store(__ ctrl(), adr, val, T_BYTE, byte_adr_idx, MemNode::unordered);
1623     __ set(end, __ AddI(start, __ ConI(1)));
1624   }
1625   if (!dcon) {
1626     __ else_();
1627   }
1628   if (!dcon || !dbyte) {
1629     // Destination is UTF16. Store a char.
1630     __ store(__ ctrl(), adr, val, T_CHAR, byte_adr_idx, MemNode::unordered, true /* mismatched */);
1631     __ set(end, __ AddI(start, __ ConI(2)));
1632   }
1633   if (!dcon) {
1634     __ end_if();
1635   }
1636   // Finally sync IdealKit and GraphKit.
1637   kit.sync_kit(ideal);
1638   return __ value(end);
1639 }
1640 
1641 #undef __
1642 #define __ kit.
1643 
1644 // Allocate a byte array of specified length.
allocate_byte_array(GraphKit & kit,IdealKit * ideal,Node * length)1645 Node* PhaseStringOpts::allocate_byte_array(GraphKit& kit, IdealKit* ideal, Node* length) {
1646   if (ideal != NULL) {
1647     // Sync IdealKit and graphKit.
1648     kit.sync_kit(*ideal);
1649   }
1650   Node* byte_array = NULL;
1651   {
1652     PreserveReexecuteState preexecs(&kit);
1653     // The original jvms is for an allocation of either a String or
1654     // StringBuffer so no stack adjustment is necessary for proper
1655     // reexecution.  If we deoptimize in the slow path the bytecode
1656     // will be reexecuted and the char[] allocation will be thrown away.
1657     kit.jvms()->set_should_reexecute(true);
1658     byte_array = kit.new_array(__ makecon(TypeKlassPtr::make(ciTypeArrayKlass::make(T_BYTE))),
1659                                length, 1);
1660   }
1661 
1662   // Mark the allocation so that zeroing is skipped since the code
1663   // below will overwrite the entire array
1664   AllocateArrayNode* byte_alloc = AllocateArrayNode::Ideal_array_allocation(byte_array, _gvn);
1665   byte_alloc->maybe_set_complete(_gvn);
1666 
1667   if (ideal != NULL) {
1668     // Sync IdealKit and graphKit.
1669     ideal->sync_kit(&kit);
1670   }
1671   return byte_array;
1672 }
1673 
get_constant_coder(GraphKit & kit,Node * str)1674 jbyte PhaseStringOpts::get_constant_coder(GraphKit& kit, Node* str) {
1675   assert(str->is_Con(), "String must be constant");
1676   const TypeOopPtr* str_type = kit.gvn().type(str)->isa_oopptr();
1677   ciInstance* str_instance = str_type->const_oop()->as_instance();
1678   jbyte coder = str_instance->field_value_by_offset(java_lang_String::coder_offset()).as_byte();
1679   assert(CompactStrings || (coder == java_lang_String::CODER_UTF16), "Strings must be UTF16 encoded");
1680   return coder;
1681 }
1682 
get_constant_length(GraphKit & kit,Node * str)1683 int PhaseStringOpts::get_constant_length(GraphKit& kit, Node* str) {
1684   assert(str->is_Con(), "String must be constant");
1685   return get_constant_value(kit, str)->length();
1686 }
1687 
get_constant_value(GraphKit & kit,Node * str)1688 ciTypeArray* PhaseStringOpts::get_constant_value(GraphKit& kit, Node* str) {
1689   assert(str->is_Con(), "String must be constant");
1690   const TypeOopPtr* str_type = kit.gvn().type(str)->isa_oopptr();
1691   ciInstance* str_instance = str_type->const_oop()->as_instance();
1692   ciObject* src_array = str_instance->field_value_by_offset(java_lang_String::value_offset()).as_object();
1693   return src_array->as_type_array();
1694 }
1695 
replace_string_concat(StringConcat * sc)1696 void PhaseStringOpts::replace_string_concat(StringConcat* sc) {
1697   // Log a little info about the transformation
1698   sc->maybe_log_transform();
1699 
1700   // pull the JVMState of the allocation into a SafePointNode to serve as
1701   // as a shim for the insertion of the new code.
1702   JVMState* jvms     = sc->begin()->jvms()->clone_shallow(C);
1703   uint size = sc->begin()->req();
1704   SafePointNode* map = new SafePointNode(size, jvms);
1705 
1706   // copy the control and memory state from the final call into our
1707   // new starting state.  This allows any preceeding tests to feed
1708   // into the new section of code.
1709   for (uint i1 = 0; i1 < TypeFunc::Parms; i1++) {
1710     map->init_req(i1, sc->end()->in(i1));
1711   }
1712   // blow away old allocation arguments
1713   for (uint i1 = TypeFunc::Parms; i1 < jvms->debug_start(); i1++) {
1714     map->init_req(i1, C->top());
1715   }
1716   // Copy the rest of the inputs for the JVMState
1717   for (uint i1 = jvms->debug_start(); i1 < sc->begin()->req(); i1++) {
1718     map->init_req(i1, sc->begin()->in(i1));
1719   }
1720   // Make sure the memory state is a MergeMem for parsing.
1721   if (!map->in(TypeFunc::Memory)->is_MergeMem()) {
1722     map->set_req(TypeFunc::Memory, MergeMemNode::make(map->in(TypeFunc::Memory)));
1723   }
1724 
1725   jvms->set_map(map);
1726   map->ensure_stack(jvms, jvms->method()->max_stack());
1727 
1728   // disconnect all the old StringBuilder calls from the graph
1729   sc->eliminate_unneeded_control();
1730 
1731   // At this point all the old work has been completely removed from
1732   // the graph and the saved JVMState exists at the point where the
1733   // final toString call used to be.
1734   GraphKit kit(jvms);
1735 
1736   // There may be uncommon traps which are still using the
1737   // intermediate states and these need to be rewritten to point at
1738   // the JVMState at the beginning of the transformation.
1739   sc->convert_uncommon_traps(kit, jvms);
1740 
1741   // Now insert the logic to compute the size of the string followed
1742   // by all the logic to construct array and resulting string.
1743 
1744   Node* null_string = __ makecon(TypeInstPtr::make(C->env()->the_null_string()));
1745 
1746   // Create a region for the overflow checks to merge into.
1747   int args = MAX2(sc->num_arguments(), 1);
1748   RegionNode* overflow = new RegionNode(args);
1749   kit.gvn().set_type(overflow, Type::CONTROL);
1750 
1751   // Create a hook node to hold onto the individual sizes since they
1752   // are need for the copying phase.
1753   Node* string_sizes = new Node(args);
1754 
1755   Node* coder = __ intcon(0);
1756   Node* length = __ intcon(0);
1757   // If at least one argument is UTF16 encoded, we can fix the encoding.
1758   bool coder_fixed = false;
1759 
1760   if (!CompactStrings) {
1761     // Fix encoding of result string to UTF16
1762     coder_fixed = true;
1763     coder = __ intcon(java_lang_String::CODER_UTF16);
1764   }
1765 
1766   for (int argi = 0; argi < sc->num_arguments(); argi++) {
1767     Node* arg = sc->argument(argi);
1768     switch (sc->mode(argi)) {
1769       case StringConcat::IntMode: {
1770         Node* string_size = int_stringSize(kit, arg);
1771 
1772         // accumulate total
1773         length = __ AddI(length, string_size);
1774 
1775         // Cache this value for the use by int_toString
1776         string_sizes->init_req(argi, string_size);
1777         break;
1778       }
1779       case StringConcat::StringNullCheckMode: {
1780         const Type* type = kit.gvn().type(arg);
1781         assert(type != TypePtr::NULL_PTR, "missing check");
1782         if (!type->higher_equal(TypeInstPtr::NOTNULL)) {
1783           // Null check with uncommon trap since
1784           // StringBuilder(null) throws exception.
1785           // Use special uncommon trap instead of
1786           // calling normal do_null_check().
1787           Node* p = __ Bool(__ CmpP(arg, kit.null()), BoolTest::ne);
1788           IfNode* iff = kit.create_and_map_if(kit.control(), p, PROB_MIN, COUNT_UNKNOWN);
1789           overflow->add_req(__ IfFalse(iff));
1790           Node* notnull = __ IfTrue(iff);
1791           kit.set_control(notnull); // set control for the cast_not_null
1792           arg = kit.cast_not_null(arg, false);
1793           sc->set_argument(argi, arg);
1794         }
1795         assert(kit.gvn().type(arg)->higher_equal(TypeInstPtr::NOTNULL), "sanity");
1796         // Fallthrough to add string length.
1797       }
1798       case StringConcat::StringMode: {
1799         const Type* type = kit.gvn().type(arg);
1800         Node* count = NULL;
1801         Node* arg_coder = NULL;
1802         if (type == TypePtr::NULL_PTR) {
1803           // replace the argument with the null checked version
1804           arg = null_string;
1805           sc->set_argument(argi, arg);
1806           count = kit.load_String_length(arg, true);
1807           arg_coder = kit.load_String_coder(arg, true);
1808         } else if (!type->higher_equal(TypeInstPtr::NOTNULL)) {
1809           // s = s != null ? s : "null";
1810           // length = length + (s.count - s.offset);
1811           RegionNode *r = new RegionNode(3);
1812           kit.gvn().set_type(r, Type::CONTROL);
1813           Node *phi = new PhiNode(r, type);
1814           kit.gvn().set_type(phi, phi->bottom_type());
1815           Node* p = __ Bool(__ CmpP(arg, kit.null()), BoolTest::ne);
1816           IfNode* iff = kit.create_and_map_if(kit.control(), p, PROB_MIN, COUNT_UNKNOWN);
1817           Node* notnull = __ IfTrue(iff);
1818           Node* isnull =  __ IfFalse(iff);
1819           kit.set_control(notnull); // set control for the cast_not_null
1820           r->init_req(1, notnull);
1821           phi->init_req(1, kit.cast_not_null(arg, false));
1822           r->init_req(2, isnull);
1823           phi->init_req(2, null_string);
1824           kit.set_control(r);
1825           C->record_for_igvn(r);
1826           C->record_for_igvn(phi);
1827           // replace the argument with the null checked version
1828           arg = phi;
1829           sc->set_argument(argi, arg);
1830           count = kit.load_String_length(arg, true);
1831           arg_coder = kit.load_String_coder(arg, true);
1832         } else {
1833           // A corresponding nullcheck will be connected during IGVN MemNode::Ideal_common_DU_postCCP
1834           // kit.control might be a different test, that can be hoisted above the actual nullcheck
1835           // in case, that the control input is not null, Ideal_common_DU_postCCP will not look for a nullcheck.
1836           count = kit.load_String_length(arg, false);
1837           arg_coder = kit.load_String_coder(arg, false);
1838         }
1839         if (arg->is_Con()) {
1840           // Constant string. Get constant coder and length.
1841           jbyte const_coder = get_constant_coder(kit, arg);
1842           int const_length = get_constant_length(kit, arg);
1843           if (const_coder == java_lang_String::CODER_LATIN1) {
1844             // Can be latin1 encoded
1845             arg_coder = __ intcon(const_coder);
1846             count = __ intcon(const_length);
1847           } else {
1848             // Found UTF16 encoded string. Fix result array encoding to UTF16.
1849             coder_fixed = true;
1850             coder = __ intcon(const_coder);
1851             count = __ intcon(const_length / 2);
1852           }
1853         }
1854 
1855         if (!coder_fixed) {
1856           coder = __ OrI(coder, arg_coder);
1857         }
1858         length = __ AddI(length, count);
1859         string_sizes->init_req(argi, NULL);
1860         break;
1861       }
1862       case StringConcat::CharMode: {
1863         // one character only
1864         const TypeInt* t = kit.gvn().type(arg)->is_int();
1865         if (!coder_fixed && t->is_con()) {
1866           // Constant char
1867           if (t->get_con() <= 255) {
1868             // Can be latin1 encoded
1869             coder = __ OrI(coder, __ intcon(java_lang_String::CODER_LATIN1));
1870           } else {
1871             // Must be UTF16 encoded. Fix result array encoding to UTF16.
1872             coder_fixed = true;
1873             coder = __ intcon(java_lang_String::CODER_UTF16);
1874           }
1875         } else if (!coder_fixed) {
1876           // Not constant
1877 #undef __
1878 #define __ ideal.
1879           IdealKit ideal(&kit, true, true);
1880           IdealVariable char_coder(ideal); __ declarations_done();
1881           // Check if character can be latin1 encoded
1882           __ if_then(arg, BoolTest::le, __ ConI(0xFF));
1883             __ set(char_coder, __ ConI(java_lang_String::CODER_LATIN1));
1884           __ else_();
1885             __ set(char_coder, __ ConI(java_lang_String::CODER_UTF16));
1886           __ end_if();
1887           kit.sync_kit(ideal);
1888           coder = __ OrI(coder, __ value(char_coder));
1889 #undef __
1890 #define __ kit.
1891         }
1892         length = __ AddI(length, __ intcon(1));
1893         break;
1894       }
1895       default:
1896         ShouldNotReachHere();
1897     }
1898     if (argi > 0) {
1899       // Check that the sum hasn't overflowed
1900       IfNode* iff = kit.create_and_map_if(kit.control(),
1901                                           __ Bool(__ CmpI(length, __ intcon(0)), BoolTest::lt),
1902                                           PROB_MIN, COUNT_UNKNOWN);
1903       kit.set_control(__ IfFalse(iff));
1904       overflow->set_req(argi, __ IfTrue(iff));
1905     }
1906   }
1907 
1908   {
1909     // Hook
1910     PreserveJVMState pjvms(&kit);
1911     kit.set_control(overflow);
1912     C->record_for_igvn(overflow);
1913     kit.uncommon_trap(Deoptimization::Reason_intrinsic,
1914                       Deoptimization::Action_make_not_entrant);
1915   }
1916 
1917   Node* result;
1918   if (!kit.stopped()) {
1919     assert(CompactStrings || (coder->is_Con() && coder->get_int() == java_lang_String::CODER_UTF16),
1920            "Result string must be UTF16 encoded if CompactStrings is disabled");
1921 
1922     Node* dst_array = NULL;
1923     if (sc->num_arguments() == 1 &&
1924         (sc->mode(0) == StringConcat::StringMode ||
1925          sc->mode(0) == StringConcat::StringNullCheckMode)) {
1926       // Handle the case when there is only a single String argument.
1927       // In this case, we can just pull the value from the String itself.
1928       dst_array = kit.load_String_value(sc->argument(0), true);
1929     } else {
1930       // Allocate destination byte array according to coder
1931       dst_array = allocate_byte_array(kit, NULL, __ LShiftI(length, coder));
1932 
1933       // Now copy the string representations into the final byte[]
1934       Node* start = __ intcon(0);
1935       for (int argi = 0; argi < sc->num_arguments(); argi++) {
1936         Node* arg = sc->argument(argi);
1937         switch (sc->mode(argi)) {
1938           case StringConcat::IntMode: {
1939             start = int_getChars(kit, arg, dst_array, coder, start, string_sizes->in(argi));
1940             break;
1941           }
1942           case StringConcat::StringNullCheckMode:
1943           case StringConcat::StringMode: {
1944             start = copy_string(kit, arg, dst_array, coder, start);
1945             break;
1946           }
1947           case StringConcat::CharMode: {
1948             start = copy_char(kit, arg, dst_array, coder, start);
1949           break;
1950           }
1951           default:
1952             ShouldNotReachHere();
1953         }
1954       }
1955     }
1956 
1957     // If we're not reusing an existing String allocation then allocate one here.
1958     result = sc->string_alloc();
1959     if (result == NULL) {
1960       PreserveReexecuteState preexecs(&kit);
1961       // The original jvms is for an allocation of either a String or
1962       // StringBuffer so no stack adjustment is necessary for proper
1963       // reexecution.
1964       kit.jvms()->set_should_reexecute(true);
1965       result = kit.new_instance(__ makecon(TypeKlassPtr::make(C->env()->String_klass())));
1966     }
1967 
1968     // Initialize the string
1969     kit.store_String_value(result, dst_array);
1970     kit.store_String_coder(result, coder);
1971 
1972     // The value field is final. Emit a barrier here to ensure that the effect
1973     // of the initialization is committed to memory before any code publishes
1974     // a reference to the newly constructed object (see Parse::do_exits()).
1975     assert(AllocateNode::Ideal_allocation(result, _gvn) != NULL, "should be newly allocated");
1976     kit.insert_mem_bar(Op_MemBarRelease, result);
1977   } else {
1978     result = C->top();
1979   }
1980   // hook up the outgoing control and result
1981   kit.replace_call(sc->end(), result);
1982 
1983   // Unhook any hook nodes
1984   string_sizes->disconnect_inputs(NULL, C);
1985   sc->cleanup();
1986 }
1987