1 /*
2 * Copyright (c) 1997, 2018, Oracle and/or its affiliates. All rights reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20 * or visit www.oracle.com if you need additional information or have any
21 * questions.
22 *
23 */
24
25
26 #include "precompiled.hpp"
27 #include "classfile/altHashing.hpp"
28 #include "classfile/classLoaderData.hpp"
29 #include "gc/shared/collectedHeap.hpp"
30 #include "logging/log.hpp"
31 #include "logging/logStream.hpp"
32 #include "memory/allocation.inline.hpp"
33 #include "memory/resourceArea.hpp"
34 #include "oops/symbol.hpp"
35 #include "runtime/atomic.hpp"
36 #include "runtime/os.hpp"
37
pack_length_and_refcount(int length,int refcount)38 uint32_t Symbol::pack_length_and_refcount(int length, int refcount) {
39 STATIC_ASSERT(max_symbol_length == ((1 << 16) - 1));
40 STATIC_ASSERT(PERM_REFCOUNT == ((1 << 16) - 1));
41 assert(length >= 0, "negative length");
42 assert(length <= max_symbol_length, "too long symbol");
43 assert(refcount >= 0, "negative refcount");
44 assert(refcount <= PERM_REFCOUNT, "invalid refcount");
45 uint32_t hi = length;
46 uint32_t lo = refcount;
47 return (hi << 16) | lo;
48 }
49
Symbol(const u1 * name,int length,int refcount)50 Symbol::Symbol(const u1* name, int length, int refcount) {
51 _length_and_refcount = pack_length_and_refcount(length, refcount);
52 _identity_hash = (short)os::random();
53 for (int i = 0; i < length; i++) {
54 byte_at_put(i, name[i]);
55 }
56 }
57
operator new(size_t sz,int len,TRAPS)58 void* Symbol::operator new(size_t sz, int len, TRAPS) throw() {
59 int alloc_size = size(len)*wordSize;
60 address res = (address) AllocateHeap(alloc_size, mtSymbol);
61 return res;
62 }
63
operator new(size_t sz,int len,Arena * arena,TRAPS)64 void* Symbol::operator new(size_t sz, int len, Arena* arena, TRAPS) throw() {
65 int alloc_size = size(len)*wordSize;
66 address res = (address)arena->Amalloc_4(alloc_size);
67 return res;
68 }
69
operator delete(void * p)70 void Symbol::operator delete(void *p) {
71 assert(((Symbol*)p)->refcount() == 0, "should not call this");
72 FreeHeap(p);
73 }
74
75 // ------------------------------------------------------------------
76 // Symbol::starts_with
77 //
78 // Tests if the symbol starts with the specified prefix of the given
79 // length.
starts_with(const char * prefix,int len) const80 bool Symbol::starts_with(const char* prefix, int len) const {
81 if (len > utf8_length()) return false;
82 while (len-- > 0) {
83 if (prefix[len] != char_at(len))
84 return false;
85 }
86 assert(len == -1, "we should be at the beginning");
87 return true;
88 }
89
90
91 // ------------------------------------------------------------------
92 // Symbol::index_of
93 //
94 // Finds if the given string is a substring of this symbol's utf8 bytes.
95 // Return -1 on failure. Otherwise return the first index where str occurs.
index_of_at(int i,const char * str,int len) const96 int Symbol::index_of_at(int i, const char* str, int len) const {
97 assert(i >= 0 && i <= utf8_length(), "oob");
98 if (len <= 0) return 0;
99 char first_char = str[0];
100 address bytes = (address) ((Symbol*)this)->base();
101 address limit = bytes + utf8_length() - len; // inclusive limit
102 address scan = bytes + i;
103 if (scan > limit)
104 return -1;
105 for (; scan <= limit; scan++) {
106 scan = (address) memchr(scan, first_char, (limit + 1 - scan));
107 if (scan == NULL)
108 return -1; // not found
109 assert(scan >= bytes+i && scan <= limit, "scan oob");
110 if (memcmp(scan, str, len) == 0)
111 return (int)(scan - bytes);
112 }
113 return -1;
114 }
115
116
as_C_string(char * buf,int size) const117 char* Symbol::as_C_string(char* buf, int size) const {
118 if (size > 0) {
119 int len = MIN2(size - 1, utf8_length());
120 for (int i = 0; i < len; i++) {
121 buf[i] = char_at(i);
122 }
123 buf[len] = '\0';
124 }
125 return buf;
126 }
127
as_C_string() const128 char* Symbol::as_C_string() const {
129 int len = utf8_length();
130 char* str = NEW_RESOURCE_ARRAY(char, len + 1);
131 return as_C_string(str, len + 1);
132 }
133
as_C_string_flexible_buffer(Thread * t,char * buf,int size) const134 char* Symbol::as_C_string_flexible_buffer(Thread* t,
135 char* buf, int size) const {
136 char* str;
137 int len = utf8_length();
138 int buf_len = len + 1;
139 if (size < buf_len) {
140 str = NEW_RESOURCE_ARRAY(char, buf_len);
141 } else {
142 str = buf;
143 }
144 return as_C_string(str, buf_len);
145 }
146
print_utf8_on(outputStream * st) const147 void Symbol::print_utf8_on(outputStream* st) const {
148 st->print("%s", as_C_string());
149 }
150
print_symbol_on(outputStream * st) const151 void Symbol::print_symbol_on(outputStream* st) const {
152 char *s;
153 st = st ? st : tty;
154 {
155 // ResourceMark may not affect st->print(). If st is a string
156 // stream it could resize, using the same resource arena.
157 ResourceMark rm;
158 s = as_quoted_ascii();
159 s = os::strdup(s);
160 }
161 if (s == NULL) {
162 st->print("(null)");
163 } else {
164 st->print("%s", s);
165 os::free(s);
166 }
167 }
168
as_quoted_ascii() const169 char* Symbol::as_quoted_ascii() const {
170 const char *ptr = (const char *)&_body[0];
171 int quoted_length = UTF8::quoted_ascii_length(ptr, utf8_length());
172 char* result = NEW_RESOURCE_ARRAY(char, quoted_length + 1);
173 UTF8::as_quoted_ascii(ptr, utf8_length(), result, quoted_length + 1);
174 return result;
175 }
176
as_unicode(int & length) const177 jchar* Symbol::as_unicode(int& length) const {
178 Symbol* this_ptr = (Symbol*)this;
179 length = UTF8::unicode_length((char*)this_ptr->bytes(), utf8_length());
180 jchar* result = NEW_RESOURCE_ARRAY(jchar, length);
181 if (length > 0) {
182 UTF8::convert_to_unicode((char*)this_ptr->bytes(), result, length);
183 }
184 return result;
185 }
186
as_klass_external_name(char * buf,int size) const187 const char* Symbol::as_klass_external_name(char* buf, int size) const {
188 if (size > 0) {
189 char* str = as_C_string(buf, size);
190 int length = (int)strlen(str);
191 // Turn all '/'s into '.'s (also for array klasses)
192 for (int index = 0; index < length; index++) {
193 if (str[index] == '/') {
194 str[index] = '.';
195 }
196 }
197 return str;
198 } else {
199 return buf;
200 }
201 }
202
as_klass_external_name() const203 const char* Symbol::as_klass_external_name() const {
204 char* str = as_C_string();
205 int length = (int)strlen(str);
206 // Turn all '/'s into '.'s (also for array klasses)
207 for (int index = 0; index < length; index++) {
208 if (str[index] == '/') {
209 str[index] = '.';
210 }
211 }
212 return str;
213 }
214
215 // Alternate hashing for unbalanced symbol tables.
new_hash(juint seed)216 unsigned int Symbol::new_hash(juint seed) {
217 ResourceMark rm;
218 // Use alternate hashing algorithm on this symbol.
219 return AltHashing::murmur3_32(seed, (const jbyte*)as_C_string(), utf8_length());
220 }
221
222 // Increment refcount while checking for zero. If the Symbol's refcount becomes zero
223 // a thread could be concurrently removing the Symbol. This is used during SymbolTable
224 // lookup to avoid reviving a dead Symbol.
try_increment_refcount()225 bool Symbol::try_increment_refcount() {
226 uint32_t found = _length_and_refcount;
227 while (true) {
228 uint32_t old_value = found;
229 int refc = extract_refcount(old_value);
230 if (refc == PERM_REFCOUNT) {
231 return true; // sticky max or created permanent
232 } else if (refc == 0) {
233 return false; // dead, can't revive.
234 } else {
235 found = Atomic::cmpxchg(old_value + 1, &_length_and_refcount, old_value);
236 if (found == old_value) {
237 return true; // successfully updated.
238 }
239 // refcount changed, try again.
240 }
241 }
242 }
243
244 // The increment_refcount() is called when not doing lookup. It is assumed that you
245 // have a symbol with a non-zero refcount and it can't become zero while referenced by
246 // this caller.
increment_refcount()247 void Symbol::increment_refcount() {
248 if (!try_increment_refcount()) {
249 #ifdef ASSERT
250 print();
251 fatal("refcount has gone to zero");
252 #endif
253 }
254 #ifndef PRODUCT
255 if (refcount() != PERM_REFCOUNT) { // not a permanent symbol
256 NOT_PRODUCT(Atomic::inc(&_total_count);)
257 }
258 #endif
259 }
260
261 // Decrement refcount potentially while racing increment, so we need
262 // to check the value after attempting to decrement so that if another
263 // thread increments to PERM_REFCOUNT the value is not decremented.
decrement_refcount()264 void Symbol::decrement_refcount() {
265 uint32_t found = _length_and_refcount;
266 while (true) {
267 uint32_t old_value = found;
268 int refc = extract_refcount(old_value);
269 if (refc == PERM_REFCOUNT) {
270 return; // refcount is permanent, permanent is sticky
271 } else if (refc == 0) {
272 #ifdef ASSERT
273 print();
274 fatal("refcount underflow");
275 #endif
276 return;
277 } else {
278 found = Atomic::cmpxchg(old_value - 1, &_length_and_refcount, old_value);
279 if (found == old_value) {
280 return; // successfully updated.
281 }
282 // refcount changed, try again.
283 }
284 }
285 }
286
metaspace_pointers_do(MetaspaceClosure * it)287 void Symbol::metaspace_pointers_do(MetaspaceClosure* it) {
288 if (log_is_enabled(Trace, cds)) {
289 LogStream trace_stream(Log(cds)::trace());
290 trace_stream.print("Iter(Symbol): %p ", this);
291 print_value_on(&trace_stream);
292 trace_stream.cr();
293 }
294 }
295
print_on(outputStream * st) const296 void Symbol::print_on(outputStream* st) const {
297 st->print("Symbol: '");
298 print_symbol_on(st);
299 st->print("'");
300 st->print(" count %d", refcount());
301 }
302
303 // The print_value functions are present in all builds, to support the
304 // disassembler and error reporting.
print_value_on(outputStream * st) const305 void Symbol::print_value_on(outputStream* st) const {
306 st->print("'");
307 for (int i = 0; i < utf8_length(); i++) {
308 st->print("%c", char_at(i));
309 }
310 st->print("'");
311 }
312
is_valid(Symbol * s)313 bool Symbol::is_valid(Symbol* s) {
314 if (!is_aligned(s, sizeof(MetaWord))) return false;
315 if ((size_t)s < os::min_page_size()) return false;
316
317 if (!os::is_readable_range(s, s + 1)) return false;
318
319 // Symbols are not allocated in Java heap.
320 if (Universe::heap()->is_in_reserved(s)) return false;
321
322 int len = s->utf8_length();
323 if (len < 0) return false;
324
325 jbyte* bytes = (jbyte*) s->bytes();
326 return os::is_readable_range(bytes, bytes + len);
327 }
328
329 // SymbolTable prints this in its statistics
330 NOT_PRODUCT(size_t Symbol::_total_count = 0;)
331