1 /* src/vm/string.c - java.lang.String related functions
3 Copyright (C) 1996-2005 R. Grafl, A. Krall, C. Kruegel, C. Oates,
4 R. Obermaisser, M. Platter, M. Probst, S. Ring, E. Steiner,
5 C. Thalinger, D. Thuernbeck, P. Tomsich, C. Ullrich, J. Wenninger,
6 Institut f. Computersprachen - TU Wien
8 This file is part of CACAO.
10 This program is free software; you can redistribute it and/or
11 modify it under the terms of the GNU General Public License as
12 published by the Free Software Foundation; either version 2, or (at
13 your option) any later version.
15 This program is distributed in the hope that it will be useful, but
16 WITHOUT ANY WARRANTY; without even the implied warranty of
17 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 General Public License for more details.
20 You should have received a copy of the GNU General Public License
21 along with this program; if not, write to the Free Software
22 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
25 Contact: cacao@complang.tuwien.ac.at
27 Authors: Reinhard Grafl
31 Changes: Christian Thalinger
33 $Id: string.c 3695 2005-11-17 13:47:58Z twisti $
43 #include "vm/global.h"
45 #include "mm/memory.h"
46 #include "native/include/java_lang_String.h"
47 #include "vm/exceptions.h"
48 #include "vm/loader.h"
49 #include "vm/options.h"
50 #include "vm/stringlocal.h"
54 /* global variables ***********************************************************/
56 #if defined(USE_THREADS)
/* Monitor object for the string hashtable: it is allocated in string_init()
   and handed to builtin_monitorenter()/builtin_monitorexit() by
   literalstring_u2(). Only present when USE_THREADS is defined. */
57 static java_objectheader *lock_string_hashtable;
61 /* global string definitions **************************************************/
/* Each constant below holds a class name in slash-separated form; the
   identifier is the class name with '/' replaced by '_'. */
63 /* exception/error super class */
65 const char *string_java_lang_Throwable =
66 "java/lang/Throwable";
68 const char *string_java_lang_VMThrowable =
69 "java/lang/VMThrowable";
72 /* specify some exception strings for code generation */
/* The strings are class names in slash-separated form; each identifier
   mirrors the class name it spells out. */
74 const char *string_java_lang_ArithmeticException =
75 "java/lang/ArithmeticException";
/* NOTE(review): no string literal follows the declaration below in this
   view of the file - confirm the initializer against the full source. */
77 const char *string_java_lang_ArithmeticException_message =
80 const char *string_java_lang_ArrayIndexOutOfBoundsException =
81 "java/lang/ArrayIndexOutOfBoundsException";
83 const char *string_java_lang_ArrayStoreException =
84 "java/lang/ArrayStoreException";
86 const char *string_java_lang_ClassCastException =
87 "java/lang/ClassCastException";
89 const char *string_java_lang_ClassNotFoundException =
90 "java/lang/ClassNotFoundException";
92 const char *string_java_lang_CloneNotSupportedException =
93 "java/lang/CloneNotSupportedException";
95 const char *string_java_lang_Exception =
96 "java/lang/Exception";
98 const char *string_java_lang_IllegalAccessException =
99 "java/lang/IllegalAccessException";
101 const char *string_java_lang_IllegalArgumentException =
102 "java/lang/IllegalArgumentException";
104 const char *string_java_lang_IllegalMonitorStateException =
105 "java/lang/IllegalMonitorStateException";
107 const char *string_java_lang_IndexOutOfBoundsException =
108 "java/lang/IndexOutOfBoundsException";
110 const char *string_java_lang_InstantiationException =
111 "java/lang/InstantiationException";
113 const char *string_java_lang_InterruptedException =
114 "java/lang/InterruptedException";
116 const char *string_java_lang_NegativeArraySizeException =
117 "java/lang/NegativeArraySizeException";
119 const char *string_java_lang_NoSuchFieldException =
120 "java/lang/NoSuchFieldException";
122 const char *string_java_lang_NoSuchMethodException =
123 "java/lang/NoSuchMethodException";
125 const char *string_java_lang_NullPointerException =
126 "java/lang/NullPointerException";
128 const char *string_java_lang_reflect_InvocationTargetException =
129 "java/lang/reflect/InvocationTargetException";
132 /* specify some error strings for code generation */
/* The strings are class names in slash-separated form; each identifier
   mirrors the class name it spells out. */
134 const char *string_java_lang_AbstractMethodError =
135 "java/lang/AbstractMethodError";
137 const char *string_java_lang_ClassCircularityError =
138 "java/lang/ClassCircularityError";
140 const char *string_java_lang_ClassFormatError =
141 "java/lang/ClassFormatError";
/* NOTE(review): no string literal follows the declaration below in this
   view of the file - confirm the initializer against the full source. */
143 const char *string_java_lang_Error =
146 const char *string_java_lang_ExceptionInInitializerError =
147 "java/lang/ExceptionInInitializerError";
149 const char *string_java_lang_IncompatibleClassChangeError =
150 "java/lang/IncompatibleClassChangeError";
152 const char *string_java_lang_InstantiationError =
153 "java/lang/InstantiationError";
155 const char *string_java_lang_InternalError =
156 "java/lang/InternalError";
158 const char *string_java_lang_LinkageError =
159 "java/lang/LinkageError";
161 const char *string_java_lang_NoClassDefFoundError =
162 "java/lang/NoClassDefFoundError";
164 const char *string_java_lang_NoSuchFieldError =
165 "java/lang/NoSuchFieldError";
167 const char *string_java_lang_NoSuchMethodError =
168 "java/lang/NoSuchMethodError";
170 const char *string_java_lang_OutOfMemoryError =
171 "java/lang/OutOfMemoryError";
173 const char *string_java_lang_UnsatisfiedLinkError =
174 "java/lang/UnsatisfiedLinkError";
176 const char *string_java_lang_UnsupportedClassVersionError =
177 "java/lang/UnsupportedClassVersionError";
179 const char *string_java_lang_VerifyError =
180 "java/lang/VerifyError";
182 const char *string_java_lang_VirtualMachineError =
183 "java/lang/VirtualMachineError";
186 /* string_init *****************************************************************
188 Initialize the string hashtable lock.

   With USE_THREADS defined, a java_objectheader is allocated with NEW and
   stored in lock_string_hashtable; with NATIVE_THREADS also defined,
   initObjectLock() is called on that object.

   return: a bool status; no failure path is visible in this function
           (TODO confirm against the full source).
190 *******************************************************************************/
192 bool string_init(void)
194 #if defined(USE_THREADS)
195 /* create string hashtable lock object */
197 lock_string_hashtable = NEW(java_objectheader);
199 # if defined(NATIVE_THREADS)
/* initialize the lock of the freshly allocated object */
200 initObjectLock(lock_string_hashtable);
204 /* everything's ok */
210 /* stringtable_update **********************************************************
212 Traverses the javastring hashtable and sets the vftbl-entries of
213 javastrings which were temporarily set to NULL, because
214 java.lang.Object was not yet loaded.

   Takes no arguments and returns nothing. For each visited entry the
   header of the java.lang.String object and the header of a character
   array are checked; a NULL vftbl is replaced by
   class_java_lang_String->vftbl, respectively by the arrayvftbl of
   primitivetype_table[ARRAYTYPE_CHAR].
216 *******************************************************************************/
218 void stringtable_update(void)
220 java_lang_String *js;
222 literalstring *s; /* hashtable entry */
/* walk all slots of the string hashtable */
225 for (i = 0; i < string_hash.size; i++) {
226 s = string_hash.ptr[i];
/* the object stored in the entry is accessed as a java.lang.String */
230 js = (java_lang_String *) s->string;
/* an entry without a string object, or without character data, is logged */
232 if (!js || !js->value) {
233 /* error in hashtable found */
234 log_text("invalid literalstring in hashtable");
240 if (!js->header.vftbl)
241 /* vftbl of javastring is NULL */
242 js->header.vftbl = class_java_lang_String->vftbl;
/* a is presumably the string's character array (js->value); its
   assignment is not visible here - TODO confirm */
244 if (!a->header.objheader.vftbl)
245 /* vftbl of character-array is NULL */
246 a->header.objheader.vftbl = primitivetype_table[ARRAYTYPE_CHAR].arrayvftbl;
248 /* follow link in external hash chain */
256 /* javastring_new **************************************************************
258 creates a new object of type java/lang/String with the text of
259 the specified utf8-string

   u: the utf8-string supplying the text

261 return: pointer to the string or NULL if memory is exhausted.

   The function can also store a new NullPointerException in *exceptionptr;
   presumably this happens when u is NULL, but the guarding condition is
   not visible here - TODO confirm.
263 *******************************************************************************/
265 java_lang_String *javastring_new(utf *u)
267 char *utf_ptr; /* current utf character in utf string */
268 u4 utflength; /* length of utf-string if uncompressed */
269 java_lang_String *s; /* result-string */
274 *exceptionptr = new_nullpointerexception();
/* the uncompressed length determines the size of the character array */
279 utflength = utf_strlen(u);
/* allocate the String object and a char array with utflength elements */
281 s = (java_lang_String *) builtin_new(class_java_lang_String);
282 a = builtin_newarray_char(utflength);
284 /* javastring or character-array could not be created */
288 /* decompress utf-string */
/* utf_nextu2() is called once per array element, with utf_ptr passed by
   address */
289 for (i = 0; i < utflength; i++)
290 a->data[i] = utf_nextu2(&utf_ptr);
292 /* set fields of the javastring-object */
295 s->count = utflength;
300 /* javastring_new_slash_to_dot *************************************************
302 creates a new object of type java/lang/String with the text of
303 the specified utf8-string with slashes changed to dots

   u: the utf8-string supplying the text

305 return: pointer to the string or NULL if memory is exhausted.

   The function can also store a new NullPointerException in *exceptionptr;
   presumably this happens when u is NULL, but the guarding condition is
   not visible here - TODO confirm.
307 *******************************************************************************/
309 java_lang_String *javastring_new_slash_to_dot(utf *u)
311 char *utf_ptr; /* current utf character in utf string */
312 u4 utflength; /* length of utf-string if uncompressed */
313 java_lang_String *s; /* result-string */
319 *exceptionptr = new_nullpointerexception();
/* the uncompressed length determines the size of the character array */
324 utflength = utf_strlen(u);
/* allocate the String object and a char array with utflength elements */
326 s = (java_lang_String *) builtin_new(class_java_lang_String);
327 a = builtin_newarray_char(utflength);
329 /* javastring or character-array could not be created */
333 /* decompress utf-string */
334 for (i = 0; i < utflength; i++) {
/* fetch the next character into ch; the slash-to-dot substitution and the
   store into the array are not visible here - TODO confirm */
335 ch = utf_nextu2(&utf_ptr);
341 /* set fields of the javastring-object */
344 s->count = utflength;
350 /* javastring_new_char *********************************************************
352 creates a new java/lang/String object which contains the converted
353 C-string passed via text.

   text: the C string to convert; every char is stored into one element
         of the new character array by plain assignment.

355 return: the object pointer or NULL if memory is exhausted.

   The function can also store a new NullPointerException in *exceptionptr;
   presumably this happens when text is NULL, but the guarding condition is
   not visible here - TODO confirm.
357 *******************************************************************************/
359 java_lang_String *javastring_new_char(const char *text)
362 s4 len; /* length of the string */
363 java_lang_String *s; /* result-string */
367 *exceptionptr = new_nullpointerexception();
/* allocate the String object and a char array with len elements */
373 s = (java_lang_String *) builtin_new(class_java_lang_String);
374 a = builtin_newarray_char(len);
376 /* javastring or character-array could not be created */
/* NOTE(review): text[i] is a plain char; where char is signed, values
   above 127 would be sign-extended when widened into the array element -
   confirm callers only pass ASCII, or convert via unsigned char. */
381 for (i = 0; i < len; i++)
382 a->data[i] = text[i];
384 /* set fields of the javastring-object */
393 /* javastring_tochar ***********************************************************
395 converts a Java string into a C string.

   so: the object to convert; it is accessed as a java_lang_String.

397 return: pointer to C string
399 Caution: calling method MUST release the allocated memory!

   The buffer is obtained with MNEW(char, count + 1).
401 *******************************************************************************/
403 char *javastring_tochar(java_objectheader *so)
405 java_lang_String *s = (java_lang_String *) so;
/* one char per string character plus one extra (presumably for the
   terminating NUL, whose store is not visible here) */
418 buf = MNEW(char, s->count + 1);
/* copy starts at the string's offset inside the character array.
   NOTE(review): each array element is narrowed to char by assignment, so
   characters that do not fit in a char are presumably altered - confirm
   this lossy conversion is acceptable to callers. */
420 for (i = 0; i < s->count; i++)
421 buf[i] = a->data[s->offset + i];
429 /* javastring_toutf ************************************************************
431 Make utf symbol from javastring.

   string:      the java.lang.String to convert; it is dereferenced without
                a NULL check in the visible code
   isclassname: passed through unchanged to utf_new_u2()

   return: the result of utf_new_u2() for the `count` characters that start
           at value->data + offset.
433 *******************************************************************************/
435 utf *javastring_toutf(java_lang_String *string, bool isclassname)
/* the cast is to the parameter's own type, so str simply aliases string */
437 java_lang_String *str = (java_lang_String *) string;
439 return utf_new_u2(str->value->data + str->offset, str->count, isclassname);
443 /* javastring_strlen ***********************************************************
445 Returns the length of the Java string.

   so: the object to inspect; it is accessed as a java_lang_String.

   return: the length as s4 (the statement computing it is not visible
           here; presumably the string's count field - TODO confirm).
447 *******************************************************************************/
449 s4 javastring_strlen(java_objectheader *so)
451 java_lang_String *s = (java_lang_String *) so;
460 /* literalstring_u2 ************************************************************
462 Searches for the javastring with the specified u2-array in the
463 string hashtable, if there is no such string a new one is created.
465 If copymode is true a copy of the u2-array is made.

   a:      character array holding the text
   length: number of characters to use
   offset: index of the first character inside a->data
   (the remaining parameter list, including copymode, is not visible in
   this view of the signature)

   return: the java.lang.String found in, or newly added to, the string
           hashtable, as a java_objectheader pointer.

   With USE_THREADS defined the lookup and insertion run between
   builtin_monitorenter() and builtin_monitorexit() on
   lock_string_hashtable.
467 *******************************************************************************/
469 java_objectheader *literalstring_u2(java_chararray *a, u4 length, u4 offset,
472 literalstring *s; /* hashtable element */
473 java_lang_String *js; /* u2-array wrapped in javastring */
474 java_chararray *stringdata; /* copy of u2-array */
479 #if defined(USE_THREADS)
480 builtin_monitorenter(lock_string_hashtable);
483 /* find location in hashtable */
/* hash the `length` characters starting at `offset` */
485 key = unicode_hashkey(a->data + offset, length);
/* masking with size - 1 selects the slot; this reaches every slot only if
   the table size is a power of two - presumably guaranteed, TODO confirm */
486 slot = key & (string_hash.size - 1);
487 s = string_hash.ptr[slot];
490 js = (java_lang_String *) s->string;
/* only strings of equal length are compared character by character */
492 if (length == js->count) {
495 for (i = 0; i < length; i++)
/* NOTE(review): the stored string is read from index 0 of its array, i.e.
   without adding the stored string's own offset - confirm that strings in
   this table always have offset 0 */
496 if (a->data[offset + i] != js->value->data[i])
499 /* string already in hashtable, free memory */
/* the size expression is the same one literalstring_new() uses to allocate
   the array; the condition guarding this free is not visible here */
502 mem_free(a, sizeof(java_chararray) + sizeof(u2) * (length - 1) + 10);
504 #if defined(USE_THREADS)
505 builtin_monitorexit(lock_string_hashtable);
508 return (java_objectheader *) js;
512 /* follow link in external hash chain */
517 /* create copy of u2-array for new javastring */
/* NOTE(review): length is a u4; if u4 is unsigned, length - 1 wraps around
   for length == 0 before the multiplication - confirm empty strings are
   handled as intended */
518 u4 arraysize = sizeof(java_chararray) + sizeof(u2) * (length - 1) + 10;
519 stringdata = mem_alloc(arraysize);
520 /* memcpy(stringdata, a, arraysize); */
/* the array header is copied separately from the character data */
521 memcpy(&(stringdata->header), &(a->header), sizeof(java_arrayheader));
/* NOTE(review): &(a->data) + offset does pointer arithmetic on the address
   of the whole data member, so it advances in units of that member's size;
   it equals a->data + offset only if data is declared as a one-element
   array - confirm. The byte count also covers 8 bytes more than `length`
   characters, so the source is read beyond the requested range. */
522 memcpy(&(stringdata->data), &(a->data) + offset, sizeof(u2) * (length - 1) + 10);
528 /* location in hashtable found, complete arrayheader */
530 stringdata->header.objheader.vftbl =
531 primitivetype_table[ARRAYTYPE_CHAR].arrayvftbl;
532 stringdata->header.size = length;
534 /* XXX TWISTI: is this necessary? */
/* load java.lang.String through the bootstrap loader if it is not yet set */
535 if (!class_java_lang_String)
536 class_java_lang_String = load_class_bootstrap(utf_java_lang_String);
538 assert(class_java_lang_String);
539 assert(class_java_lang_String->loaded);
541 /* if we use eager loading, we have to check loaded String class */
544 list_addfirst(&unlinkedclasses, class_java_lang_String);
546 /* create new javastring */
/* the String object is obtained with NEW here, whereas the javastring_new*
   functions use builtin_new() */
548 js = NEW(java_lang_String);
550 #if defined(USE_THREADS) && defined(NATIVE_THREADS)
551 initObjectLock(&js->header);
554 js->header.vftbl = class_java_lang_String->vftbl;
555 js->value = stringdata;
559 /* create new literalstring */
/* the new entry is put at the head of the slot's chain */
561 s = NEW(literalstring);
562 s->hashlink = string_hash.ptr[slot];
563 s->string = (java_objectheader *) js;
564 string_hash.ptr[slot] = s;
566 /* update number of hashtable entries */
568 string_hash.entries++;
570 /* reorganization of hashtable */
/* grow once there are more than two entries per slot on average */
572 if (string_hash.entries > (string_hash.size * 2)) {
573 /* reorganization of hashtable, average length of the external
574 chains is approx. 2 */
578 literalstring *nexts;
579 java_lang_String *tmpjs;
580 hashtable newhash; /* the new hashtable */
582 /* create new hashtable, double the size */
584 init_hashtable(&newhash, string_hash.size * 2);
585 newhash.entries = string_hash.entries;
587 /* transfer elements to new hashtable */
589 for (i = 0; i < string_hash.size; i++) {
590 s = string_hash.ptr[i];
594 tmpjs = (java_lang_String *) s->string;
/* the slot is recomputed from the stored characters (from index 0) and
   masked with the new table size */
595 slot = unicode_hashkey(tmpjs->value->data, tmpjs->count) & (newhash.size - 1);
/* existing entry objects are relinked, not reallocated */
597 s->hashlink = newhash.ptr[slot];
598 newhash.ptr[slot] = s;
600 /* follow link in external hash chain */
605 /* dispose old table */
/* only the old slot array is released; the table descriptor is then
   overwritten by value with the new one */
607 MFREE(string_hash.ptr, void*, string_hash.size);
608 string_hash = newhash;
611 #if defined(USE_THREADS)
612 builtin_monitorexit(lock_string_hashtable);
615 return (java_objectheader *) js;
619 /* literalstring_new ***********************************************************
621 Creates a new javastring with the text of the utf-symbol and inserts it into
622 the string hashtable.

   u: the utf symbol supplying the text

   return: the result of literalstring_u2() for the decoded characters.

   The temporary character array is allocated here with mem_alloc() and
   handed to literalstring_u2() with `false` as the last argument; that
   function frees the array when an equal string already exists.
624 *******************************************************************************/
626 java_objectheader *literalstring_new(utf *u)
628 char *utf_ptr; /* pointer to current unicode character */
630 u4 utflength; /* length of utf-string if uncompressed */
631 java_chararray *a; /* u2-array constructed from utf string */
635 utflength = utf_strlen(u);
637 /* allocate memory */
/* NOTE(review): utflength is a u4; if u4 is unsigned, utflength - 1 wraps
   around for an empty string before the multiplication, which can yield a
   very large request where size_t is wider than u4 - confirm */
638 a = mem_alloc(sizeof(java_chararray) + sizeof(u2) * (utflength - 1) + 10);
640 /* convert utf-string to u2-array */
/* only the data elements are written here; the array header is filled in
   by literalstring_u2() */
641 for (i = 0; i < utflength; i++)
642 a->data[i] = utf_nextu2(&utf_ptr);
/* use all utflength characters, starting at offset 0 */
644 return literalstring_u2(a, utflength, 0, false);
648 /* literalstring_free **********************************************************
650 Removes a javastring from memory.

   sobj: the string object to release; it is accessed as a java_lang_String.

   Both the String object and a character array are released with FREE;
   nothing is returned.
652 *******************************************************************************/
654 void literalstring_free(java_objectheader* sobj)
659 s = (java_lang_String *) sobj;
/* a is presumably the string's character array (s->value); its assignment
   is not visible here - TODO confirm */
662 /* dispose memory of java.lang.String object */
663 FREE(s, java_lang_String);
665 /* dispose memory of java-characterarray */
/* NOTE(review): the size below omits the +10 that literalstring_new() and
   literalstring_u2() add when allocating such arrays. Also, FREE receives
   a type name in the call above but a size expression here - confirm that
   the macro handles both forms as intended. */
666 FREE(a, sizeof(java_chararray) + sizeof(u2) * (a->header.size - 1)); /* +10 ?? */
671 * These are local overrides for various environment variables in Emacs.
672 * Please do not remove this and leave it at the end of the file, where
673 * Emacs will automagically detect them.
674 * ---------------------------------------------------------------------
677 * indent-tabs-mode: t