1 /* src/vm/string.c - java.lang.String related functions
3 Copyright (C) 1996-2005 R. Grafl, A. Krall, C. Kruegel, C. Oates,
4 R. Obermaisser, M. Platter, M. Probst, S. Ring, E. Steiner,
5 C. Thalinger, D. Thuernbeck, P. Tomsich, C. Ullrich, J. Wenninger,
6 Institut f. Computersprachen - TU Wien
8 This file is part of CACAO.
10 This program is free software; you can redistribute it and/or
11 modify it under the terms of the GNU General Public License as
12 published by the Free Software Foundation; either version 2, or (at
13 your option) any later version.
15 This program is distributed in the hope that it will be useful, but
16 WITHOUT ANY WARRANTY; without even the implied warranty of
17 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 General Public License for more details.
20 You should have received a copy of the GNU General Public License
21 along with this program; if not, write to the Free Software
22 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
25 Contact: cacao@complang.tuwien.ac.at
27 Authors: Reinhard Grafl
31 Changes: Christian Thalinger
33 $Id: string.c 2504 2005-05-23 08:22:45Z twisti $
43 #include "vm/global.h"
45 #include "mm/memory.h"
46 #include "native/include/java_lang_String.h"
47 #include "vm/exceptions.h"
48 #include "vm/loader.h"
49 #include "vm/options.h"
50 #include "vm/stringlocal.h"
54 /* global string definitions **************************************************/
/* Unless noted otherwise, each definition in this section is a const char
   pointer initialized with a string literal that spells a class name in
   slash-separated form ("java/lang/..."). */
56 /* exception/error super class */
58 const char *string_java_lang_Throwable =
59 "java/lang/Throwable";
61 const char *string_java_lang_VMThrowable =
62 "java/lang/VMThrowable";
65 /* specify some exception strings for code generation */
67 const char *string_java_lang_ArithmeticException =
68 "java/lang/ArithmeticException";
70 const char *string_java_lang_ArithmeticException_message =
/* NOTE(review): the initializer of string_java_lang_ArithmeticException_message
   is not visible in this view (the embedded numbering skips here); judging by
   the name it is a message text rather than a class name -- confirm against
   the complete file. */
73 const char *string_java_lang_ArrayIndexOutOfBoundsException =
74 "java/lang/ArrayIndexOutOfBoundsException";
76 const char *string_java_lang_ArrayStoreException =
77 "java/lang/ArrayStoreException";
79 const char *string_java_lang_ClassCastException =
80 "java/lang/ClassCastException";
82 const char *string_java_lang_ClassNotFoundException =
83 "java/lang/ClassNotFoundException";
85 const char *string_java_lang_CloneNotSupportedException =
86 "java/lang/CloneNotSupportedException";
88 const char *string_java_lang_Exception =
89 "java/lang/Exception";
91 const char *string_java_lang_IllegalAccessException =
92 "java/lang/IllegalAccessException";
94 const char *string_java_lang_IllegalArgumentException =
95 "java/lang/IllegalArgumentException";
97 const char *string_java_lang_IllegalMonitorStateException =
98 "java/lang/IllegalMonitorStateException";
100 const char *string_java_lang_IndexOutOfBoundsException =
101 "java/lang/IndexOutOfBoundsException";
103 const char *string_java_lang_InstantiationException =
104 "java/lang/InstantiationException";
106 const char *string_java_lang_InterruptedException =
107 "java/lang/InterruptedException";
109 const char *string_java_lang_NegativeArraySizeException =
110 "java/lang/NegativeArraySizeException";
112 const char *string_java_lang_NoSuchFieldException =
113 "java/lang/NoSuchFieldException";
115 const char *string_java_lang_NoSuchMethodException =
116 "java/lang/NoSuchMethodException";
118 const char *string_java_lang_NullPointerException =
119 "java/lang/NullPointerException";
122 /* specify some error strings for code generation */
/* Each definition below pairs a const char pointer with the slash-separated
   name of a java.lang error class. */
124 const char *string_java_lang_AbstractMethodError =
125 "java/lang/AbstractMethodError";
127 const char *string_java_lang_ClassCircularityError =
128 "java/lang/ClassCircularityError";
130 const char *string_java_lang_ClassFormatError =
131 "java/lang/ClassFormatError";
133 const char *string_java_lang_Error =
/* NOTE(review): the initializer of string_java_lang_Error is not visible in
   this view (the embedded numbering skips here); by the pattern of the
   neighbouring definitions it is presumably "java/lang/Error" -- confirm
   against the complete file. */
136 const char *string_java_lang_ExceptionInInitializerError =
137 "java/lang/ExceptionInInitializerError";
139 const char *string_java_lang_IncompatibleClassChangeError =
140 "java/lang/IncompatibleClassChangeError";
142 const char *string_java_lang_InternalError =
143 "java/lang/InternalError";
145 const char *string_java_lang_LinkageError =
146 "java/lang/LinkageError";
148 const char *string_java_lang_NoClassDefFoundError =
149 "java/lang/NoClassDefFoundError";
151 const char *string_java_lang_NoSuchFieldError =
152 "java/lang/NoSuchFieldError";
154 const char *string_java_lang_NoSuchMethodError =
155 "java/lang/NoSuchMethodError";
157 const char *string_java_lang_OutOfMemoryError =
158 "java/lang/OutOfMemoryError";
160 const char *string_java_lang_UnsupportedClassVersionError =
161 "java/lang/UnsupportedClassVersionError";
163 const char *string_java_lang_VerifyError =
164 "java/lang/VerifyError";
166 const char *string_java_lang_VirtualMachineError =
167 "java/lang/VirtualMachineError";
170 /* stringtable_update **********************************************************

   Traverses the javastring hashtable (string_hash) and fills in the
   vftbl entries of javastrings which were temporarily left NULL because
   java.lang.Object was not yet loaded.

   For every entry reached, the String object's vftbl is set to
   class_java_lang_String->vftbl and the character array's vftbl to
   primitivetype_table[ARRAYTYPE_CHAR].arrayvftbl, each only if it is
   still NULL.  An entry without a String object or without a value
   array is reported via log_text().

   Takes no arguments and returns nothing.

   NOTE(review): the embedded listing numbers skip inside this function,
   so the opening brace, the declarations of `a` and `i`, the loop over
   the hash chain, the assignment to `a`, whatever follows the log_text()
   call, and the closing braces are not visible here -- confirm against
   the complete file.

*******************************************************************************/
178 void stringtable_update(void)
180 java_lang_String *js;
182 literalstring *s; /* hashtable entry */
/* visit every slot of the hashtable */
185 for (i = 0; i < string_hash.size; i++) {
186 s = string_hash.ptr[i];
/* the hashtable stores the string as a generic object header */
190 js = (java_lang_String *) s->string;
192 if (!js || !js->value) {
193 /* error in hashtable found */
194 log_text("invalid literalstring in hashtable");
200 if (!js->header.vftbl)
201 /* vftbl of javastring is NULL */
202 js->header.vftbl = class_java_lang_String->vftbl;
/* presumably `a` is js->value at this point; the assignment is not visible */
204 if (!a->header.objheader.vftbl)
205 /* vftbl of character-array is NULL */
206 a->header.objheader.vftbl = primitivetype_table[ARRAYTYPE_CHAR].arrayvftbl;
208 /* follow link in external hash chain */
216 /* javastring_new **************************************************************

   Creates a new object of type java/lang/String with the text of the
   specified utf8-string.

   u: the utf string to convert.

   The String object is obtained from builtin_new() and its character
   array from builtin_newarray_char(); the array is filled by decoding
   utf_strlen(u) characters with utf_nextu2().

   return: pointer to the string or NULL if memory is exhausted.

   A NullPointerException is stored in *exceptionptr on one path;
   presumably when u is NULL, but the guarding condition is not visible.

   NOTE(review): the embedded listing numbers skip inside this function;
   the braces, the declarations of `a` and `i`, the initialization of
   utf_ptr, the allocation-failure check, the remaining field stores and
   the return statements are not visible here -- confirm against the
   complete file.

*******************************************************************************/
225 java_lang_String *javastring_new(utf *u)
227 char *utf_ptr; /* current utf character in utf string */
228 u4 utflength; /* length of utf-string if uncompressed */
229 java_lang_String *s; /* result-string */
234 *exceptionptr = new_nullpointerexception();
/* number of characters the decoded string will hold */
239 utflength = utf_strlen(u);
/* allocate the String object and its character array */
241 s = (java_lang_String *) builtin_new(class_java_lang_String);
242 a = builtin_newarray_char(utflength);
244 /* javastring or character-array could not be created */
248 /* decompress utf-string */
249 for (i = 0; i < utflength; i++)
250 a->data[i] = utf_nextu2(&utf_ptr);
252 /* set fields of the javastring-object */
255 s->count = utflength;
260 /* javastring_new_slash_to_dot *************************************************

   Creates a new object of type java/lang/String with the text of the
   specified utf8-string with slashes changed to dots.

   u: the utf string to convert.

   Allocation and decoding mirror javastring_new(): builtin_new() for
   the String object, builtin_newarray_char() for the array, and
   utf_nextu2() for each of the utf_strlen(u) characters.  Each decoded
   character is first read into `ch`.

   return: pointer to the string or NULL if memory is exhausted.

   A NullPointerException is stored in *exceptionptr on one path;
   presumably when u is NULL, but the guarding condition is not visible.

   NOTE(review): the embedded listing numbers skip inside this function;
   the braces, several declarations, the slash-to-dot substitution and
   the store into the array, the remaining field stores and the return
   statements are not visible here -- confirm against the complete file.

*******************************************************************************/
269 java_lang_String *javastring_new_slash_to_dot(utf *u)
271 char *utf_ptr; /* current utf character in utf string */
272 u4 utflength; /* length of utf-string if uncompressed */
273 java_lang_String *s; /* result-string */
279 *exceptionptr = new_nullpointerexception();
/* number of characters the decoded string will hold */
284 utflength = utf_strlen(u);
/* allocate the String object and its character array */
286 s = (java_lang_String *) builtin_new(class_java_lang_String);
287 a = builtin_newarray_char(utflength);
289 /* javastring or character-array could not be created */
293 /* decompress utf-string */
294 for (i = 0; i < utflength; i++) {
/* fetch the next decoded character; its further handling is not visible */
295 ch = utf_nextu2(&utf_ptr);
301 /* set fields of the javastring-object */
304 s->count = utflength;
310 /* javastring_new_char *********************************************************

   Creates a new java/lang/String object which contains the converted
   C-string passed via text.

   text: the C string to convert.

   Each char of text is stored into the character array by plain
   assignment, one array element per char; no character-set decoding is
   performed in the visible code.

   return: the object pointer or NULL if memory is exhausted.

   A NullPointerException is stored in *exceptionptr on one path;
   presumably when text is NULL, but the guarding condition is not
   visible.

   NOTE(review): the embedded listing numbers skip inside this function;
   the braces, the declarations of `a` and `i`, the computation of `len`,
   the allocation-failure check, the field stores and the return
   statements are not visible here -- confirm against the complete file.
   NOTE(review): if plain char is signed on the target, chars above 0x7f
   would be widened from a negative value by the assignment -- confirm
   whether that matters for callers.

*******************************************************************************/
319 java_lang_String *javastring_new_char(const char *text)
322 s4 len; /* length of the string */
323 java_lang_String *s; /* result-string */
327 *exceptionptr = new_nullpointerexception();
/* allocate the String object and a character array of len elements */
333 s = (java_lang_String *) builtin_new(class_java_lang_String);
334 a = builtin_newarray_char(len);
336 /* javastring or character-array could not be created */
/* copy the text, one array element per char */
341 for (i = 0; i < len; i++)
342 a->data[i] = text[i];
344 /* set fields of the javastring-object */
353 /* javastring_tochar ***********************************************************

   Converts a Java string into a C string.

   so: the Java string, passed as a generic object header and cast to
       java_lang_String.

   The result buffer is obtained with MNEW(char, s->count + 1) and
   filled with the s->count array elements starting at index s->offset
   of the string's character array; each element is assigned to a char.

   return: pointer to C string

   Caution: calling method MUST release the allocated memory!

   NOTE(review): the embedded listing numbers skip inside this function;
   the braces, the declarations of `a`, `buf` and `i`, any checks on `s`
   or its array, the write of the terminator and the return statement
   are not visible here -- confirm against the complete file.
   NOTE(review): the array elements are presumably wider than char (the
   file calls them u2 elsewhere), so the assignment would truncate
   characters that do not fit -- confirm.

*******************************************************************************/
363 char *javastring_tochar(java_objectheader *so)
365 java_lang_String *s = (java_lang_String *) so;
/* one char more than is copied below, presumably for the terminator */
378 buf = MNEW(char, s->count + 1);
/* copy the string's slice of the character array */
380 for (i = 0; i < s->count; i++)
381 buf[i] = a->data[s->offset + i];
389 /* javastring_toutf ************************************************************

   Make utf symbol from javastring.

   string:      the Java string to convert; it is dereferenced without a
                NULL check in the visible code.
   isclassname: passed through unchanged as the last argument of
                utf_new_u2().

   return: the result of utf_new_u2() called on the string's
           characters, i.e. str->count elements starting at
           str->value->data + str->offset.

   NOTE(review): the embedded listing numbers skip around the body; the
   braces are not visible here -- confirm against the complete file.

*******************************************************************************/
395 utf *javastring_toutf(java_lang_String *string, bool isclassname)
/* the cast is to the parameter's own type, so it changes nothing */
397 java_lang_String *str = (java_lang_String *) string;
399 return utf_new_u2(str->value->data + str->offset, str->count, isclassname);
403 /* javastring_strlen ***********************************************************

   Returns the length of the Java string.

   so: the Java string, passed as a generic object header and cast to
       java_lang_String.

   NOTE(review): only the signature and the cast are visible in this
   view; the embedded listing numbers skip over the rest of the body
   (braces, any NULL check, the return statement).  Presumably the
   result is s->count -- confirm against the complete file.

*******************************************************************************/
409 s4 javastring_strlen(java_objectheader *so)
411 java_lang_String *s = (java_lang_String *) so;
420 /* literalstring_u2 ************************************************************

   Searches for the javastring with the specified u2-array in the
   string hashtable; if there is no such string a new one is created.

   If copymode is true a copy of the u2-array is made.

   a:      character array holding the text.
   length: number of characters of the text.
   offset: index into a->data at which the text starts.

   return: the matching javastring already in string_hash or the newly
           created one, as a java_objectheader pointer.

   The new String object and the literalstring entry are obtained with
   NEW(); the entry is linked in at the head of its hash chain.  Once
   string_hash.entries exceeds twice string_hash.size, a table of double
   the size is built, all entries are rehashed into it and the old slot
   array is released.

   NOTE(review): the embedded listing numbers skip inside this function;
   the end of the parameter list, the braces, several declarations, the
   chain loop, the copymode tests, the stores to the remaining String
   fields and the matching #endif are not visible here -- confirm
   against the complete file.

*******************************************************************************/
429 java_objectheader *literalstring_u2(java_chararray *a, u4 length, u4 offset,
432 literalstring *s; /* hashtable element */
433 java_lang_String *js; /* u2-array wrapped in javastring */
434 java_chararray *stringdata; /* copy of u2-array */
439 /* find location in hashtable */
440 key = unicode_hashkey(a->data + offset, length);
/* masking with size - 1 selects a slot; assumes string_hash.size is a
   power of two -- TODO confirm */
441 slot = key & (string_hash.size - 1);
442 s = string_hash.ptr[slot];
445 js = (java_lang_String *) s->string;
/* candidates must match in length and then character by character */
447 if (length == js->count) {
449 for (i = 0; i < length; i++) {
/* NOTE(review): the stored string is read from data[0] without adding
   js->offset; presumably strings in the table always have offset 0 --
   confirm */
450 if (a->data[offset + i] != js->value->data[i])
454 /* string already in hashtable, free memory */
/* NOTE(review): presumably guarded by a test on copymode that is not
   visible here */
456 mem_free(a, sizeof(java_chararray) + sizeof(u2) * (length - 1) + 10);
458 return (java_objectheader *) js;
462 /* follow link in external hash chain */
467 /* create copy of u2-array for new javastring */
/* NOTE(review): if length is 0, length - 1 wraps around should u4 be an
   unsigned type -- confirm how empty strings are sized */
468 u4 arraysize = sizeof(java_chararray) + sizeof(u2) * (length - 1) + 10;
469 stringdata = mem_alloc(arraysize);
470 /* memcpy(stringdata, a, arraysize); */
/* copy the array header, then the characters starting at offset */
471 memcpy(&(stringdata->header), &(a->header), sizeof(java_arrayheader));
/* NOTE(review): &(a->data) + offset advances in units of the whole data
   member, which equals a->data + offset only if data is declared with
   exactly one element -- confirm the declaration */
472 memcpy(&(stringdata->data), &(a->data) + offset, sizeof(u2) * (length - 1) + 10);
478 /* location in hashtable found, complete arrayheader */
479 stringdata->header.objheader.vftbl = primitivetype_table[ARRAYTYPE_CHAR].arrayvftbl;
480 stringdata->header.size = length;
/* make sure the String class is available before its vftbl is used */
482 if (!class_java_lang_String)
483 load_class_bootstrap(utf_java_lang_String,&class_java_lang_String);
484 assert(class_java_lang_String);
485 assert(class_java_lang_String->loaded);
487 /* if we use eager loading, we have to check loaded String class */
489 list_addfirst(&unlinkedclasses, class_java_lang_String);
492 /* create new javastring */
493 js = NEW(java_lang_String);
494 #if defined(USE_THREADS) && defined(NATIVE_THREADS)
495 initObjectLock(&js->header);
497 js->header.vftbl = class_java_lang_String->vftbl;
498 js->value = stringdata;
502 /* create new literalstring */
503 s = NEW(literalstring);
/* link the new entry in at the head of the chain for this slot */
504 s->hashlink = string_hash.ptr[slot];
505 s->string = (java_objectheader *) js;
506 string_hash.ptr[slot] = s;
508 /* update number of hashtable entries */
509 string_hash.entries++;
511 /* reorganization of hashtable */
512 if (string_hash.entries > (string_hash.size * 2)) {
513 /* reorganization of hashtable, average length of
514 the external chains is approx. 2 */
518 hashtable newhash; /* the new hashtable */
520 /* create new hashtable, double the size */
521 init_hashtable(&newhash, string_hash.size * 2);
522 newhash.entries = string_hash.entries;
524 /* transfer elements to new hashtable */
525 for (i = 0; i < string_hash.size; i++) {
526 s = string_hash.ptr[i];
/* remember the successor before the entry is relinked */
528 literalstring *nexts = s->hashlink;
529 js = (java_lang_String *) s->string;
/* recompute the slot with the mask of the new table */
530 slot = unicode_hashkey(js->value->data, js->count) & (newhash.size - 1);
532 s->hashlink = newhash.ptr[slot];
533 newhash.ptr[slot] = s;
535 /* follow link in external hash chain */
540 /* dispose old table */
541 MFREE(string_hash.ptr, void*, string_hash.size);
542 string_hash = newhash;
545 return (java_objectheader *) js;
549 /* literalstring_new ***********************************************************

   Creates a new javastring with the text of the utf-symbol and inserts
   it into the string hashtable.

   u: the utf symbol supplying the text.

   A character array is obtained with mem_alloc(), filled by decoding
   utf_strlen(u) characters with utf_nextu2(), and handed to
   literalstring_u2() with offset 0 and copymode false.

   return: the value returned by literalstring_u2().

   NOTE(review): the embedded listing numbers skip inside this function;
   the braces, the declaration of `i` and the initialization of utf_ptr
   are not visible here -- confirm against the complete file.
   NOTE(review): for an empty string utflength - 1 wraps around should
   u4 be an unsigned type, which would inflate the requested size --
   confirm how empty strings are handled.

*******************************************************************************/
556 java_objectheader *literalstring_new(utf *u)
558 char *utf_ptr; /* pointer to current unicode character */
560 u4 utflength; /* length of utf-string if uncompressed */
561 java_chararray *a; /* u2-array constructed from utf string */
565 utflength = utf_strlen(u);
567 /* allocate memory */
/* same size formula, including the extra 10 bytes, as literalstring_u2() */
568 a = mem_alloc(sizeof(java_chararray) + sizeof(u2) * (utflength - 1) + 10);
570 /* convert utf-string to u2-array */
571 for (i = 0; i < utflength; i++)
572 a->data[i] = utf_nextu2(&utf_ptr);
/* copymode is false: the array itself is passed on, not a copy */
574 return literalstring_u2(a, utflength, 0, false);
578 /* literalstring_free **********************************************************

   Removes a javastring from memory.

   sobj: the javastring, passed as a generic object header and cast to
         java_lang_String.

   Releases the String object first and its character array second.

   NOTE(review): the embedded listing numbers skip inside this function;
   the braces, the declarations of `s` and `a`, and the assignment to
   `a` are not visible here.  `a` is still dereferenced after `s` has
   been released, so it must have been fetched from `s` beforehand --
   confirm against the complete file.
   NOTE(review): literalstring_new() and literalstring_u2() allocate the
   array with an extra + 10 bytes that the size below lacks (the
   original comment already asks "+10 ??"), and FREE is given a type
   name for the String but a size expression for the array -- confirm
   what FREE expects as its second argument.

*******************************************************************************/
584 void literalstring_free(java_objectheader* sobj)
589 s = (java_lang_String *) sobj;
592 /* dispose memory of java.lang.String object */
593 FREE(s, java_lang_String);
595 /* dispose memory of java-characterarray */
596 FREE(a, sizeof(java_chararray) + sizeof(u2) * (a->header.size - 1)); /* +10 ?? */
601 * These are local overrides for various environment variables in Emacs.
602 * Please do not remove this and leave it at the end of the file, where
603 * Emacs will automagically detect them.
604 * ---------------------------------------------------------------------
607 * indent-tabs-mode: t