mirror of
https://github.com/gnustep/libs-base.git
synced 2025-04-23 09:04:13 +00:00
git-svn-id: svn+ssh://svn.gna.org/svn/gnustep/libs/base/trunk@38556 72102866-910b-0410-8b05-ffd578937521
6256 lines
139 KiB
Objective-C
6256 lines
139 KiB
Objective-C
/** Implementation for GNUStep of NSString concrete subclasses
|
||
Copyright (C) 1997,1998,2000 Free Software Foundation, Inc.
|
||
|
||
Base on code written by Stevo Crvenkovski <stevo@btinternet.com>
|
||
Date: February 1997
|
||
|
||
Based on NSGCString and NSString
|
||
Written by: Andrew Kachites McCallum
|
||
<mccallum@gnu.ai.mit.edu>
|
||
Date: March 1995
|
||
|
||
Optimised by Richard Frith-Macdonald <richard@brainstorm.co.uk>
|
||
Date: October 1998
|
||
|
||
Redesign/rewrite by Richard Frith-Macdonald <rfm@gnu.org>
|
||
Date: September 2000
|
||
|
||
This file is part of the GNUstep Base Library.
|
||
|
||
This library is free software; you can redistribute it and/or
|
||
modify it under the terms of the GNU Lesser General Public
|
||
License as published by the Free Software Foundation; either
|
||
version 2 of the License, or (at your option) any later version.
|
||
|
||
This library is distributed in the hope that it will be useful,
|
||
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
Library General Public License for more details.
|
||
|
||
You should have received a copy of the GNU Lesser General Public
|
||
License along with this library; if not, write to the Free
|
||
Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
|
||
Boston, MA 02111 USA.
|
||
*/
|
||
|
||
#import "common.h"
|
||
#import "Foundation/NSCoder.h"
|
||
#import "Foundation/NSArray.h"
|
||
#import "Foundation/NSData.h"
|
||
#import "Foundation/NSDictionary.h"
|
||
#import "Foundation/NSCharacterSet.h"
|
||
#import "Foundation/NSRange.h"
|
||
#import "Foundation/NSException.h"
|
||
#import "Foundation/NSValue.h"
|
||
#import "Foundation/NSKeyedArchiver.h"
|
||
#import "GNUstepBase/GSObjCRuntime.h"
|
||
|
||
#import "GSPrivate.h"
|
||
|
||
#ifdef HAVE_MALLOC_H
|
||
#if !defined(__OpenBSD__)
|
||
#include <malloc.h>
|
||
#endif
|
||
#endif
|
||
|
||
#ifdef HAVE_ALLOCA_H
|
||
#include <alloca.h>
|
||
#endif
|
||
|
||
/* memcpy(), strlen(), strcmp() are gcc builtin's */
|
||
|
||
#import "GNUstepBase/Unicode.h"
|
||
|
||
static NSStringEncoding externalEncoding = 0;
|
||
static NSStringEncoding internalEncoding = NSISOLatin1StringEncoding;
|
||
|
||
static BOOL isByteEncoding(NSStringEncoding enc)
|
||
{
|
||
return GSPrivateIsByteEncoding(enc);
|
||
}
|
||
|
||
#ifdef NeXT_RUNTIME
|
||
/* Used by the Darwin/NeXT ObjC Runtime
|
||
until Apple Radar 2870817 is fixed. */
|
||
struct objc_class _NSConstantStringClassReference;
|
||
#endif
|
||
|
||
/* Determine the length of the UTF-8 string as a unicode (UTF-16) string.
|
||
* sets the ascii flag according to the content found.
|
||
*/
|
||
static NSUInteger
|
||
lengthUTF8(const uint8_t *p, unsigned l, BOOL *ascii, BOOL *latin1)
|
||
{
|
||
const uint8_t *e = p + l;
|
||
BOOL a = YES;
|
||
BOOL l1 = YES;
|
||
|
||
l = 0;
|
||
while (p < e)
|
||
{
|
||
uint8_t c = *p;
|
||
uint32_t u = c;
|
||
|
||
if (c > 0x7f)
|
||
{
|
||
int i, sle = 0;
|
||
|
||
a = NO;
|
||
/* calculated the expected sequence length */
|
||
while (c & 0x80)
|
||
{
|
||
c = c << 1;
|
||
sle++;
|
||
}
|
||
|
||
/* legal ? */
|
||
if ((sle < 2) || (sle > 6))
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"Bad sequence length in constant string"];
|
||
}
|
||
|
||
if (p + sle > e)
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"Short data in constant string"];
|
||
}
|
||
|
||
/* get the codepoint */
|
||
for (i = 1; i < sle; i++)
|
||
{
|
||
if (p[i] < 0x80 || p[i] >= 0xc0)
|
||
break;
|
||
u = (u << 6) | (p[i] & 0x3f);
|
||
}
|
||
|
||
if (i < sle)
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"Codepoint out of range in constant string"];
|
||
}
|
||
u = u & ~(0xffffffff << ((5 * sle) + 1));
|
||
p += sle;
|
||
|
||
/*
|
||
* We check for invalid codepoints here.
|
||
*/
|
||
if (u > 0x10ffff || u == 0xfffe || u == 0xffff
|
||
|| (u >= 0xfdd0 && u <= 0xfdef))
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"Codepoint invalid in constant string"];
|
||
}
|
||
|
||
if ((u >= 0xd800) && (u <= 0xdfff))
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"Bad surrogate pair in constant string"];
|
||
}
|
||
}
|
||
else
|
||
{
|
||
p++;
|
||
}
|
||
|
||
/*
|
||
* Add codepoint as either a single unichar for BMP
|
||
* or as a pair of surrogates for codepoints over 16 bits.
|
||
*/
|
||
if (u < 0x10000)
|
||
{
|
||
l++;
|
||
if (u > 255)
|
||
{
|
||
l1 = NO;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
l += 2;
|
||
}
|
||
}
|
||
if (0 != ascii)
|
||
{
|
||
*ascii = a;
|
||
}
|
||
if (0 != latin1)
|
||
{
|
||
*latin1 = l1;
|
||
}
|
||
return l;
|
||
}
|
||
|
||
/* Count the number of bytes that make up this UTF-8 code point.
|
||
This to keep in mind:
|
||
* This macro doesn't return anything larger than '4'
|
||
* Legal UTF-8 cannot be larger than 4 bytes long (0x10FFFF)
|
||
* It will return 0 for anything illegal
|
||
*/
|
||
#define UTF8_BYTE_COUNT(c) \
|
||
(((c) < 0xf8) ? 1 + ((c) >= 0xc0) + ((c) >= 0xe0) + ((c) >= 0xf0) : 0)
|
||
|
||
/* Sequentially extracts characters from UTF-8 string
|
||
* p = pointer to the utf-8 data
|
||
* l = length (bytes) of the utf-8 data
|
||
* o = pointer to current offset within the data
|
||
* n = pointer to either zero or the next pre-read part of a surrogate pair.
|
||
* The condition for having read the entire string is that the offset (*o)
|
||
* is the number of bytes in the string, and the unichar pointed to by *n
|
||
* is zero (meaning there is no second part of a surrogate pair remaining).
|
||
*/
|
||
static inline unichar
|
||
nextUTF8(const uint8_t *p, unsigned l, unsigned *o, unichar *n)
|
||
{
|
||
unsigned i;
|
||
|
||
/* If we still have the second part of a surrogate pair, return it.
|
||
*/
|
||
if (*n > 0)
|
||
{
|
||
unichar u = *n;
|
||
|
||
*n = 0;
|
||
return u;
|
||
}
|
||
|
||
if ((i = *o) < l)
|
||
{
|
||
uint8_t c = p[i];
|
||
uint32_t u = c;
|
||
|
||
if (c > 0x7f)
|
||
{
|
||
int j, sle = 0;
|
||
|
||
/* calculated the expected sequence length */
|
||
sle = UTF8_BYTE_COUNT(c);
|
||
|
||
/* legal ? */
|
||
if (sle < 2)
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"bad multibyte character length"];
|
||
}
|
||
|
||
if (sle + i > l)
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"multibyte character extends beyond data"];
|
||
}
|
||
|
||
/* get the codepoint */
|
||
for (j = 1; j < sle; j++)
|
||
{
|
||
uint8_t b = p[i + j];
|
||
|
||
if (b < 0x80 || b >= 0xc0)
|
||
break;
|
||
u = (u << 6) | (b & 0x3f);
|
||
}
|
||
|
||
if (j < sle)
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"bad data in multibyte character"];
|
||
}
|
||
u = u & ~(0xffffffff << ((5 * sle) + 1));
|
||
i += sle;
|
||
|
||
/*
|
||
* We discard invalid codepoints here.
|
||
*/
|
||
if (u > 0x10ffff || u == 0xfffe || u == 0xffff
|
||
|| (u >= 0xfdd0 && u <= 0xfdef))
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"invalid unicode codepoint"];
|
||
}
|
||
}
|
||
else
|
||
{
|
||
i++;
|
||
}
|
||
|
||
/*
|
||
* Add codepoint as either a single unichar for BMP
|
||
* or as a pair of surrogates for codepoints over 16 bits.
|
||
*/
|
||
if (u >= 0x10000)
|
||
{
|
||
unichar ul, uh;
|
||
|
||
u -= 0x10000;
|
||
ul = u & 0x3ff;
|
||
uh = (u >> 10) & 0x3ff;
|
||
|
||
*n = ul + 0xdc00; // record second part of pair
|
||
u = uh + 0xd800; // return first part.
|
||
}
|
||
*o = i; // Return new index
|
||
return (unichar)u;
|
||
}
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"no more data in UTF-8 string"];
|
||
return 0;
|
||
}
|
||
|
||
static BOOL
|
||
literalIsEqualInternal(NXConstantString *s, GSStr o)
|
||
{
|
||
unsigned len = o->_count;
|
||
|
||
/* Since UTF-8 is a multibyte character set, it must have at least
|
||
* as many bytes as another string of the same length. So if the
|
||
* UTF-8 string is shorter, the two cannot be equal.
|
||
* A check for this can quickly give us a result in half the cases
|
||
* where the two strings have different lengths.
|
||
*/
|
||
if (len > s->nxcslen)
|
||
{
|
||
return NO;
|
||
}
|
||
else
|
||
{
|
||
NSUInteger pos = 0;
|
||
unichar n = 0;
|
||
unsigned i = 0;
|
||
unichar u;
|
||
|
||
if (0 == o->_flags.wide)
|
||
{
|
||
/* If the other string is a buffer containing ascii characters,
|
||
* we can perform a bytewise comparison.
|
||
*/
|
||
if (internalEncoding == NSASCIIStringEncoding)
|
||
{
|
||
if (len == s->nxcslen
|
||
&& 0 == memcmp(o->_contents.c, s->nxcsptr, len))
|
||
{
|
||
return YES;
|
||
}
|
||
else
|
||
{
|
||
return NO;
|
||
}
|
||
}
|
||
|
||
/* If the other string is a buffer containing latin1 characters,
|
||
* we can compare buffer contents with unichar values directly.
|
||
*/
|
||
if (internalEncoding == NSISOLatin1StringEncoding)
|
||
{
|
||
while (i < s->nxcslen || n > 0)
|
||
{
|
||
u = nextUTF8((const uint8_t *)s->nxcsptr, s->nxcslen, &i, &n);
|
||
if (pos >= len || (unichar)o->_contents.c[pos] != u)
|
||
{
|
||
return NO;
|
||
}
|
||
pos++;
|
||
}
|
||
if (pos != len)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
|
||
/* For any other narrow internal string, we know that ascii is
|
||
* a subset of the encoding, so as long as characters are ascii
|
||
* (don't have the top bit set) we can do bytewise comparison.
|
||
*/
|
||
if (len == s->nxcslen)
|
||
{
|
||
unsigned index;
|
||
|
||
for (index = 0; index < len; index++)
|
||
{
|
||
uint8_t c = s->nxcsptr[index];
|
||
|
||
if (c != o->_contents.c[index] || c >= 128)
|
||
{
|
||
/* Characters differ at this point.
|
||
*/
|
||
break;
|
||
}
|
||
}
|
||
if (index == len)
|
||
{
|
||
return YES;
|
||
}
|
||
/* The characters were the same up to 'index', so we won't
|
||
* need to recheck those first few characters.
|
||
*/
|
||
pos = i = index;
|
||
}
|
||
}
|
||
|
||
/* For small strings, or ones where we already have an array of
|
||
* UTF-16 characters, we can do a UTF-16 comparison directly.
|
||
* For larger strings, we may do as well with a character by
|
||
* character comparison.
|
||
*/
|
||
if (1 == o->_flags.wide || (len < 200 && pos < len))
|
||
{
|
||
unichar *ptr;
|
||
|
||
if (1 == o->_flags.wide)
|
||
{
|
||
ptr = o->_contents.u;
|
||
}
|
||
else
|
||
{
|
||
ptr = alloca(sizeof(unichar) * len);
|
||
if (NO == GSToUnicode(&ptr, &len, o->_contents.c,
|
||
len, internalEncoding, 0, 0))
|
||
{
|
||
return NO;
|
||
}
|
||
}
|
||
|
||
/* Now we have a UTF-16 buffer, so we can do a UTF-16 comparison.
|
||
*/
|
||
while (i < s->nxcslen || n > 0)
|
||
{
|
||
u = nextUTF8((const uint8_t *)s->nxcsptr, s->nxcslen, &i, &n);
|
||
if (pos >= len || ptr[pos] != u)
|
||
{
|
||
return NO;
|
||
}
|
||
pos++;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unichar (*imp)(id, SEL, NSUInteger);
|
||
|
||
/* Do a character by character comparison using characterAtIndex:
|
||
* This will be relatively slow, but how often will we actually
|
||
* need to do this for a literal string? Most string literals will
|
||
* either be short or will differ from any other string we are
|
||
* doing a comparison with within the first few tens of characters.
|
||
*/
|
||
imp = (unichar(*)(id,SEL,NSUInteger))[(id)o methodForSelector:
|
||
@selector(characterAtIndex:)];
|
||
while (i < s->nxcslen || n > 0)
|
||
{
|
||
u = nextUTF8((const uint8_t *)s->nxcsptr, s->nxcslen, &i, &n);
|
||
if (pos >= len
|
||
|| (*imp)((id)o, @selector(characterAtIndex:), pos) != u)
|
||
{
|
||
return NO;
|
||
}
|
||
pos++;
|
||
}
|
||
}
|
||
if (pos != len)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
}
|
||
|
||
|
||
/*
|
||
* GSPlaceholderString - placeholder class for objects awaiting intialisation.
|
||
*/
|
||
@interface GSPlaceholderString : NSString
|
||
{
|
||
NSZone *myZone;
|
||
}
|
||
@end
|
||
|
||
|
||
/*
|
||
GSString is the root class of our hierarchy of string classes. All our
|
||
classes except GSPlaceholderString inherit from it. GSString provides
|
||
the common part of the ivar layout. It also has safe implementations
|
||
of all the memory management methods subclasses should override.
|
||
|
||
Concrete subclasses of GSString are identified by two properties:
|
||
how the string is encoded (its structure; 8-bit data or 16-bit unicode
|
||
data), and how the memory for the contents is handled (its memory
|
||
management).
|
||
|
||
Two direct subclasses of GSString provide the code for the two structures.
|
||
The memory management part of the concrete subclasses is abstracted to
|
||
a single flag for the structure classes: free. This is set only if the
|
||
_contents buffer is guaranteed to remain valid at least until the instance
|
||
has been deallocated.
|
||
|
||
Many optimizations, such as retaining instead of copying, and using pointers
|
||
to another strings _contents buffer, are valid only if this flag is set.
|
||
|
||
GSCString, an abstract class that stores the string as 8-bit data in the
|
||
internal encoding.
|
||
*/
|
||
@interface GSCString : GSString
|
||
{
|
||
}
|
||
@end
|
||
|
||
/*
|
||
And GSUnicodeString, an abstract class that stores the string as 16-bit
|
||
unicode characters.
|
||
*/
|
||
@interface GSUnicodeString : GSString
|
||
{
|
||
}
|
||
@end
|
||
|
||
|
||
/*
|
||
For each memory management scheme, there is a pair of concrete subclasses
|
||
of the two abstract structure classes. Each subclass has a single -init...
|
||
method which can be used to initialize that specific subclass.
|
||
|
||
GS*BufferString, concrete subclasses that store the data in an external
|
||
(wrt. the instance itself) buffer. The buffer may or may not be owned
|
||
by the instance; the 'owned' flag indicates which. If it is set,
|
||
we may need to free the buffer when we are deallocated.
|
||
*/
|
||
@interface GSCBufferString : GSCString
|
||
{
|
||
}
|
||
@end
|
||
|
||
@interface GSUnicodeBufferString : GSUnicodeString
|
||
{
|
||
}
|
||
@end
|
||
|
||
|
||
/*
|
||
GS*InlineString, concrete subclasses that store the data immediately after
|
||
the instance iself.
|
||
*/
|
||
@interface GSCInlineString : GSCString
|
||
{
|
||
}
|
||
@end
|
||
|
||
@interface GSUInlineString : GSUnicodeString
|
||
{
|
||
}
|
||
@end
|
||
|
||
|
||
/*
|
||
GS*SubString, concrete subclasses that use the data in another string
|
||
instance.
|
||
*/
|
||
@interface GSCSubString : GSCString
|
||
{
|
||
@public
|
||
GSString *_parent;
|
||
}
|
||
@end
|
||
|
||
@interface GSUnicodeSubString : GSUnicodeString
|
||
{
|
||
@public
|
||
GSString *_parent;
|
||
}
|
||
@end
|
||
|
||
/*
|
||
* Include sequence handling code with instructions to generate search
|
||
* and compare functions for NSString objects.
|
||
*/
|
||
#define GSEQ_STRCOMP strCompUsNs
|
||
#define GSEQ_STRRANGE strRangeUsNs
|
||
#define GSEQ_O GSEQ_NS
|
||
#define GSEQ_S GSEQ_US
|
||
#include "GSeq.h"
|
||
|
||
#define GSEQ_STRCOMP strCompUsUs
|
||
#define GSEQ_STRRANGE strRangeUsUs
|
||
#define GSEQ_O GSEQ_US
|
||
#define GSEQ_S GSEQ_US
|
||
#include "GSeq.h"
|
||
|
||
#define GSEQ_STRCOMP strCompUsCs
|
||
#define GSEQ_STRRANGE strRangeUsCs
|
||
#define GSEQ_O GSEQ_CS
|
||
#define GSEQ_S GSEQ_US
|
||
#include "GSeq.h"
|
||
|
||
#define GSEQ_STRCOMP strCompCsNs
|
||
#define GSEQ_STRRANGE strRangeCsNs
|
||
#define GSEQ_O GSEQ_NS
|
||
#define GSEQ_S GSEQ_CS
|
||
#include "GSeq.h"
|
||
|
||
#define GSEQ_STRCOMP strCompCsUs
|
||
#define GSEQ_STRRANGE strRangeCsUs
|
||
#define GSEQ_O GSEQ_US
|
||
#define GSEQ_S GSEQ_CS
|
||
#include "GSeq.h"
|
||
|
||
#define GSEQ_STRCOMP strCompCsCs
|
||
#define GSEQ_STRRANGE strRangeCsCs
|
||
#define GSEQ_O GSEQ_CS
|
||
#define GSEQ_S GSEQ_CS
|
||
#include "GSeq.h"
|
||
|
||
#define GSEQ_STRRANGE strRangeNsNs
|
||
#define GSEQ_O GSEQ_NS
|
||
#define GSEQ_S GSEQ_NS
|
||
#include "GSeq.h"
|
||
|
||
static Class NSDataClass = 0;
|
||
static Class NSStringClass = 0;
|
||
static Class GSStringClass = 0;
|
||
static Class GSCStringClass = 0;
|
||
static Class GSCBufferStringClass = 0;
|
||
static Class GSCInlineStringClass = 0;
|
||
static Class GSCSubStringClass = 0;
|
||
static Class GSUnicodeStringClass = 0;
|
||
static Class GSUnicodeBufferStringClass = 0;
|
||
static Class GSUnicodeSubStringClass = 0;
|
||
static Class GSUInlineStringClass = 0;
|
||
static Class GSMutableStringClass = 0;
|
||
static Class NSConstantStringClass = 0;
|
||
|
||
static SEL cMemberSel;
|
||
static SEL convertSel;
|
||
static BOOL (*convertImp)(id, SEL, NSStringEncoding);
|
||
static SEL equalSel;
|
||
static BOOL (*equalImp)(id, SEL, id);
|
||
static SEL hashSel;
|
||
static NSUInteger (*hashImp)(id, SEL);
|
||
|
||
/*
|
||
* The setup() function is called when any concrete string class is
|
||
* initialized, and caches classes and some method implementations.
|
||
*/
|
||
static void
|
||
setup(BOOL rerun)
|
||
{
|
||
static BOOL beenHere = NO;
|
||
|
||
if (!beenHere || rerun)
|
||
{
|
||
beenHere = YES;
|
||
|
||
caiSel = @selector(characterAtIndex:);
|
||
gcrSel = @selector(getCharacters:range:);
|
||
ranSel = @selector(rangeOfComposedCharacterSequenceAtIndex:);
|
||
|
||
/*
|
||
* Cache the default string encoding, and set the internal encoding
|
||
* used by 8-bit character strings to match if possible.
|
||
*/
|
||
externalEncoding = GSPrivateDefaultCStringEncoding();
|
||
if (isByteEncoding(externalEncoding) == YES)
|
||
{
|
||
internalEncoding = externalEncoding;
|
||
}
|
||
|
||
/*
|
||
* Cache pointers to classes to work round misfeature in
|
||
* GNU compiler/runtime system where class lookup is very slow.
|
||
*/
|
||
NSDataClass = [NSData class];
|
||
NSStringClass = [NSString class];
|
||
GSStringClass = [GSString class];
|
||
GSCStringClass = [GSCString class];
|
||
GSUnicodeStringClass = [GSUnicodeString class];
|
||
GSCBufferStringClass = [GSCBufferString class];
|
||
GSUnicodeBufferStringClass = [GSUnicodeBufferString class];
|
||
GSCInlineStringClass = [GSCInlineString class];
|
||
GSUInlineStringClass = [GSUInlineString class];
|
||
GSCSubStringClass = [GSCSubString class];
|
||
GSUnicodeSubStringClass = [GSUnicodeSubString class];
|
||
GSMutableStringClass = [GSMutableString class];
|
||
NSConstantStringClass = [NXConstantString class];
|
||
|
||
/*
|
||
* Cache some selectors and method implementations for
|
||
* cases where we want to use the implementation
|
||
* provided in the abstract rolot cllass of the cluster.
|
||
*/
|
||
cMemberSel = @selector(characterIsMember:);
|
||
convertSel = @selector(canBeConvertedToEncoding:);
|
||
convertImp = (BOOL (*)(id, SEL, NSStringEncoding))
|
||
[NSStringClass instanceMethodForSelector: convertSel];
|
||
equalSel = @selector(isEqualToString:);
|
||
equalImp = (BOOL (*)(id, SEL, id))
|
||
[NSStringClass instanceMethodForSelector: equalSel];
|
||
hashSel = @selector(hash);
|
||
hashImp = (NSUInteger (*)(id, SEL))
|
||
[GSStringClass instanceMethodForSelector: hashSel];
|
||
|
||
caiSel = @selector(characterAtIndex:);
|
||
gcrSel = @selector(getCharacters:range:);
|
||
ranSel = @selector(rangeOfComposedCharacterSequenceAtIndex:);
|
||
}
|
||
}
|
||
|
||
static GSCInlineString*
|
||
newCInline(unsigned length, NSZone *zone)
|
||
{
|
||
GSCInlineString *me;
|
||
|
||
me = (GSCInlineString*)
|
||
NSAllocateObject(GSCInlineStringClass, length, zone);
|
||
me->_contents.c = (unsigned char*)
|
||
(((void*)me)+class_getInstanceSize(GSCInlineStringClass));
|
||
me->_count = length;
|
||
me->_flags.wide = 0;
|
||
me->_flags.owned = 1; // Ignored on dealloc, but means we own buffer
|
||
return me;
|
||
}
|
||
|
||
static GSUInlineString*
|
||
newUInline(unsigned length, NSZone *zone)
|
||
{
|
||
GSUInlineString *me;
|
||
|
||
me = (GSUInlineString*)
|
||
NSAllocateObject(GSUInlineStringClass, length*sizeof(unichar), zone);
|
||
me->_contents.u = (unichar*)
|
||
(((void*)me)+class_getInstanceSize(GSUInlineStringClass));
|
||
me->_count = length;
|
||
me->_flags.wide = 1;
|
||
me->_flags.owned = 1; // Ignored on dealloc, but means we own buffer
|
||
return me;
|
||
}
|
||
|
||
/* Predeclare a few functions
|
||
*/
|
||
static void GSStrWiden(GSStr s);
|
||
static void getCString_u(GSStr self, char *buffer, unsigned int maxLength,
|
||
NSRange aRange, NSRange *leftoverRange);
|
||
|
||
#if defined(OBJC_SMALL_OBJECT_SHIFT) && (OBJC_SMALL_OBJECT_SHIFT == 3)
|
||
#define TINY_STRING_MASK 4
|
||
static BOOL useTinyStrings;
|
||
/**
|
||
* A GSTinyString is used on 64-bit platforms to store up to 8 ASCII (7-bit)
|
||
* characters inside a pointer. Note that a mutable version of this class is
|
||
* not possible, because modifying the string changes the pointer value.
|
||
* The layout of a tiny string is as follows:
|
||
struct
|
||
{
|
||
uintptr_t char0 :7;
|
||
uintptr_t char1 :7;
|
||
uintptr_t char2 :7;
|
||
uintptr_t char3 :7;
|
||
uintptr_t char4 :7;
|
||
uintptr_t char5 :7;
|
||
uintptr_t char6 :7;
|
||
uintptr_t char7 :7;
|
||
uintptr_t length :5;
|
||
uintptr_t tag :3;
|
||
};
|
||
*/
|
||
#define TINY_STRING_CHAR(s, x) ((s & (0xFE00000000000000 >> (x*7))) >> (57-(x*7)))
|
||
#define TINY_STRING_LENGTH_MASK 0x1f
|
||
#define TINY_STRING_LENGTH_SHIFT OBJC_SMALL_OBJECT_SHIFT
|
||
|
||
static BOOL
|
||
tinyEqualToString(uintptr_t s, NSString *aString)
|
||
{
|
||
NSUInteger l;
|
||
|
||
if ((NSString*)s == aString)
|
||
{
|
||
return YES;
|
||
}
|
||
|
||
l = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
if ([aString length] != l)
|
||
{
|
||
return NO;
|
||
}
|
||
else if (l > 0)
|
||
{
|
||
unichar buf[8];
|
||
|
||
[aString getCharacters: buf range: NSMakeRange(0, l)];
|
||
while (l-- > 0)
|
||
{
|
||
if ((unichar)TINY_STRING_CHAR(s, l) != buf[l])
|
||
{
|
||
return NO;
|
||
}
|
||
}
|
||
}
|
||
return YES;
|
||
}
|
||
|
||
@interface GSTinyString : NSString
|
||
@end
|
||
|
||
#ifdef GS_PROFILE_TINY_STRINGS
|
||
static int tinyStrings = 0;
|
||
static void logTinyStringCount(void)
|
||
{
|
||
fprintf(stderr, "%d tiny strings created\n", tinyStrings);
|
||
}
|
||
#endif
|
||
|
||
static int
|
||
tsbytes(uintptr_t s, char *buf)
|
||
{
|
||
int length = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
int index;
|
||
|
||
for (index = 0; index < length; index++)
|
||
{
|
||
buf[index] = (char)TINY_STRING_CHAR(s, index);
|
||
}
|
||
buf[index] = 0;
|
||
return index;
|
||
}
|
||
|
||
@implementation GSTinyString
|
||
|
||
- (BOOL) boolValue
|
||
{
|
||
char buf[9];
|
||
int count = tsbytes((uintptr_t)self, buf);
|
||
int i;
|
||
|
||
for (i = 0; i < count; i++)
|
||
{
|
||
char c = buf[i];
|
||
|
||
if (strchr("123456789yYtT", c) != 0)
|
||
{
|
||
return YES;
|
||
}
|
||
if (!isspace(c) && c != '0' && c != '-' && c != '+')
|
||
{
|
||
break;
|
||
}
|
||
}
|
||
return NO;
|
||
}
|
||
|
||
- (unichar) characterAtIndex: (NSUInteger)anIndex
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
NSUInteger length = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
|
||
if (anIndex >= length)
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"-characterAtIndex: index out of range"];
|
||
}
|
||
// Implicit NULL terminator on slightly-too-long strings.
|
||
if (anIndex == 8)
|
||
{
|
||
return '\0';
|
||
}
|
||
return TINY_STRING_CHAR(s, anIndex);
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
int length = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
int index;
|
||
|
||
for (index = 0; index < length; index++)
|
||
{
|
||
buffer[index] = (unichar)TINY_STRING_CHAR(s, index);
|
||
}
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer range: (NSRange)aRange
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
int length = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
int index;
|
||
int offset;
|
||
|
||
GS_RANGE_CHECK(aRange, length);
|
||
length = NSMaxRange(aRange);
|
||
offset = 0;
|
||
for (index = aRange.location; index < length; index++)
|
||
{
|
||
buffer[offset++] = (unichar)TINY_STRING_CHAR(s, index);
|
||
}
|
||
}
|
||
|
||
- (BOOL) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
int length = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
int index;
|
||
|
||
if (buffer == 0)
|
||
{
|
||
return NO; // Can't fit in here
|
||
}
|
||
if (NSUnicodeStringEncoding == encoding)
|
||
{
|
||
maxLength /= 2;
|
||
if (maxLength > 1)
|
||
{
|
||
unichar *buf = (unichar*)buffer;
|
||
|
||
if (maxLength <= length)
|
||
{
|
||
length = maxLength - 1;
|
||
}
|
||
for (index = 0; index < length; index++)
|
||
{
|
||
buf[index] = (unichar)TINY_STRING_CHAR(s, index);
|
||
}
|
||
buf[index] = 0;
|
||
return YES;
|
||
}
|
||
return NO;
|
||
}
|
||
else if (isByteEncoding(encoding))
|
||
{
|
||
if (maxLength > 0)
|
||
{
|
||
if (maxLength <= length)
|
||
{
|
||
length = maxLength - 1;
|
||
}
|
||
for (index = 0; index < length; index++)
|
||
{
|
||
buffer[index] = (char)TINY_STRING_CHAR(s, index);
|
||
}
|
||
buffer[index] = 0;
|
||
return YES;
|
||
}
|
||
return NO;
|
||
}
|
||
return [super getCString: buffer maxLength: maxLength encoding: encoding];
|
||
}
|
||
|
||
- (NSUInteger) hash
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
int length = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
uint32_t ret = 0;
|
||
|
||
if (length > 0)
|
||
{
|
||
unichar buf[10];
|
||
int index;
|
||
|
||
for (index = 0; index < length; index++)
|
||
{
|
||
buf[index] = (char)TINY_STRING_CHAR(s, index);
|
||
}
|
||
ret = GSPrivateHash(0, buf, length * sizeof(unichar));
|
||
|
||
/*
|
||
* The hash caching in our concrete string classes uses zero to denote
|
||
* an empty cache value, so we MUST NOT return a hash of zero.
|
||
*/
|
||
ret &= 0x0fffffff;
|
||
if (ret == 0)
|
||
{
|
||
ret = 0x0fffffff;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
ret = 0x0ffffffe; /* Hash for an empty string. */
|
||
}
|
||
return ret;
|
||
}
|
||
|
||
- (int) intValue
|
||
{
|
||
char buf[9];
|
||
|
||
tsbytes((uintptr_t)self, buf);
|
||
return strtol(buf, 0, 10);
|
||
}
|
||
|
||
- (NSInteger) integerValue
|
||
{
|
||
char buf[9];
|
||
|
||
tsbytes((uintptr_t)self, buf);
|
||
#if GS_SIZEOF_VOIDP == GS_SIZEOF_LONG
|
||
return strtol(buf, 0, 10);
|
||
#else
|
||
return strtoll(buf, 0, 10);
|
||
#endif
|
||
}
|
||
|
||
- (BOOL) isEqualToString: (NSString*)aString
|
||
{
|
||
return tinyEqualToString((uintptr_t)self, aString);
|
||
}
|
||
|
||
- (NSUInteger) length
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
return (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
}
|
||
|
||
- (long long) longLongValue
|
||
{
|
||
char buf[9];
|
||
|
||
tsbytes((uintptr_t)self, buf);
|
||
return strtoll(buf, 0, 10);
|
||
}
|
||
|
||
- (id) mutableCopyWithZone: (NSZone*)z
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
NSUInteger i;
|
||
NSUInteger l;
|
||
GSMutableString *obj;
|
||
char bytes[8];
|
||
|
||
l = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
for (i = 0; i < l; i++)
|
||
{
|
||
bytes[i] = (unichar)TINY_STRING_CHAR(s, i);
|
||
}
|
||
obj = (GSMutableString*)NSAllocateObject(GSMutableStringClass, 0, z);
|
||
obj = [obj initWithBytes: bytes
|
||
length: l
|
||
encoding: internalEncoding];
|
||
return obj;
|
||
}
|
||
|
||
- (NSRange) rangeOfComposedCharacterSequenceAtIndex: (NSUInteger)anIndex
|
||
{
|
||
uintptr_t s = (uintptr_t)self;
|
||
NSUInteger l = (s >> TINY_STRING_LENGTH_SHIFT) & TINY_STRING_LENGTH_MASK;
|
||
|
||
if (anIndex >= l)
|
||
[NSException raise: NSRangeException format:@"Invalid location."];
|
||
return NSMakeRange(anIndex, 1);
|
||
}
|
||
|
||
- (const char*) UTF8String
|
||
{
|
||
char *buf = GSAutoreleasedBuffer(9);
|
||
|
||
tsbytes((uintptr_t)self, buf);
|
||
return buf;
|
||
}
|
||
|
||
+ (void) load
|
||
{
|
||
useTinyStrings = objc_registerSmallObjectClass_np(self, TINY_STRING_MASK);
|
||
#ifdef GS_PROFILE_TINY_STRINGS
|
||
atexit(logTinyStringCount);
|
||
#endif
|
||
}
|
||
|
||
+ (id) alloc
|
||
{
|
||
return (id)TINY_STRING_MASK;
|
||
}
|
||
|
||
+ (id) allocWithZone: (NSZone*)aZone
|
||
{
|
||
return (id)TINY_STRING_MASK;
|
||
}
|
||
|
||
- (id) copy
|
||
{
|
||
return self;
|
||
}
|
||
|
||
- (id) copyWithZone: (NSZone*)aZone
|
||
{
|
||
return self;
|
||
}
|
||
|
||
- (id) retain
|
||
{
|
||
return self;
|
||
}
|
||
|
||
- (NSUInteger) retainCount
|
||
{
|
||
return UINT_MAX;
|
||
}
|
||
|
||
- (id) autorelease
|
||
{
|
||
return self;
|
||
}
|
||
|
||
- (oneway void) release
|
||
{
|
||
return;
|
||
}
|
||
@end
|
||
|
||
/**
|
||
* Constructs a tiny string.
|
||
*/
|
||
static inline id
|
||
createTinyString(const char *str, int length)
|
||
{
|
||
unsigned int i;
|
||
uintptr_t s = TINY_STRING_MASK;
|
||
|
||
/* No tiny string support detected at run time, give up
|
||
*/
|
||
if (!useTinyStrings)
|
||
{
|
||
return nil;
|
||
}
|
||
|
||
/* String too long to fit in a pointer, give up
|
||
*/
|
||
if (length > 9)
|
||
{
|
||
return nil;
|
||
}
|
||
|
||
/* String would fit if the last byte was an implicit 0, but it isn't.
|
||
*/
|
||
if ((length == 9) && str[8] != '\0')
|
||
{
|
||
return nil;
|
||
}
|
||
|
||
s |= length << TINY_STRING_LENGTH_SHIFT;
|
||
for (i = 0 ; i<length ; i++)
|
||
{
|
||
// If this is not a 7-bit character, we can't use it.
|
||
if (str[i] & 0x80) { return nil; }
|
||
s |= ((uintptr_t)str[i]) << (57 - (i*7));
|
||
}
|
||
#ifdef GS_PROFILE_TINY_STRINGS
|
||
__sync_fetch_and_add(&tinyStrings, 1);
|
||
#endif
|
||
return (id)s;
|
||
}
|
||
#else
|
||
static inline id
|
||
createTinyString(const char *str, int length)
|
||
{
|
||
return nil;
|
||
}
|
||
#endif
|
||
/*
|
||
* The GSPlaceholderString class is used by the abstract cluster root
|
||
* class to provide temporary objects that will be replaced as soon
|
||
* as the objects are initialised. This object tries to replace
|
||
* itself with an appropriate object whose type may vary depending
|
||
* on the initialisation method used.
|
||
*/
|
||
@implementation GSPlaceholderString
|
||
+ (id) allocWithZone: (NSZone*)z
|
||
{
|
||
GSPlaceholderString *o = NSAllocateObject(self, 0, z);
|
||
o->myZone = z;
|
||
return o;
|
||
}
|
||
|
||
+ (void) initialize
|
||
{
|
||
setup(NO);
|
||
}
|
||
|
||
- (id) autorelease
|
||
{
|
||
NSWarnLog(@"-autorelease sent to uninitialised string");
|
||
return self; // placeholders never get released.
|
||
}
|
||
|
||
- (unichar) characterAtIndex: (NSUInteger)index
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"attempt to use uninitialised string"];
|
||
return 0;
|
||
}
|
||
|
||
- (void) dealloc
|
||
{
|
||
NSLog(@"Warning ... attempt to deallocate instance of %@ in zone %p",
|
||
NSStringFromClass([self class]), [self zone]);
|
||
GSNOSUPERDEALLOC; // Placeholders never get deallocated.
|
||
}
|
||
|
||
/*
|
||
* Replace self with an empty inline unicode string.
|
||
*/
|
||
- (id) init
|
||
{
|
||
return [self initWithBytes: 0 length: 0 encoding: internalEncoding];
|
||
}
|
||
|
||
/*
|
||
* Remove any BOM and perform byte swapping if required.
|
||
*/
|
||
static void
|
||
fixBOM(unsigned char **bytes, NSUInteger*length, BOOL *owned,
|
||
NSStringEncoding encoding)
|
||
{
|
||
unsigned char *b = *bytes;
|
||
unsigned len = *length;
|
||
|
||
if (encoding == NSUnicodeStringEncoding && *length >= 2
|
||
&& ((b[0] == 0xFE && b[1] == 0xFF) || (b[0] == 0xFF && b[1] == 0xFE)))
|
||
{
|
||
// Got a byte order marker ... remove it.
|
||
if (len == sizeof(unichar))
|
||
{
|
||
if (*owned)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(b), b);
|
||
*owned = NO;
|
||
}
|
||
*length = 0;
|
||
*bytes = 0;
|
||
}
|
||
else
|
||
{
|
||
unsigned char *from = b;
|
||
unsigned char *to;
|
||
unichar u;
|
||
|
||
// Got a byte order marker ... remove it.
|
||
len -= sizeof(unichar);
|
||
memcpy(&u, from, sizeof(unichar));
|
||
from += sizeof(unichar);
|
||
to = NSAllocateCollectable(len, 0);
|
||
if (u == 0xFEFF)
|
||
{
|
||
// Native byte order
|
||
memcpy(to, from, len);
|
||
}
|
||
else
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < len; i += 2)
|
||
{
|
||
to[i] = from[i+1];
|
||
to[i+1] = from[i];
|
||
}
|
||
}
|
||
if (*owned == YES)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(b), b);
|
||
}
|
||
else
|
||
{
|
||
*owned = YES;
|
||
}
|
||
*length = len;
|
||
*bytes = to;
|
||
}
|
||
}
|
||
else if (encoding == NSUTF8StringEncoding && len >= 3
|
||
&& b[0] == 0xEF && b[1] == 0xBB && b[2] == 0xBF)
|
||
{
|
||
if (len == 3)
|
||
{
|
||
if (*owned)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(b), b);
|
||
*owned = NO;
|
||
}
|
||
*length = 0;
|
||
*bytes = 0;
|
||
}
|
||
else
|
||
{
|
||
unsigned char *from = b;
|
||
unsigned char *to;
|
||
|
||
// Got a byte order marker ... remove it.
|
||
len -= 3;
|
||
from += 3;
|
||
to = NSAllocateCollectable(len, 0);
|
||
memcpy(to, from, len);
|
||
if (*owned == YES)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(b), b);
|
||
}
|
||
else
|
||
{
|
||
*owned = YES;
|
||
}
|
||
*length = len;
|
||
*bytes = to;
|
||
}
|
||
}
|
||
}
|
||
|
||
- (id) initWithBytes: (const void*)bytes
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
const void *original;
|
||
void *chars = 0;
|
||
BOOL flag = NO;
|
||
|
||
if (0 == length)
|
||
{
|
||
return (id)@"";
|
||
}
|
||
|
||
if (0 == bytes)
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"-initWithBytes:lenth:encoding given nul bytes"];
|
||
}
|
||
|
||
#if defined(OBJC_SMALL_OBJECT_SHIFT) && (OBJC_SMALL_OBJECT_SHIFT == 3)
|
||
if (useTinyStrings)
|
||
{
|
||
if (NSASCIIStringEncoding == encoding)
|
||
{
|
||
id tinyString = createTinyString(bytes, length);
|
||
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
}
|
||
if (length < 9)
|
||
{
|
||
if (NSUTF8StringEncoding == encoding
|
||
|| GSPrivateIsByteEncoding(encoding))
|
||
{
|
||
NSUInteger i;
|
||
|
||
for (i = 0; i < length; i++)
|
||
{
|
||
if (((const char*)bytes)[i] & 0x80)
|
||
{
|
||
break;
|
||
}
|
||
}
|
||
if (i == length)
|
||
{
|
||
id tinyString = createTinyString(bytes, length);
|
||
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
}
|
||
#endif
|
||
|
||
original = bytes;
|
||
fixBOM((unsigned char**)&bytes, &length, &flag, encoding);
|
||
/*
|
||
* We need to copy the data if there is any, unless fixBOM()
|
||
* has already done it for us.
|
||
*/
|
||
if (original == bytes)
|
||
{
|
||
#if GS_WITH_GC
|
||
chars = NSAllocateCollectable(length, 0);
|
||
#else
|
||
chars = NSZoneMalloc(myZone, length);
|
||
#endif
|
||
memcpy(chars, bytes, length);
|
||
}
|
||
else
|
||
{
|
||
/*
|
||
* The fixBOM() function has already copied the data and allocated
|
||
* new memory, so we can just pass that to the designated initialiser
|
||
*/
|
||
chars = (void*)bytes;
|
||
}
|
||
|
||
return [self initWithBytesNoCopy: chars
|
||
length: length
|
||
encoding: encoding
|
||
freeWhenDone: YES];
|
||
}
|
||
|
||
- (id) initWithBytesNoCopy: (void*)bytes
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
GSCharPtr chars = { .u = 0 };
|
||
BOOL isASCII = NO;
|
||
BOOL isLatin1 = NO;
|
||
GSStr me;
|
||
|
||
if (0 == length)
|
||
{
|
||
if (YES == flag && 0 != bytes)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(bytes), bytes);
|
||
}
|
||
return (id)@"";
|
||
}
|
||
|
||
fixBOM((unsigned char**)&bytes, &length, &flag, encoding);
|
||
if (encoding == NSUnicodeStringEncoding)
|
||
{
|
||
chars.u = bytes;
|
||
}
|
||
else
|
||
{
|
||
chars.c = bytes;
|
||
}
|
||
|
||
if (encoding == NSUTF8StringEncoding
|
||
|| (encoding != internalEncoding && isByteEncoding(encoding) == YES))
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < length; i++)
|
||
{
|
||
if ((chars.c)[i] > 127)
|
||
{
|
||
if (encoding == NSASCIIStringEncoding)
|
||
{
|
||
if (flag == YES && chars.c != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars.c), chars.c);
|
||
}
|
||
return nil; // Invalid data
|
||
}
|
||
break;
|
||
}
|
||
}
|
||
if (i == length)
|
||
{
|
||
/*
|
||
* This is actually ASCII data ... so we can just store it as if
|
||
* in the internal 8bit encoding scheme.
|
||
*/
|
||
encoding = internalEncoding;
|
||
}
|
||
}
|
||
|
||
if (encoding == internalEncoding)
|
||
{
|
||
#if GS_WITH_GC
|
||
/* If we are using GC, copy and free any non-collectable buffer so
|
||
* we don't leak memory.
|
||
*/
|
||
if (GSPrivateIsCollectable(chars.c) == NO)
|
||
{
|
||
me = newCInline(length, myZone);
|
||
memcpy(me->_contents.c, chars.c, length);
|
||
NSZoneFree(NSZoneFromPointer(chars.c), chars.c);
|
||
return (id)me;
|
||
}
|
||
#endif
|
||
me = (GSStr)NSAllocateObject(GSCBufferStringClass, 0, myZone);
|
||
me->_contents.c = chars.c;
|
||
me->_count = length;
|
||
me->_flags.wide = 0;
|
||
me->_flags.owned = flag;
|
||
return (id)me;
|
||
}
|
||
|
||
/*
|
||
* Any remaining encoding needs to be converted to UTF-16.
|
||
*/
|
||
if (encoding != NSUnicodeStringEncoding)
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
|
||
if (GSPrivateIsEncodingSupported(encoding) == NO)
|
||
{
|
||
if (flag == YES && bytes != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(bytes), bytes);
|
||
}
|
||
return nil; // Invalid encoding
|
||
}
|
||
|
||
if (GSToUnicode(&u, &l, chars.c, length, encoding, myZone, 0) == NO)
|
||
{
|
||
if (flag == YES && chars.c != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars.c), chars.c);
|
||
}
|
||
return nil; // Invalid data
|
||
}
|
||
if (flag == YES && chars.c != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars.c), chars.c);
|
||
}
|
||
chars.u = u;
|
||
length = l * sizeof(unichar);
|
||
flag = YES;
|
||
}
|
||
|
||
length /= sizeof(unichar);
|
||
if (GSUnicode(chars.u, length, &isASCII, &isLatin1) != length)
|
||
{
|
||
if (flag == YES && chars.u != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars.u), chars.u);
|
||
}
|
||
return nil; // Invalid data
|
||
}
|
||
|
||
if (isASCII == YES
|
||
|| (internalEncoding == NSISOLatin1StringEncoding && isLatin1 == YES))
|
||
{
|
||
me = (GSStr)newCInline(length, myZone);
|
||
while (length-- > 0)
|
||
{
|
||
me->_contents.c[length] = chars.u[length];
|
||
}
|
||
if (flag == YES && chars.u != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars.u), chars.u);
|
||
}
|
||
}
|
||
else
|
||
{
|
||
#if GS_WITH_GC
|
||
/* If we are using GC, copy and free any non-collectable buffer so
|
||
* we don't leak memory.
|
||
*/
|
||
if (GSPrivateIsCollectable(chars.u) == NO)
|
||
{
|
||
me = newUInline(length, myZone);
|
||
memcpy(me->_contents.u, chars.u, length * sizeof(unichar));
|
||
NSZoneFree(NSZoneFromPointer(chars.u), chars.u);
|
||
return (id)me;
|
||
}
|
||
#endif
|
||
me = (GSStr)NSAllocateObject(GSUnicodeBufferStringClass, 0, myZone);
|
||
me->_contents.u = chars.u;
|
||
me->_count = length;
|
||
me->_flags.wide = 1;
|
||
me->_flags.owned = flag;
|
||
}
|
||
return (id)me;
|
||
}
|
||
|
||
- (id) initWithCharacters: (const unichar*)chars
|
||
length: (NSUInteger)length
|
||
{
|
||
return [self initWithBytes: (const void*)chars
|
||
length: length * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding];
|
||
}
|
||
|
||
- (id) initWithCharactersNoCopy: (unichar*)chars
|
||
length: (NSUInteger)length
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
return [self initWithBytesNoCopy: (void*)chars
|
||
length: length * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding
|
||
freeWhenDone: flag];
|
||
}
|
||
|
||
- (id) initWithCString: (const char*)chars
|
||
length: (NSUInteger)length
|
||
{
|
||
return [self initWithBytes: (const void*)chars
|
||
length: length
|
||
encoding: externalEncoding];
|
||
}
|
||
|
||
- (id) initWithCStringNoCopy: (char*)chars
|
||
length: (NSUInteger)length
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
return [self initWithBytesNoCopy: (void*)chars
|
||
length: length
|
||
encoding: externalEncoding
|
||
freeWhenDone: flag];
|
||
}
|
||
|
||
- (id) initWithFormat: (NSString*)format
|
||
locale: (NSDictionary*)locale
|
||
arguments: (va_list)argList
|
||
{
|
||
GSStr f;
|
||
unsigned char buf[2048];
|
||
unichar fbuf[1024];
|
||
unichar *fmt = fbuf;
|
||
size_t len;
|
||
GSStr me;
|
||
|
||
/*
|
||
* First we provide an array of unichar characters containing the
|
||
* format string. For performance reasons we try to use an on-stack
|
||
* buffer if the format string is small enough ... it almost always
|
||
* will be.
|
||
*/
|
||
len = [format length];
|
||
if (len >= 1024)
|
||
{
|
||
fmt = NSZoneMalloc(NSDefaultMallocZone(), (len+1)*sizeof(unichar));
|
||
}
|
||
[format getCharacters: fmt];
|
||
fmt[len] = '\0';
|
||
|
||
/*
|
||
* Now set up 'f' as a GSMutableString object whose initial buffer is
|
||
* allocated on the stack. The GSPrivateFormat function can write into it.
|
||
*/
|
||
f = (GSStr)alloca(class_getInstanceSize(GSMutableStringClass));
|
||
object_setClass(f, GSMutableStringClass);
|
||
f->_zone = NSDefaultMallocZone();
|
||
f->_contents.c = buf;
|
||
f->_capacity = sizeof(buf);
|
||
f->_count = 0;
|
||
f->_flags.wide = 0;
|
||
f->_flags.owned = 0;
|
||
GSPrivateFormat(f, fmt, argList, locale);
|
||
if (fmt != fbuf)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), fmt);
|
||
}
|
||
|
||
/*
|
||
* Don't use noCopy because f->_contents.u may be memory on the stack,
|
||
* and even if it wasn't f->_capacity may be greater than f->_count so
|
||
* we could be wasting quite a bit of space. Better to accept a
|
||
* performance hit due to copying data (and allocating/deallocating
|
||
* the temporary buffer) for large strings. For most strings, the
|
||
* on-stack memory will have been used, so we will get better performance.
|
||
*/
|
||
if (f->_flags.wide == 1)
|
||
{
|
||
me = (GSStr)newUInline(f->_count, myZone);
|
||
memcpy(me->_contents.u, f->_contents.u, f->_count*sizeof(unichar));
|
||
}
|
||
else
|
||
{
|
||
me = (GSStr)newCInline(f->_count, myZone);
|
||
memcpy(me->_contents.c, f->_contents.c, f->_count);
|
||
}
|
||
|
||
/*
|
||
* If the string had to grow beyond the initial buffer size, we must
|
||
* release any allocated memory.
|
||
*/
|
||
if (1 == f->_flags.owned)
|
||
{
|
||
NSZoneFree(f->_zone, f->_contents.c);
|
||
}
|
||
return (id)me;
|
||
}
|
||
|
||
/*
|
||
* Replace self with an inline string matching the sort of information
|
||
* given.
|
||
*/
|
||
- (id) initWithString: (NSString*)string
|
||
{
|
||
unsigned length;
|
||
Class c;
|
||
GSStr me;
|
||
|
||
if (string == nil)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"-initWithString: given nil string"];
|
||
if (NO == [string isKindOfClass: NSStringClass]) // may be proxy
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"-initWithString: given non-string object"];
|
||
|
||
c = object_getClass(string);
|
||
length = [string length];
|
||
if (GSObjCIsKindOf(c, GSCStringClass) == YES
|
||
|| (GSObjCIsKindOf(c, GSMutableStringClass) == YES
|
||
&& ((GSStr)string)->_flags.wide == 0))
|
||
{
|
||
/*
|
||
* For a GSCString subclass, or an 8-bit GSMutableString,
|
||
* we can copy the bytes directly into an inline string.
|
||
*/
|
||
me = (GSStr)newCInline(length, myZone);
|
||
memcpy(me->_contents.c, ((GSStr)string)->_contents.c, length);
|
||
}
|
||
else if (GSObjCIsKindOf(c, GSUnicodeStringClass) == YES
|
||
|| GSObjCIsKindOf(c, GSMutableStringClass) == YES)
|
||
{
|
||
/*
|
||
* For a GSUnicodeString subclass, or a 16-bit GSMutableString,
|
||
* we can copy the bytes directly into an inline string.
|
||
*/
|
||
me = (GSStr)newUInline(length, myZone);
|
||
memcpy(me->_contents.u, ((GSStr)string)->_contents.u,
|
||
length*sizeof(unichar));
|
||
}
|
||
else
|
||
{
|
||
/*
|
||
* For a string with an unknown class, we can initialise by
|
||
* having the string copy its content directly into our buffer.
|
||
*/
|
||
me = (GSStr)newUInline(length, myZone);
|
||
[string getCharacters: me->_contents.u];
|
||
}
|
||
return (id)me;
|
||
}
|
||
|
||
- (id) initWithUTF8String: (const char*)bytes
|
||
{
|
||
const uint8_t *b = (const uint8_t*)bytes;
|
||
BOOL ascii = YES;
|
||
NSUInteger length;
|
||
GSStr me;
|
||
uint8_t c;
|
||
|
||
if (0 == bytes)
|
||
{
|
||
return (id)@"";
|
||
}
|
||
/* Skip leading BOM
|
||
*/
|
||
if (b[0] == 0xEF && b[1] == 0xBB && b[2] == 0xBF)
|
||
{
|
||
b = &b[3];
|
||
}
|
||
|
||
length = 0;
|
||
while ((c = b[length]))
|
||
{
|
||
length++;
|
||
if (c > 127)
|
||
{
|
||
ascii = NO;
|
||
while (b[length])
|
||
{
|
||
length++;
|
||
}
|
||
break;
|
||
}
|
||
}
|
||
|
||
if (YES == ascii)
|
||
{
|
||
id o = createTinyString((const char*)b, length);
|
||
|
||
if (nil == o)
|
||
{
|
||
me = (GSStr)newCInline(length, myZone);
|
||
memcpy(me->_contents.c, b, length);
|
||
o = (id)me;
|
||
}
|
||
return o;
|
||
}
|
||
else
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
|
||
if (GSToUnicode(&u, &l, b, length, NSUTF8StringEncoding, myZone, 0) == NO)
|
||
{
|
||
return nil; // Invalid data
|
||
}
|
||
me = (GSStr)NSAllocateObject(GSUnicodeBufferStringClass, 0, myZone);
|
||
me->_contents.u = u;
|
||
me->_count = l;
|
||
me->_flags.wide = 1;
|
||
me->_flags.owned = YES;
|
||
}
|
||
return (id)me;
|
||
}
|
||
|
||
- (NSUInteger) length
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"attempt to use uninitialised string"];
|
||
return 0;
|
||
}
|
||
|
||
- (oneway void) release
|
||
{
|
||
return; // placeholders never get released.
|
||
}
|
||
|
||
- (id) retain
|
||
{
|
||
return self; // placeholders never get retained.
|
||
}
|
||
@end
|
||
|
||
|
||
|
||
/*
|
||
* The following inline functions are used by the concrete string classes
|
||
* to implement their core functionality.
|
||
* GSCString uses the functions with the _c suffix.
|
||
* GSCSubString, GSCInlineString, GSCBufferString
|
||
* inherit methods from GSCString.
|
||
* GSUnicodeString uses the functions with the _u suffix.
|
||
* GSUnicodeSubString, GSUInlineString, and GSUnicodeBufferString
|
||
* inherit methods from GSUnicodeString.
|
||
* GSMutableString uses all the functions, selecting the _c or _u versions
|
||
* depending on whether its storage is 8-bit or 16-bit.
|
||
* In addition, GSMutableString uses a few functions without a suffix that are
|
||
* peculiar to its memory management (shrinking, growing, and converting).
|
||
*/
|
||
|
||
static inline const char*
|
||
UTF8String_c(GSStr self)
|
||
{
|
||
unsigned char *r;
|
||
|
||
if (self->_count == 0)
|
||
{
|
||
return "";
|
||
}
|
||
if (internalEncoding == NSASCIIStringEncoding)
|
||
{
|
||
unsigned i = self->_count;
|
||
|
||
r = (unsigned char*)GSAutoreleasedBuffer(self->_count+1);
|
||
while (i-- > 0)
|
||
{
|
||
r[i] = self->_contents.c[i] & 0x7f;
|
||
}
|
||
r[self->_count] = '\0';
|
||
}
|
||
else
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
unsigned s = 0;
|
||
|
||
/*
|
||
* We must convert from internal format to unicode and then to
|
||
* UTF8 string encoding.
|
||
*/
|
||
if (GSToUnicode(&u, &l, self->_contents.c, self->_count, internalEncoding,
|
||
NSDefaultMallocZone(), 0) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to Unicode string."];
|
||
}
|
||
if (GSFromUnicode((unsigned char**)&r, &s, u, l, NSUTF8StringEncoding,
|
||
NSDefaultMallocZone(), GSUniTerminate|GSUniTemporary|GSUniStrict) == NO)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert from Unicode to UTF8."];
|
||
}
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
}
|
||
|
||
return (const char*)r;
|
||
}
|
||
|
||
static inline const char*
|
||
UTF8String_u(GSStr self)
|
||
{
|
||
unsigned c = self->_count;
|
||
|
||
if (c == 0)
|
||
{
|
||
return "";
|
||
}
|
||
else
|
||
{
|
||
unsigned int l = 0;
|
||
unsigned char *r = 0;
|
||
|
||
if (GSFromUnicode(&r, &l, self->_contents.u, c, NSUTF8StringEncoding,
|
||
NSDefaultMallocZone(), GSUniTerminate|GSUniTemporary|GSUniStrict) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't get UTF8 from Unicode string."];
|
||
}
|
||
return (const char*)r;
|
||
}
|
||
}
|
||
|
||
static inline BOOL
|
||
boolValue_c(GSStr self)
|
||
{
|
||
unsigned count = self->_count;
|
||
unsigned i;
|
||
|
||
for (i = 0; i < count; i++)
|
||
{
|
||
char c = self->_contents.c[i];
|
||
|
||
if (strchr("123456789yYtT", c) != 0)
|
||
{
|
||
return YES;
|
||
}
|
||
if (!isspace(c) && c != '0' && c != '-' && c != '+')
|
||
{
|
||
break;
|
||
}
|
||
}
|
||
return NO;
|
||
}
|
||
|
||
static inline BOOL
|
||
boolValue_u(GSStr self)
|
||
{
|
||
unsigned count = self->_count;
|
||
unsigned i;
|
||
|
||
for (i = 0; i < count; i++)
|
||
{
|
||
unichar c = self->_contents.u[i];
|
||
|
||
if (c > 'y')
|
||
{
|
||
break;
|
||
}
|
||
if (strchr("123456789yYtT", c) != 0)
|
||
{
|
||
return YES;
|
||
}
|
||
if (!isspace(c) && c != '0' && c != '-' && c != '+')
|
||
{
|
||
break;
|
||
}
|
||
}
|
||
return NO;
|
||
}
|
||
|
||
static inline void
|
||
intBuf_c(GSStr self, char *buf)
|
||
{
|
||
unsigned c = self->_count;
|
||
unsigned i = 0;
|
||
unsigned j = 0;
|
||
|
||
while (i < c && isspace(self->_contents.c[i]))
|
||
{
|
||
i++;
|
||
}
|
||
if (i < c)
|
||
{
|
||
char sign = self->_contents.c[i];
|
||
|
||
if ('+' == sign || '-' == sign)
|
||
{
|
||
buf[j++] = sign;
|
||
i++;
|
||
}
|
||
}
|
||
while (i < c && j < 20 && isdigit(self->_contents.c[i]))
|
||
{
|
||
buf[j++] = self->_contents.c[i++];
|
||
}
|
||
buf[j] = '\0';
|
||
}
|
||
|
||
static inline void
|
||
intBuf_u(GSStr self, char *buf)
|
||
{
|
||
unsigned c = self->_count;
|
||
unsigned i = 0;
|
||
unsigned j = 0;
|
||
|
||
while (i < c && isspace(self->_contents.u[i]))
|
||
{
|
||
i++;
|
||
}
|
||
if (i < c)
|
||
{
|
||
unichar sign = self->_contents.u[i];
|
||
|
||
if ('+' == sign || '-' == sign)
|
||
{
|
||
buf[j++] = (char)sign;
|
||
i++;
|
||
}
|
||
}
|
||
while (i < c && j < 20 && isdigit(self->_contents.u[i]))
|
||
{
|
||
buf[j++] = (char)self->_contents.u[i++];
|
||
}
|
||
buf[j] = '\0';
|
||
}
|
||
|
||
static inline BOOL
|
||
canBeConvertedToEncoding_c(GSStr self, NSStringEncoding enc)
|
||
{
|
||
unsigned c = self->_count;
|
||
BOOL result = YES;
|
||
|
||
/*
|
||
* If the length is zero, or we are already using the required encoding,
|
||
* or the required encoding is unicode (can hold any character) then we
|
||
* can assume that a conversion would succeed.
|
||
* We also know a conversion must succeed if the internal encoding is
|
||
* ascii and the required encoding has ascii as a subset.
|
||
*/
|
||
if (c > 0
|
||
&& enc != internalEncoding
|
||
&& enc != NSUTF8StringEncoding
|
||
&& enc != NSUnicodeStringEncoding
|
||
&& ((internalEncoding != NSASCIIStringEncoding) || !isByteEncoding(enc)))
|
||
{
|
||
unsigned l = 0;
|
||
unichar *r = 0;
|
||
|
||
/*
|
||
* To check whether conversion is possible, we first convert to
|
||
* unicode and then check to see whether it is possible to convert
|
||
* to the desired encoding.
|
||
*/
|
||
result = GSToUnicode(&r, &l, self->_contents.c, self->_count,
|
||
internalEncoding, NSDefaultMallocZone(), GSUniStrict);
|
||
if (result == YES)
|
||
{
|
||
if (enc == NSISOLatin1StringEncoding)
|
||
{
|
||
unsigned i;
|
||
|
||
/*
|
||
* If all the unicode characters are in the 0 to 255 range
|
||
* they are all latin1.
|
||
*/
|
||
for (i = 0; i < l; i++)
|
||
{
|
||
if (r[i] > 255)
|
||
{
|
||
result = NO;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
else if (enc == NSASCIIStringEncoding)
|
||
{
|
||
unsigned i;
|
||
|
||
/*
|
||
* If all the unicode characters are in the 0 to 127 range
|
||
* they are all ascii.
|
||
*/
|
||
for (i = 0; i < l; i++)
|
||
{
|
||
if (r[i] > 127)
|
||
{
|
||
result = NO;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unsigned dummy = 0; // Hold returned length.
|
||
|
||
result = GSFromUnicode(0, &dummy, r, l, enc, 0, GSUniStrict);
|
||
}
|
||
|
||
// Temporary unicode string no longer needed.
|
||
NSZoneFree(NSDefaultMallocZone(), r);
|
||
}
|
||
}
|
||
return result;
|
||
}
|
||
|
||
static inline BOOL
|
||
canBeConvertedToEncoding_u(GSStr self, NSStringEncoding enc)
|
||
{
|
||
unsigned c = self->_count;
|
||
BOOL result = YES;
|
||
|
||
if (c > 0)
|
||
{
|
||
if (enc == NSUTF8StringEncoding || enc == NSUnicodeStringEncoding)
|
||
{
|
||
if (GSUnicode(self->_contents.u, c, 0, 0) != c)
|
||
{
|
||
return NO;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
if (enc == NSISOLatin1StringEncoding)
|
||
{
|
||
unsigned i;
|
||
|
||
/*
|
||
* If all the unicode characters are in the 0 to 255 range
|
||
* they are all latin1.
|
||
*/
|
||
for (i = 0; i < self->_count; i++)
|
||
{
|
||
if (self->_contents.u[i] > 255)
|
||
{
|
||
result = NO;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
else if (enc == NSASCIIStringEncoding)
|
||
{
|
||
unsigned i;
|
||
|
||
/*
|
||
* If all the unicode characters are in the 0 to 127 range
|
||
* they are all ascii.
|
||
*/
|
||
for (i = 0; i < self->_count; i++)
|
||
{
|
||
if (self->_contents.u[i] > 127)
|
||
{
|
||
result = NO;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unsigned dummy = 0; // Hold returned length.
|
||
|
||
result = GSFromUnicode(0, &dummy, self->_contents.u, c, enc,
|
||
0, GSUniStrict);
|
||
}
|
||
}
|
||
}
|
||
return result;
|
||
}
|
||
|
||
static inline unichar
|
||
characterAtIndex_c(GSStr self, unsigned index)
|
||
{
|
||
unichar u;
|
||
|
||
if (index >= self->_count)
|
||
[NSException raise: NSRangeException format: @"Invalid index."];
|
||
u = self->_contents.c[index];
|
||
if (u > 127)
|
||
{
|
||
unsigned char c = (unsigned char)u;
|
||
unsigned int s = 1;
|
||
unichar *d = &u;
|
||
|
||
GSToUnicode(&d, &s, &c, 1, internalEncoding, 0, 0);
|
||
}
|
||
return u;
|
||
}
|
||
|
||
static inline unichar
|
||
characterAtIndex_u(GSStr self,unsigned index)
|
||
{
|
||
if (index >= self->_count)
|
||
[NSException raise: NSRangeException format: @"Invalid index."];
|
||
return self->_contents.u[index];
|
||
}
|
||
|
||
static inline NSComparisonResult
|
||
compare_c(GSStr self, NSString *aString, unsigned mask, NSRange aRange)
|
||
{
|
||
Class c;
|
||
|
||
c = object_getClass(aString);
|
||
if (GSObjCIsKindOf(c, GSUnicodeStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)aString)->_flags.wide == 1))
|
||
return strCompCsUs((id)self, aString, mask, aRange);
|
||
else if (GSObjCIsKindOf(c, GSCStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)aString)->_flags.wide == 0))
|
||
return strCompCsCs((id)self, aString, mask, aRange);
|
||
else
|
||
return strCompCsNs((id)self, aString, mask, aRange);
|
||
}
|
||
|
||
static inline NSComparisonResult
|
||
compare_u(GSStr self, NSString *aString, unsigned mask, NSRange aRange)
|
||
{
|
||
Class c;
|
||
|
||
c = object_getClass(aString);
|
||
if (GSObjCIsKindOf(c, GSUnicodeStringClass)
|
||
|| (c == GSMutableStringClass && ((GSStr)aString)->_flags.wide == 1))
|
||
return strCompUsUs((id)self, aString, mask, aRange);
|
||
else if (GSObjCIsKindOf(c, GSCStringClass)
|
||
|| (c == GSMutableStringClass && ((GSStr)aString)->_flags.wide == 0))
|
||
return strCompUsCs((id)self, aString, mask, aRange);
|
||
else
|
||
return strCompUsNs((id)self, aString, mask, aRange);
|
||
}
|
||
|
||
static inline const char*
|
||
cString_c(GSStr self, NSStringEncoding enc)
|
||
{
|
||
unsigned char *r = 0;
|
||
|
||
if (self->_count == 0)
|
||
{
|
||
return "\0";
|
||
}
|
||
else if (enc == internalEncoding)
|
||
{
|
||
r = (unsigned char*)GSAutoreleasedBuffer(self->_count+1);
|
||
|
||
if (self->_count > 0)
|
||
{
|
||
memcpy(r, self->_contents.c, self->_count);
|
||
}
|
||
r[self->_count] = '\0';
|
||
}
|
||
else if (enc == NSUnicodeStringEncoding)
|
||
{
|
||
unsigned l = 0;
|
||
|
||
/*
|
||
* The external C string encoding is unicode ... convert to it.
|
||
*/
|
||
if (GSToUnicode((unichar**)&r, &l, self->_contents.c, self->_count,
|
||
internalEncoding, NSDefaultMallocZone(),
|
||
GSUniTerminate|GSUniTemporary|GSUniStrict) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to Unicode string."];
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
unsigned s = 0;
|
||
|
||
/*
|
||
* The external C string encoding is not compatible with the internal
|
||
* 8-bit character strings ... we must convert from internal format to
|
||
* unicode and then to the external C string encoding.
|
||
*/
|
||
if (GSToUnicode(&u, &l, self->_contents.c, self->_count, internalEncoding,
|
||
NSDefaultMallocZone(), 0) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to Unicode string."];
|
||
}
|
||
if (GSFromUnicode((unsigned char**)&r, &s, u, l, enc,
|
||
NSDefaultMallocZone(), GSUniTerminate|GSUniTemporary|GSUniStrict) == NO)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert from Unicode string."];
|
||
}
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
}
|
||
|
||
return (const char*)r;
|
||
}
|
||
|
||
static inline const char*
|
||
cString_u(GSStr self, NSStringEncoding enc)
|
||
{
|
||
unsigned c = self->_count;
|
||
|
||
if (c == 0)
|
||
{
|
||
return "\0";
|
||
}
|
||
else if (enc == NSUnicodeStringEncoding)
|
||
{
|
||
unichar *tmp;
|
||
unsigned l;
|
||
|
||
if ((l = GSUnicode(self->_contents.u, c, 0, 0)) != c)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"NSString is not legal UTF-16 at %u", l];
|
||
}
|
||
tmp = (unichar*)NSZoneMalloc(NSDefaultMallocZone(), (c + 1)*2);
|
||
memcpy(tmp, self->_contents.u, c*2);
|
||
tmp[c] = 0;
|
||
[NSDataClass dataWithBytesNoCopy: tmp
|
||
length: (c + 1)*2
|
||
freeWhenDone: YES];
|
||
return (const char*)tmp;
|
||
}
|
||
else
|
||
{
|
||
unsigned int l = 0;
|
||
unsigned char *r = 0;
|
||
|
||
if (GSFromUnicode(&r, &l, self->_contents.u, c, enc,
|
||
NSDefaultMallocZone(), GSUniTerminate|GSUniTemporary|GSUniStrict) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't get cString from Unicode string."];
|
||
}
|
||
return (const char*)r;
|
||
}
|
||
}
|
||
|
||
static inline unsigned int
|
||
cStringLength_c(GSStr self, NSStringEncoding enc)
|
||
{
|
||
if (enc == internalEncoding)
|
||
{
|
||
return self->_count;
|
||
}
|
||
else
|
||
{
|
||
/*
|
||
* The external C string encoding is not compatible with the internal
|
||
* 8-bit character strings ... we must convert from internal format to
|
||
* unicode and then to the external C string encoding.
|
||
*/
|
||
if (self->_count == 0)
|
||
{
|
||
return 0;
|
||
}
|
||
else
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
unsigned s = 0;
|
||
|
||
if (GSToUnicode(&u, &l, self->_contents.c, self->_count,
|
||
internalEncoding, NSDefaultMallocZone(), 0) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to/from Unicode string."];
|
||
}
|
||
if (GSFromUnicode(0, &s, u, l, enc, 0, GSUniStrict) == NO)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't get cStringLength from string."];
|
||
}
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
return s;
|
||
}
|
||
}
|
||
}
|
||
|
||
static inline unsigned int
|
||
cStringLength_u(GSStr self, NSStringEncoding enc)
|
||
{
|
||
unsigned c = self->_count;
|
||
|
||
if (c == 0)
|
||
{
|
||
return 0;
|
||
}
|
||
else
|
||
{
|
||
unsigned l = 0;
|
||
|
||
if (GSFromUnicode(0, &l, self->_contents.u, c, enc, 0, GSUniStrict) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't get cStringLength from Unicode string."];
|
||
}
|
||
return l;
|
||
}
|
||
}
|
||
|
||
static inline NSData*
|
||
dataUsingEncoding_c(GSStr self, NSStringEncoding encoding, BOOL lossy)
|
||
{
|
||
unsigned len = self->_count;
|
||
|
||
if (len == 0)
|
||
{
|
||
return [NSDataClass data];
|
||
}
|
||
|
||
if ((encoding == internalEncoding)
|
||
|| ((internalEncoding == NSASCIIStringEncoding)
|
||
&& (encoding == NSUTF8StringEncoding || isByteEncoding(encoding))))
|
||
{
|
||
unsigned char *buff;
|
||
|
||
buff = (unsigned char*)NSZoneMalloc(NSDefaultMallocZone(), len);
|
||
memcpy(buff, self->_contents.c, len);
|
||
return [NSDataClass dataWithBytesNoCopy: buff length: len];
|
||
}
|
||
else if (encoding == NSUnicodeStringEncoding)
|
||
{
|
||
unsigned int l = 0;
|
||
unichar *r = 0;
|
||
unsigned int options = GSUniBOM;
|
||
|
||
if (lossy == NO)
|
||
{
|
||
options |= GSUniStrict;
|
||
}
|
||
|
||
if (GSToUnicode(&r, &l, self->_contents.c, self->_count, internalEncoding,
|
||
NSDefaultMallocZone(), options) == NO)
|
||
{
|
||
return nil;
|
||
}
|
||
return [NSDataClass dataWithBytesNoCopy: r length: l * sizeof(unichar)];
|
||
}
|
||
else
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
unsigned char *r = 0;
|
||
unsigned s = 0;
|
||
|
||
if (GSToUnicode(&u, &l, self->_contents.c, self->_count, internalEncoding,
|
||
NSDefaultMallocZone(), 0) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to Unicode string."];
|
||
}
|
||
if (GSFromUnicode(&r, &s, u, l, encoding, NSDefaultMallocZone(),
|
||
(lossy == NO) ? GSUniStrict : 0) == NO)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
return nil;
|
||
}
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
return [NSDataClass dataWithBytesNoCopy: r length: s];
|
||
}
|
||
}
|
||
|
||
static inline NSData*
|
||
dataUsingEncoding_u(GSStr self, NSStringEncoding encoding, BOOL lossy)
|
||
{
|
||
unsigned len = self->_count;
|
||
|
||
if (len == 0)
|
||
{
|
||
return [NSDataClass data];
|
||
}
|
||
|
||
if (encoding == NSUnicodeStringEncoding)
|
||
{
|
||
unichar *buff;
|
||
unsigned l;
|
||
unsigned from = 0;
|
||
unsigned to = 1;
|
||
|
||
if ((l = GSUnicode(self->_contents.u, len, 0, 0)) != len)
|
||
{
|
||
if (lossy == NO)
|
||
{
|
||
return nil;
|
||
}
|
||
}
|
||
buff = (unichar*)NSZoneMalloc(NSDefaultMallocZone(),
|
||
sizeof(unichar)*(len+1));
|
||
buff[0] = 0xFEFF;
|
||
|
||
while (len > 0)
|
||
{
|
||
if (l > 0)
|
||
{
|
||
memcpy(buff + to, self->_contents.u + from, sizeof(unichar)*l);
|
||
from += l;
|
||
to += l;
|
||
len -= l;
|
||
}
|
||
if (len > 0)
|
||
{
|
||
// A bad character in the string ... skip it.
|
||
if (--len > 0)
|
||
{
|
||
// Not at end ... try another batch.
|
||
from++;
|
||
l = GSUnicode(self->_contents.u + from, len, 0, 0);
|
||
}
|
||
}
|
||
}
|
||
return [NSDataClass dataWithBytesNoCopy: buff
|
||
length: sizeof(unichar)*to];
|
||
}
|
||
else
|
||
{
|
||
unsigned char *r = 0;
|
||
unsigned int l = 0;
|
||
|
||
if (GSFromUnicode(&r, &l, self->_contents.u, self->_count, encoding,
|
||
NSDefaultMallocZone(), (lossy == NO) ? GSUniStrict : 0) == NO)
|
||
{
|
||
return nil;
|
||
}
|
||
return [NSDataClass dataWithBytesNoCopy: r length: l];
|
||
}
|
||
}
|
||
|
||
extern BOOL GSScanDouble(unichar*, unsigned, double*);
|
||
|
||
static inline double
|
||
doubleValue_c(GSStr self)
|
||
{
|
||
const char *ptr = (const char*)self->_contents.c;
|
||
const char *end = ptr + self->_count;
|
||
|
||
while (ptr < end && isspace(*ptr))
|
||
{
|
||
ptr++;
|
||
}
|
||
if (ptr == end)
|
||
{
|
||
return 0.0;
|
||
}
|
||
else
|
||
{
|
||
unsigned s = 99;
|
||
unichar b[100];
|
||
unichar *u = b;
|
||
double d = 0.0;
|
||
|
||
/* use static buffer unless string is really long, in which case
|
||
* we use the stack to allocate a bigger one.
|
||
*/
|
||
if (GSToUnicode(&u, &s, (const uint8_t*)ptr, end - ptr,
|
||
internalEncoding, NSDefaultMallocZone(), GSUniTerminate) == NO)
|
||
{
|
||
return 0.0;
|
||
}
|
||
if (GSScanDouble(u, end - ptr, &d) == NO)
|
||
{
|
||
d = 0.0;
|
||
}
|
||
if (u != b)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
}
|
||
return d;
|
||
}
|
||
}
|
||
|
||
static inline double
|
||
doubleValue_u(GSStr self)
|
||
{
|
||
if (self->_count == 0)
|
||
{
|
||
return 0.0;
|
||
}
|
||
else
|
||
{
|
||
double d = 0.0;
|
||
|
||
GSScanDouble(self->_contents.u, self->_count, &d);
|
||
return d;
|
||
}
|
||
}
|
||
|
||
static inline void
|
||
fillHole(GSStr self, unsigned index, unsigned size)
|
||
{
|
||
NSCAssert(size > 0, @"size <= zero");
|
||
NSCAssert(index + size <= self->_count, @"index + size > length");
|
||
|
||
self->_count -= size;
|
||
if (self->_flags.wide == 1)
|
||
{
|
||
memmove(self->_contents.u + index,
|
||
self->_contents.u + index + size,
|
||
sizeof(unichar)*(self->_count - index));
|
||
}
|
||
else
|
||
{
|
||
memmove(self->_contents.c + index,
|
||
self->_contents.c + index + size, (self->_count - index));
|
||
}
|
||
self->_flags.hash = 0;
|
||
}
|
||
|
||
static inline void
|
||
getCharacters_c(GSStr self, unichar *buffer, NSRange aRange)
|
||
{
|
||
if (aRange.length)
|
||
{
|
||
if (NSISOLatin1StringEncoding == internalEncoding)
|
||
{
|
||
register NSUInteger count = aRange.length;
|
||
register NSUInteger base = aRange.location;
|
||
|
||
while (count-- > 0)
|
||
{
|
||
buffer[count] = self->_contents.c[base + count];
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unsigned len = aRange.length;
|
||
|
||
if (!GSToUnicode(&buffer, &len, self->_contents.c + aRange.location,
|
||
aRange.length, internalEncoding, 0, 0))
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"Can't convert to Unicode."];
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
static inline void
|
||
getCharacters_u(GSStr self, unichar *buffer, NSRange aRange)
|
||
{
|
||
memcpy(buffer, self->_contents.u + aRange.location,
|
||
aRange.length*sizeof(unichar));
|
||
}
|
||
|
||
static void
|
||
getCString_c(GSStr self, char *buffer, unsigned int maxLength,
|
||
NSRange aRange, NSRange *leftoverRange)
|
||
{
|
||
GSMutableString *o;
|
||
int len;
|
||
|
||
if (maxLength > self->_count)
|
||
{
|
||
maxLength = self->_count;
|
||
}
|
||
if (maxLength < aRange.length)
|
||
{
|
||
len = maxLength;
|
||
if (leftoverRange != 0)
|
||
{
|
||
leftoverRange->location = aRange.location + maxLength;
|
||
leftoverRange->length = aRange.length - maxLength;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
len = aRange.length;
|
||
if (leftoverRange != 0)
|
||
{
|
||
leftoverRange->location = 0;
|
||
leftoverRange->length = 0;
|
||
}
|
||
}
|
||
|
||
if (externalEncoding == internalEncoding)
|
||
{
|
||
memcpy(buffer, &self->_contents.c[aRange.location], len);
|
||
buffer[len] = '\0';
|
||
return;
|
||
}
|
||
|
||
if (isByteEncoding(internalEncoding))
|
||
{
|
||
if (externalEncoding == NSUTF8StringEncoding
|
||
|| isByteEncoding(externalEncoding))
|
||
{
|
||
const unsigned char *ptr = self->_contents.c + aRange.location;
|
||
unsigned i;
|
||
|
||
/*
|
||
* Maybe we actually contain ascii data, which can be
|
||
* copied out directly.
|
||
*/
|
||
for (i = 0; i < len; i++)
|
||
{
|
||
unsigned char c = ptr[i];
|
||
|
||
if (c > 127)
|
||
{
|
||
break;
|
||
}
|
||
buffer[i] = c;
|
||
}
|
||
if (i == len)
|
||
{
|
||
buffer[i] = '\0';
|
||
return;
|
||
}
|
||
}
|
||
}
|
||
|
||
/* As the internal and external encodings don't match, the simplest
|
||
* thing to do is widen the internal data to unicode and use the
|
||
* unicode function to get the cString.
|
||
*/
|
||
o = (GSMutableString*)alloca(class_getInstanceSize(GSMutableStringClass));
|
||
object_setClass(o, GSMutableStringClass);
|
||
o->_count = self->_count;
|
||
o->_flags.wide = 0;
|
||
o->_flags.owned = 0;
|
||
o->_flags.unused = 0;
|
||
o->_flags.hash = 0;
|
||
o->_capacity = self->_count;
|
||
o->_contents.c = self->_contents.c;
|
||
o->_zone = NSDefaultMallocZone();
|
||
GSStrWiden(o);
|
||
getCString_u(o, buffer, maxLength, aRange, leftoverRange);
|
||
if (o->_flags.owned == 1)
|
||
{
|
||
NSZoneFree(o->_zone, o->_contents.u);
|
||
}
|
||
}
|
||
|
||
static void
|
||
getCString_u(GSStr self, char *buffer, unsigned int maxLength,
|
||
NSRange aRange, NSRange *leftoverRange)
|
||
{
|
||
/* The primitive we have for converting from unicode, GSFromUnicode,
|
||
can't deal with our leftoverRange case, so we need to use a bit of
|
||
complexity instead. */
|
||
unsigned int len;
|
||
|
||
/* TODO: this is an extremely ugly hack to work around buggy iconvs
|
||
that return -1/E2BIG for buffers larger than 0x40000acf */
|
||
if (maxLength > 0x40000000)
|
||
maxLength = 0x40000000;
|
||
|
||
/* First, try converting the whole thing. */
|
||
len = maxLength;
|
||
if (GSFromUnicode((unsigned char **)&buffer, &len,
|
||
self->_contents.u + aRange.location, aRange.length,
|
||
externalEncoding, 0, GSUniTerminate | GSUniStrict) == YES)
|
||
{
|
||
if (leftoverRange)
|
||
leftoverRange->location = leftoverRange->length = 0;
|
||
return;
|
||
}
|
||
|
||
/* The conversion failed. Either the buffer is too small for the whole
|
||
range, or there are characters in it we can't convert. Check for
|
||
unconvertable characters first. */
|
||
len = 0;
|
||
if (GSFromUnicode(NULL, &len,
|
||
self->_contents.u + aRange.location, aRange.length,
|
||
externalEncoding, 0, GSUniTerminate | GSUniStrict) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't get cString from Unicode string."];
|
||
return;
|
||
}
|
||
|
||
/* The string can be converted, but not all of it. Do a binary search
|
||
to find the longest subrange that fits in the buffer. */
|
||
{
|
||
unsigned int lo, hi, mid;
|
||
|
||
lo = 0;
|
||
hi = aRange.length;
|
||
while (lo < hi)
|
||
{
|
||
mid = (lo + hi + 1) / 2; /* round up to get edge case right */
|
||
len = maxLength;
|
||
if (GSFromUnicode((unsigned char **)&buffer, &len,
|
||
self->_contents.u + aRange.location, mid,
|
||
externalEncoding, 0, GSUniTerminate | GSUniStrict) == YES)
|
||
{
|
||
lo = mid;
|
||
}
|
||
else
|
||
{
|
||
hi = mid - 1;
|
||
}
|
||
}
|
||
|
||
/* lo==hi characters fit. Do the real conversion. */
|
||
len = maxLength;
|
||
if (lo == 0)
|
||
{
|
||
buffer[0] = 0;
|
||
}
|
||
else if (GSFromUnicode((unsigned char **)&buffer, &len,
|
||
self->_contents.u + aRange.location, lo,
|
||
externalEncoding, 0, GSUniTerminate | GSUniStrict) == NO)
|
||
{
|
||
NSCAssert(NO, @"binary search gave inconsistent results");
|
||
}
|
||
|
||
if (leftoverRange)
|
||
{
|
||
leftoverRange->location = aRange.location + lo;
|
||
leftoverRange->length = NSMaxRange(aRange) - leftoverRange->location;
|
||
}
|
||
}
|
||
}
|
||
|
||
static inline BOOL
|
||
getCStringE_c(GSStr self, char *buffer, unsigned int maxLength,
|
||
NSStringEncoding enc)
|
||
{
|
||
if (buffer == 0)
|
||
{
|
||
return NO; // Can't fit in here
|
||
}
|
||
if (enc == NSUnicodeStringEncoding)
|
||
{
|
||
if (maxLength >= sizeof(unichar))
|
||
{
|
||
unsigned bytes = maxLength - sizeof(unichar);
|
||
unichar *u = (unichar*)(void*)buffer;
|
||
|
||
if (GSToUnicode(&u, &bytes, self->_contents.c, self->_count,
|
||
internalEncoding, NSDefaultMallocZone(), GSUniTerminate) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to Unicode string."];
|
||
}
|
||
if (u == (unichar*)(void*)buffer)
|
||
{
|
||
return YES;
|
||
}
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
}
|
||
return NO;
|
||
}
|
||
else
|
||
{
|
||
if (maxLength > sizeof(char))
|
||
{
|
||
unsigned bytes = maxLength - sizeof(char);
|
||
|
||
if (enc == internalEncoding)
|
||
{
|
||
if (bytes > self->_count)
|
||
{
|
||
bytes = self->_count;
|
||
}
|
||
memcpy(buffer, self->_contents.c, bytes);
|
||
buffer[bytes] = '\0';
|
||
if (bytes < self->_count)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
|
||
if (enc == NSUTF8StringEncoding
|
||
&& isByteEncoding(internalEncoding))
|
||
{
|
||
unsigned i;
|
||
|
||
/*
|
||
* Maybe we actually contain ascii data, which can be
|
||
* copied out directly as a utf-8 string.
|
||
*/
|
||
if (bytes > self->_count)
|
||
{
|
||
bytes = self->_count;
|
||
}
|
||
for (i = 0; i < bytes; i++)
|
||
{
|
||
unsigned char c = self->_contents.c[i];
|
||
|
||
if (c > 127)
|
||
{
|
||
break;
|
||
}
|
||
buffer[i] = c;
|
||
}
|
||
if (i == bytes)
|
||
{
|
||
buffer[bytes] = '\0';
|
||
if (bytes < self->_count)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
}
|
||
|
||
if (enc == NSASCIIStringEncoding
|
||
&& isByteEncoding(internalEncoding))
|
||
{
|
||
unsigned i;
|
||
|
||
if (bytes > self->_count)
|
||
{
|
||
bytes = self->_count;
|
||
}
|
||
for (i = 0; i < bytes; i++)
|
||
{
|
||
unsigned char c = self->_contents.c[i];
|
||
|
||
if (c > 127)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"unable to convert to encoding"];
|
||
}
|
||
buffer[i] = c;
|
||
}
|
||
buffer[bytes] = '\0';
|
||
if (bytes < self->_count)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
else
|
||
{
|
||
unichar *u = 0;
|
||
unsigned char *c = (unsigned char*)buffer;
|
||
unsigned l = 0;
|
||
|
||
/*
|
||
* The specified C string encoding is not compatible with
|
||
* the internal 8-bit character strings ... we must convert
|
||
* from internal format to unicode and then to the specified
|
||
* C string encoding.
|
||
*/
|
||
bytes = maxLength - sizeof(char);
|
||
if (GSToUnicode(&u, &l, self->_contents.c, self->_count,
|
||
internalEncoding, NSDefaultMallocZone(), 0) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to Unicode string."];
|
||
}
|
||
if (GSFromUnicode((unsigned char**)&c, &bytes, u, l, enc,
|
||
0, GSUniTerminate|GSUniStrict) == NO)
|
||
{
|
||
c = 0; // Unable to convert
|
||
}
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
if (c == (unsigned char*)buffer)
|
||
{
|
||
return YES; // Fitted in original buffer
|
||
}
|
||
else if (c != 0)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), c);
|
||
}
|
||
}
|
||
}
|
||
return NO;
|
||
}
|
||
}
|
||
|
||
static inline BOOL
|
||
getCStringE_u(GSStr self, char *buffer, unsigned int maxLength,
|
||
NSStringEncoding enc)
|
||
{
|
||
if (enc == NSUnicodeStringEncoding)
|
||
{
|
||
if (maxLength >= sizeof(unichar))
|
||
{
|
||
unsigned bytes = maxLength - sizeof(unichar);
|
||
|
||
if (bytes/sizeof(unichar) > self->_count)
|
||
{
|
||
bytes = self->_count * sizeof(unichar);
|
||
}
|
||
memcpy(buffer, self->_contents.u, bytes);
|
||
buffer[bytes] = '\0';
|
||
buffer[bytes + 1] = '\0';
|
||
if (bytes/sizeof(unichar) == self->_count)
|
||
{
|
||
return YES;
|
||
}
|
||
}
|
||
return NO;
|
||
}
|
||
else
|
||
{
|
||
if (maxLength >= 1)
|
||
{
|
||
if (enc == NSISOLatin1StringEncoding)
|
||
{
|
||
unsigned bytes = maxLength - sizeof(char);
|
||
unsigned i;
|
||
|
||
if (bytes > self->_count)
|
||
{
|
||
bytes = self->_count;
|
||
}
|
||
for (i = 0; i < bytes; i++)
|
||
{
|
||
unichar u = self->_contents.u[i];
|
||
|
||
if (u & 0xff00)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"unable to convert to encoding"];
|
||
}
|
||
buffer[i] = (char)u;
|
||
}
|
||
buffer[i] = '\0';
|
||
if (bytes == self->_count)
|
||
{
|
||
return YES;
|
||
}
|
||
}
|
||
else if (enc == NSASCIIStringEncoding)
|
||
{
|
||
unsigned bytes = maxLength - sizeof(char);
|
||
unsigned i;
|
||
|
||
if (bytes > self->_count)
|
||
{
|
||
bytes = self->_count;
|
||
}
|
||
for (i = 0; i < bytes; i++)
|
||
{
|
||
unichar u = self->_contents.u[i];
|
||
|
||
if (u & 0xff80)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"unable to convert to encoding"];
|
||
}
|
||
buffer[i] = (char)u;
|
||
}
|
||
buffer[i] = '\0';
|
||
if (bytes == self->_count)
|
||
{
|
||
return YES;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unsigned char *c = (unsigned char*)buffer;
|
||
|
||
if (GSFromUnicode((unsigned char**)&c, &maxLength,
|
||
self->_contents.u, self->_count, enc,
|
||
0, GSUniTerminate|GSUniStrict) == NO)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
}
|
||
return NO;
|
||
}
|
||
}
|
||
|
||
static inline BOOL
|
||
isEqual_c(GSStr self, id anObject)
|
||
{
|
||
Class c;
|
||
|
||
if (anObject == (id)self)
|
||
{
|
||
return YES;
|
||
}
|
||
if (anObject == nil)
|
||
{
|
||
return NO;
|
||
}
|
||
c = object_getClass(anObject);
|
||
if (class_isMetaClass(c) == YES)
|
||
{
|
||
return NO;
|
||
}
|
||
if (c == NSConstantStringClass)
|
||
{
|
||
return literalIsEqualInternal((NXConstantString*)anObject, (GSStr)self);
|
||
}
|
||
if (c == GSMutableStringClass || GSObjCIsKindOf(c, GSStringClass) == YES)
|
||
{
|
||
GSStr other = (GSStr)anObject;
|
||
NSRange r = {0, self->_count};
|
||
|
||
/* First see if the hash is the same - if not, we can't be equal.
|
||
* However, it's not worth calculating hashes unless the strings
|
||
* are fairly long.
|
||
*/
|
||
if (self->_count > 15)
|
||
{
|
||
if (self->_flags.hash == 0)
|
||
self->_flags.hash = (*hashImp)((id)self, hashSel);
|
||
if (other->_flags.hash == 0)
|
||
other->_flags.hash = (*hashImp)((id)other, hashSel);
|
||
if (self->_flags.hash != other->_flags.hash)
|
||
return NO;
|
||
}
|
||
else if (self->_flags.hash && other->_flags.hash)
|
||
{
|
||
if (self->_flags.hash != other->_flags.hash)
|
||
return NO;
|
||
}
|
||
|
||
/*
|
||
* Do a compare depending on the type of the other string.
|
||
*/
|
||
if (other->_flags.wide == 1)
|
||
{
|
||
if (strCompCsUs((id)self, (id)other, 0, r) == NSOrderedSame)
|
||
return YES;
|
||
}
|
||
else
|
||
{
|
||
if (other->_count == self->_count
|
||
&& memcmp(other->_contents.c, self->_contents.c, self->_count) == 0)
|
||
return YES;
|
||
}
|
||
return NO;
|
||
}
|
||
else if (YES == [anObject isKindOfClass: NSStringClass]) // may be proxy
|
||
{
|
||
return (*equalImp)((id)self, equalSel, anObject);
|
||
}
|
||
else
|
||
{
|
||
return NO;
|
||
}
|
||
}
|
||
|
||
static inline BOOL
|
||
isEqual_u(GSStr self, id anObject)
|
||
{
|
||
Class c;
|
||
|
||
if (anObject == (id)self)
|
||
{
|
||
return YES;
|
||
}
|
||
if (anObject == nil)
|
||
{
|
||
return NO;
|
||
}
|
||
c = object_getClass(anObject);
|
||
if (class_isMetaClass(c) == YES)
|
||
{
|
||
return NO;
|
||
}
|
||
if (c == NSConstantStringClass)
|
||
{
|
||
return literalIsEqualInternal((NXConstantString*)anObject, (GSStr)self);
|
||
}
|
||
if (c == GSMutableStringClass || GSObjCIsKindOf(c, GSStringClass) == YES)
|
||
{
|
||
GSStr other = (GSStr)anObject;
|
||
NSRange r = {0, self->_count};
|
||
|
||
/* First see if the hash is the same - if not, we can't be equal.
|
||
* However, it's not worth calculating hashes unless the strings
|
||
* are fairly long.
|
||
*/
|
||
if (self->_count > 15)
|
||
{
|
||
if (self->_flags.hash == 0)
|
||
self->_flags.hash = (*hashImp)((id)self, hashSel);
|
||
if (other->_flags.hash == 0)
|
||
other->_flags.hash = (*hashImp)((id)other, hashSel);
|
||
if (self->_flags.hash != other->_flags.hash)
|
||
return NO;
|
||
}
|
||
else if (self->_flags.hash && other->_flags.hash)
|
||
{
|
||
if (self->_flags.hash != other->_flags.hash)
|
||
return NO;
|
||
}
|
||
|
||
/*
|
||
* Do a compare depending on the type of the other string.
|
||
*/
|
||
if (other->_flags.wide == 1)
|
||
{
|
||
if (strCompUsUs((id)self, (id)other, 0, r) == NSOrderedSame)
|
||
return YES;
|
||
}
|
||
else
|
||
{
|
||
if (strCompUsCs((id)self, (id)other, 0, r) == NSOrderedSame)
|
||
return YES;
|
||
}
|
||
return NO;
|
||
}
|
||
else if (YES == [anObject isKindOfClass: NSStringClass]) // may be proxy
|
||
{
|
||
return (*equalImp)((id)self, equalSel, anObject);
|
||
}
|
||
else
|
||
{
|
||
return NO;
|
||
}
|
||
}
|
||
|
||
static inline const char*
|
||
lossyCString_c(GSStr self)
|
||
{
|
||
char *r;
|
||
|
||
if (self->_count == 0)
|
||
{
|
||
return "";
|
||
}
|
||
if (externalEncoding == internalEncoding)
|
||
{
|
||
r = (char*)GSAutoreleasedBuffer(self->_count+1);
|
||
|
||
if (self->_count > 0)
|
||
{
|
||
memcpy(r, self->_contents.c, self->_count);
|
||
}
|
||
r[self->_count] = '\0';
|
||
}
|
||
else
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
unsigned s = 0;
|
||
|
||
/*
|
||
* The external C string encoding is not compatible with the internal
|
||
* 8-bit character strings ... we must convert from internal format to
|
||
* unicode and then to the external C string encoding.
|
||
*/
|
||
if (GSToUnicode(&u, &l, self->_contents.c, self->_count,
|
||
internalEncoding, NSDefaultMallocZone(), 0) == NO)
|
||
{
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to/from Unicode string."];
|
||
}
|
||
if (GSFromUnicode((unsigned char**)&r, &s, u, l, externalEncoding,
|
||
NSDefaultMallocZone(), GSUniTerminate|GSUniTemporary) == NO)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
[NSException raise: NSCharacterConversionException
|
||
format: @"Can't convert to/from Unicode string."];
|
||
}
|
||
NSZoneFree(NSDefaultMallocZone(), u);
|
||
}
|
||
|
||
return r;
|
||
}
|
||
|
||
static inline const char*
|
||
lossyCString_u(GSStr self)
|
||
{
|
||
unsigned l = 0;
|
||
unsigned char *r = 0;
|
||
|
||
GSFromUnicode(&r, &l, self->_contents.u, self->_count, externalEncoding,
|
||
NSDefaultMallocZone(), GSUniTemporary|GSUniTerminate);
|
||
return (const char*)r;
|
||
}
|
||
|
||
static void GSStrMakeSpace(GSStr s, unsigned size)
|
||
{
|
||
unsigned want;
|
||
|
||
want = size + s->_count + 1;
|
||
s->_capacity += s->_capacity/2;
|
||
if (want > s->_capacity)
|
||
{
|
||
s->_capacity = want;
|
||
}
|
||
if (s->_flags.owned == 1)
|
||
{
|
||
/*
|
||
* If we own the character buffer, we can simply realloc.
|
||
*/
|
||
if (s->_flags.wide == 1)
|
||
{
|
||
s->_contents.u = NSZoneRealloc(s->_zone,
|
||
s->_contents.u, s->_capacity*sizeof(unichar));
|
||
}
|
||
else
|
||
{
|
||
s->_contents.c = NSZoneRealloc(s->_zone,
|
||
s->_contents.c, s->_capacity);
|
||
}
|
||
}
|
||
else
|
||
{
|
||
/*
|
||
* If the initial data was not to be freed, we must allocate new
|
||
* buffer, copy the data, and set up the zone we are using.
|
||
*/
|
||
if (s->_zone == 0)
|
||
{
|
||
#if GS_WITH_GC
|
||
s->_zone = GSAtomicMallocZone();
|
||
#else
|
||
s->_zone = [(NSString*)s zone];
|
||
#endif
|
||
}
|
||
if (s->_flags.wide == 1)
|
||
{
|
||
unichar *tmp = s->_contents.u;
|
||
|
||
s->_contents.u = NSZoneMalloc(s->_zone,
|
||
s->_capacity*sizeof(unichar));
|
||
if (s->_count > 0)
|
||
{
|
||
memcpy(s->_contents.u, tmp, s->_count*sizeof(unichar));
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unsigned char *tmp = s->_contents.c;
|
||
|
||
s->_contents.c = NSZoneMalloc(s->_zone, s->_capacity);
|
||
if (s->_count > 0)
|
||
{
|
||
memcpy(s->_contents.c, tmp, s->_count);
|
||
}
|
||
}
|
||
s->_flags.owned = 1;
|
||
}
|
||
}
|
||
|
||
static void GSStrWiden(GSStr s)
|
||
{
|
||
unichar *tmp = 0;
|
||
unsigned len = 0;
|
||
|
||
NSCAssert(s->_flags.wide == 0, @"string is not wide");
|
||
|
||
/*
|
||
* As a special case, where we are ascii or latin1 and the buffer size
|
||
* is big enough, we can widen to unicode without having to allocate
|
||
* more memory or call a character conversion function.
|
||
*/
|
||
if (s->_count <= s->_capacity / 2)
|
||
{
|
||
if (internalEncoding == NSISOLatin1StringEncoding
|
||
|| internalEncoding == NSASCIIStringEncoding)
|
||
{
|
||
len = s->_count;
|
||
while (len-- > 0)
|
||
{
|
||
s->_contents.u[len] = s->_contents.c[len];
|
||
}
|
||
s->_capacity /= 2;
|
||
s->_flags.wide = 1;
|
||
return;
|
||
}
|
||
}
|
||
|
||
if (!s->_zone)
|
||
{
|
||
#if GS_WITH_GC
|
||
s->_zone = GSAtomicMallocZone();
|
||
#else
|
||
s->_zone = [(NSString*)s zone];
|
||
#endif
|
||
}
|
||
|
||
if (!GSToUnicode(&tmp, &len, s->_contents.c, s->_count,
|
||
internalEncoding, s->_zone, 0))
|
||
{
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"widen of string failed"];
|
||
}
|
||
if (s->_flags.owned == 1)
|
||
{
|
||
NSZoneFree(s->_zone, s->_contents.c);
|
||
}
|
||
else
|
||
{
|
||
s->_flags.owned = 1;
|
||
}
|
||
s->_contents.u = tmp;
|
||
s->_flags.wide = 1;
|
||
s->_count = len;
|
||
s->_capacity = len;
|
||
}
|
||
|
||
static inline void
|
||
makeHole(GSStr self, unsigned int index, unsigned int size)
|
||
{
|
||
NSCAssert(size > 0, @"size < zero");
|
||
NSCAssert(index <= self->_count, @"index > length");
|
||
|
||
if (self->_count + size + 1 >= self->_capacity)
|
||
{
|
||
GSStrMakeSpace((GSStr)self, size);
|
||
}
|
||
|
||
if (index < self->_count)
|
||
{
|
||
if (self->_flags.wide == 1)
|
||
{
|
||
memmove(self->_contents.u + index + size,
|
||
self->_contents.u + index,
|
||
sizeof(unichar)*(self->_count - index));
|
||
}
|
||
else
|
||
{
|
||
memmove(self->_contents.c + index + size,
|
||
self->_contents.c + index,
|
||
(self->_count - index));
|
||
}
|
||
}
|
||
|
||
self->_count += size;
|
||
self->_flags.hash = 0;
|
||
}
|
||
|
||
static inline NSRange
|
||
rangeOfSequence_c(GSStr self, unsigned anIndex)
|
||
{
|
||
if (anIndex >= self->_count)
|
||
[NSException raise: NSRangeException format:@"Invalid location."];
|
||
|
||
return (NSRange){anIndex, 1};
|
||
}
|
||
|
||
static inline NSRange
|
||
rangeOfSequence_u(GSStr self, unsigned anIndex)
|
||
{
|
||
unsigned start;
|
||
unsigned end;
|
||
|
||
if (anIndex >= self->_count)
|
||
[NSException raise: NSRangeException format:@"Invalid location."];
|
||
|
||
start = anIndex;
|
||
while (uni_isnonsp(self->_contents.u[start]) && start > 0)
|
||
start--;
|
||
end = start + 1;
|
||
if (end < self->_count)
|
||
while ((end < self->_count) && (uni_isnonsp(self->_contents.u[end])))
|
||
end++;
|
||
return (NSRange){start, end-start};
|
||
}
|
||
|
||
static inline NSRange
|
||
rangeOfCharacter_c(GSStr self, NSCharacterSet *aSet, unsigned mask,
|
||
NSRange aRange)
|
||
{
|
||
int i;
|
||
int start;
|
||
int stop;
|
||
int step;
|
||
NSRange range;
|
||
BOOL (*mImp)(id, SEL, unichar);
|
||
|
||
if (aSet == nil)
|
||
[NSException raise: NSInvalidArgumentException format: @"range of nil"];
|
||
|
||
if ((mask & NSBackwardsSearch) == NSBackwardsSearch)
|
||
{
|
||
start = NSMaxRange(aRange) - 1;
|
||
stop = aRange.location - 1;
|
||
step = -1;
|
||
}
|
||
else
|
||
{
|
||
start = aRange.location;
|
||
stop = NSMaxRange(aRange);
|
||
step = 1;
|
||
}
|
||
range.location = NSNotFound;
|
||
range.length = 0;
|
||
|
||
mImp = (BOOL(*)(id,SEL,unichar))
|
||
[aSet methodForSelector: cMemberSel];
|
||
|
||
for (i = start; i != stop; i += step)
|
||
{
|
||
unichar u = self->_contents.c[i];
|
||
|
||
if (u > 127 && internalEncoding != NSISOLatin1StringEncoding)
|
||
{
|
||
unsigned char c = (unsigned char)u;
|
||
unsigned int s = 1;
|
||
unichar *d = &u;
|
||
|
||
GSToUnicode(&d, &s, &c, 1, internalEncoding, 0, 0);
|
||
}
|
||
/* FIXME ... what about UTF-16 sequences of more than one 16bit value
|
||
* corresponding to a single UCS-32 codepoint?
|
||
*/
|
||
if ((*mImp)(aSet, cMemberSel, u))
|
||
{
|
||
range = NSMakeRange(i, 1);
|
||
break;
|
||
}
|
||
}
|
||
|
||
return range;
|
||
}
|
||
|
||
static inline NSRange
|
||
rangeOfCharacter_u(GSStr self, NSCharacterSet *aSet, unsigned mask,
|
||
NSRange aRange)
|
||
{
|
||
int i;
|
||
int start;
|
||
int stop;
|
||
int step;
|
||
NSRange range;
|
||
BOOL (*mImp)(id, SEL, unichar);
|
||
|
||
if (aSet == nil)
|
||
[NSException raise: NSInvalidArgumentException format: @"range of nil"];
|
||
|
||
if ((mask & NSBackwardsSearch) == NSBackwardsSearch)
|
||
{
|
||
start = NSMaxRange(aRange) - 1;
|
||
stop = aRange.location - 1;
|
||
step = -1;
|
||
}
|
||
else
|
||
{
|
||
start = aRange.location;
|
||
stop = NSMaxRange(aRange);
|
||
step = 1;
|
||
}
|
||
range.location = NSNotFound;
|
||
range.length = 0;
|
||
|
||
mImp = (BOOL(*)(id,SEL,unichar))
|
||
[aSet methodForSelector: cMemberSel];
|
||
|
||
/* FIXME ... what about UTF-16 sequences of more than one 16bit value
|
||
* corresponding to a single UCS-32 codepoint?
|
||
*/
|
||
for (i = start; i != stop; i += step)
|
||
{
|
||
unichar letter = self->_contents.u[i];
|
||
|
||
if ((*mImp)(aSet, cMemberSel, letter))
|
||
{
|
||
range = NSMakeRange(i, 1);
|
||
break;
|
||
}
|
||
}
|
||
|
||
return range;
|
||
}
|
||
|
||
GSRSFunc
|
||
GSPrivateRangeOfString(NSString *receiver, NSString *target)
|
||
{
|
||
Class c;
|
||
|
||
c = object_getClass(receiver);
|
||
if (GSObjCIsKindOf(c, GSUnicodeStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)receiver)->_flags.wide == 1))
|
||
{
|
||
c = object_getClass(target);
|
||
if (GSObjCIsKindOf(c, GSUnicodeStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)target)->_flags.wide == 1))
|
||
return (GSRSFunc)strRangeUsUs;
|
||
else if (GSObjCIsKindOf(c, GSCStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)target)->_flags.wide == 0))
|
||
return (GSRSFunc)strRangeUsCs;
|
||
else
|
||
return (GSRSFunc)strRangeUsNs;
|
||
}
|
||
else if (GSObjCIsKindOf(c, GSCStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)target)->_flags.wide == 0))
|
||
{
|
||
c = object_getClass(target);
|
||
if (GSObjCIsKindOf(c, GSUnicodeStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)target)->_flags.wide == 1))
|
||
return (GSRSFunc)strRangeCsUs;
|
||
else if (GSObjCIsKindOf(c, GSCStringClass) == YES
|
||
|| (c == GSMutableStringClass && ((GSStr)target)->_flags.wide == 0))
|
||
return (GSRSFunc)strRangeCsCs;
|
||
else
|
||
return (GSRSFunc)strRangeCsNs;
|
||
}
|
||
else
|
||
{
|
||
return (GSRSFunc)strRangeNsNs;
|
||
}
|
||
}
|
||
|
||
static inline NSString*
|
||
substring_c(GSStr self, NSRange aRange)
|
||
{
|
||
GSCSubString *o;
|
||
|
||
if (aRange.length == 0)
|
||
{
|
||
return @"";
|
||
}
|
||
o = (typeof(o))NSAllocateObject(GSCSubStringClass,
|
||
0, NSDefaultMallocZone());
|
||
o->_contents.c = self->_contents.c + aRange.location;
|
||
o->_count = aRange.length;
|
||
o->_flags.wide = 0;
|
||
o->_flags.owned = 0;
|
||
ASSIGN(o->_parent, (id)self);
|
||
return AUTORELEASE((id)o);
|
||
}
|
||
|
||
static inline NSString*
|
||
substring_u(GSStr self, NSRange aRange)
|
||
{
|
||
GSCSubString *o;
|
||
|
||
if (aRange.length == 0)
|
||
{
|
||
return @"";
|
||
}
|
||
o = (typeof(o))NSAllocateObject(GSUnicodeSubStringClass,
|
||
0, NSDefaultMallocZone());
|
||
o->_contents.u = self->_contents.u + aRange.location;
|
||
o->_count = aRange.length;
|
||
o->_flags.wide = 1;
|
||
o->_flags.owned = 0;
|
||
ASSIGN(o->_parent, (id)self);
|
||
return AUTORELEASE((id)o);
|
||
}
|
||
|
||
/*
|
||
* Function to examine the given string and see if it is one of our concrete
|
||
* string classes. Converts the mutable string (self) from 8-bit to 16-bit
|
||
* representation if necessary in order to contain the data in aString.
|
||
* Returns a pointer to aStrings GSStr if aString is a concrete class
|
||
* from which contents may be copied directly without conversion.
|
||
*/
|
||
static inline GSStr
|
||
transmute(GSStr self, NSString *aString)
|
||
{
|
||
GSStr other = (GSStr)aString;
|
||
BOOL transmute = YES;
|
||
Class c = object_getClass(aString); // NB aString must not be nil
|
||
|
||
if (self->_flags.wide == 1)
|
||
{
|
||
/*
|
||
* This is already a unicode string, so we don't need to transmute,
|
||
* but we still need to know if the other string is a unicode
|
||
* string whose GSStr we can access directly.
|
||
*/
|
||
transmute = NO;
|
||
if (GSObjCIsKindOf(c, GSUnicodeStringClass) == NO
|
||
&& (c != GSMutableStringClass || other->_flags.wide != 1))
|
||
{
|
||
other = 0;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
/*
|
||
* This is a string held in the internal 8-bit encoding.
|
||
*/
|
||
if (GSObjCIsKindOf(c, GSCStringClass)
|
||
|| (c == GSMutableStringClass && other->_flags.wide == 0))
|
||
{
|
||
/*
|
||
* The other string is also held in the internal 8-bit encoding,
|
||
* so we don't need to transmute, and we can use its GSStr.
|
||
*/
|
||
transmute = NO;
|
||
}
|
||
else if ([aString canBeConvertedToEncoding: internalEncoding] == YES)
|
||
{
|
||
/*
|
||
* The other string can be converted to the internal 8-bit encoding,
|
||
* so we don't need to transmute, but we can *not* use its GSStr.
|
||
*/
|
||
transmute = NO;
|
||
other = 0;
|
||
}
|
||
else if ((c == GSMutableStringClass && other->_flags.wide == 1)
|
||
|| GSObjCIsKindOf(c, GSUnicodeStringClass) == YES)
|
||
{
|
||
/*
|
||
* The other string can not be converted to the internal 8-bit
|
||
* encoding, so we need to transmute, and will then be able to
|
||
* use its GSStr.
|
||
*/
|
||
transmute = YES;
|
||
}
|
||
else
|
||
{
|
||
/*
|
||
* The other string can not be converted to the internal 8-bit
|
||
* character string, so we need to transmute, but even then we
|
||
* will not be able to use the other strings GSStr because that
|
||
* string is not a known GSString subclass.
|
||
*/
|
||
other = 0;
|
||
}
|
||
}
|
||
|
||
if (transmute == YES)
|
||
{
|
||
GSStrWiden((GSStr)self);
|
||
}
|
||
|
||
return other;
|
||
}
|
||
|
||
|
||
|
||
/*
|
||
* The GSString class is actually only provided to provide a common ivar
|
||
* layout for all subclasses, so that they can all share the same code.
|
||
* This class should never be instantiated, and with the exception of
|
||
* -copyWithZone:, none of its memory management related methods
|
||
* (initializers and -dealloc) should ever be called. We guard against
|
||
* this happening.
|
||
*/
|
||
@implementation GSString
|
||
|
||
+ (void) initialize
|
||
{
|
||
setup(NO);
|
||
}
|
||
|
||
+ (void) reinitialize
|
||
{
|
||
setup(YES);
|
||
}
|
||
|
||
- (id) copyWithZone: (NSZone*)z
|
||
{
|
||
[self subclassResponsibility: _cmd];
|
||
return nil;
|
||
}
|
||
|
||
/*
|
||
* Return a 28-bit hash value for the string contents - this
|
||
* MUST match the algorithm used by the NSString base class.
|
||
*/
|
||
- (NSUInteger) hash
|
||
{
|
||
if (self->_flags.hash == 0)
|
||
{
|
||
uint32_t ret = 0;
|
||
int len = (int)self->_count;
|
||
|
||
if (len > 0)
|
||
{
|
||
if (self->_flags.wide)
|
||
{
|
||
const unichar *p = self->_contents.u;
|
||
|
||
ret = GSPrivateHash(0, p, len * sizeof(unichar));
|
||
}
|
||
else if (len > 64)
|
||
{
|
||
return (self->_flags.hash = [super hash]);
|
||
}
|
||
else
|
||
{
|
||
unichar buf[64];
|
||
unsigned index;
|
||
const unsigned char *p = self->_contents.c;
|
||
|
||
if (internalEncoding == NSISOLatin1StringEncoding)
|
||
{
|
||
for (index = 0; index < len; index++)
|
||
{
|
||
buf[index] = p[index];
|
||
}
|
||
}
|
||
else
|
||
{
|
||
for (index = 0; index < len; index++)
|
||
{
|
||
unichar u = p[index];
|
||
|
||
if (u > 127)
|
||
{
|
||
return (self->_flags.hash = [super hash]);
|
||
}
|
||
buf[index] = u;
|
||
}
|
||
}
|
||
ret = GSPrivateHash(0, buf, len * sizeof(unichar));
|
||
}
|
||
|
||
/*
|
||
* The hash caching in our concrete string classes uses zero to denote
|
||
* an empty cache value, so we MUST NOT return a hash of zero.
|
||
*/
|
||
ret &= 0x0fffffff;
|
||
if (ret == 0)
|
||
{
|
||
ret = 0x0fffffff;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
ret = 0x0ffffffe; /* Hash for an empty string. */
|
||
}
|
||
self->_flags.hash = ret;
|
||
}
|
||
|
||
return self->_flags.hash;
|
||
}
|
||
|
||
- (id) initWithBytes: (const void*)chars
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
if (length > 0)
|
||
{
|
||
void *tmp = NSZoneMalloc([self zone], length);
|
||
|
||
memcpy(tmp, chars, length);
|
||
chars = tmp;
|
||
}
|
||
return [self initWithBytesNoCopy: (void*)chars
|
||
length: length
|
||
encoding: encoding
|
||
freeWhenDone: YES];
|
||
}
|
||
|
||
- (id) initWithBytesNoCopy: (void*)chars
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
NSString *c = NSStringFromClass([self class]);
|
||
NSString *s = NSStringFromSelector(_cmd);
|
||
|
||
DESTROY(self);
|
||
[NSException raise: NSInternalInconsistencyException
|
||
format: @"[%@-%@] called on string already initialised", c, s];
|
||
return nil;
|
||
}
|
||
|
||
- (id) initWithCharacters: (const unichar*)chars
|
||
length: (NSUInteger)length
|
||
{
|
||
return [self initWithBytes: chars
|
||
length: length * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding];
|
||
}
|
||
|
||
- (id) initWithCharactersNoCopy: (unichar*)chars
|
||
length: (NSUInteger)length
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
return [self initWithBytesNoCopy: chars
|
||
length: length * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding
|
||
freeWhenDone: flag];
|
||
}
|
||
|
||
- (id) initWithCString: (const char*)chars
|
||
{
|
||
return [self initWithBytes: chars
|
||
length: strlen(chars)
|
||
encoding: externalEncoding];
|
||
}
|
||
|
||
- (id) initWithCString: (const char*)chars
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
return [self initWithBytes: chars
|
||
length: strlen(chars)
|
||
encoding: encoding];
|
||
}
|
||
|
||
- (id) initWithCString: (const char*)chars
|
||
length: (NSUInteger)length
|
||
{
|
||
return [self initWithBytes: chars
|
||
length: length
|
||
encoding: externalEncoding];
|
||
}
|
||
|
||
- (id) initWithCStringNoCopy: (char*)chars
|
||
length: (NSUInteger)length
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
return [self initWithBytesNoCopy: chars
|
||
length: length
|
||
encoding: externalEncoding
|
||
freeWhenDone: flag];
|
||
}
|
||
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSCString
|
||
|
||
- (BOOL) boolValue
|
||
{
|
||
return boolValue_c((GSStr)self);
|
||
}
|
||
|
||
- (BOOL) canBeConvertedToEncoding: (NSStringEncoding)enc
|
||
{
|
||
return canBeConvertedToEncoding_c((GSStr)self, enc);
|
||
}
|
||
|
||
- (unichar) characterAtIndex: (NSUInteger)index
|
||
{
|
||
return characterAtIndex_c((GSStr)self, index);
|
||
}
|
||
|
||
- (NSComparisonResult) compare: (NSString*)aString
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (aString == nil)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] nil string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
if (GSObjCIsInstance(aString) == NO)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] not a string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
return compare_c((GSStr)self, aString, mask, aRange);
|
||
}
|
||
|
||
/*
|
||
Default copy implementation. Retain if we own the buffer and the zones
|
||
agree, create a new GSCInlineString otherwise.
|
||
*/
|
||
- (id) copyWithZone: (NSZone*)z
|
||
{
|
||
if (!_flags.owned || NSShouldRetainWithZone(self, z) == NO)
|
||
{
|
||
GSCInlineString *me = newCInline(_count, z);
|
||
|
||
memcpy(me->_contents.c, _contents.c, _count);
|
||
return me;
|
||
}
|
||
else
|
||
{
|
||
return RETAIN(self);
|
||
}
|
||
}
|
||
|
||
- (const char *) cString
|
||
{
|
||
return cString_c((GSStr)self, externalEncoding);
|
||
}
|
||
|
||
- (const char *) cStringUsingEncoding: (NSStringEncoding)encoding
|
||
{
|
||
return cString_c((GSStr)self, encoding);
|
||
}
|
||
|
||
- (NSUInteger) cStringLength
|
||
{
|
||
return cStringLength_c((GSStr)self, externalEncoding);
|
||
}
|
||
|
||
- (NSData*) dataUsingEncoding: (NSStringEncoding)encoding
|
||
allowLossyConversion: (BOOL)flag
|
||
{
|
||
return dataUsingEncoding_c((GSStr)self, encoding, flag);
|
||
}
|
||
|
||
- (double) doubleValue
|
||
{
|
||
return doubleValue_c((GSStr)self);
|
||
}
|
||
|
||
- (void) encodeWithCoder: (NSCoder*)aCoder
|
||
{
|
||
if ([aCoder allowsKeyedCoding])
|
||
{
|
||
[(NSKeyedArchiver*)aCoder _encodePropertyList: self forKey: @"NS.string"];
|
||
return;
|
||
}
|
||
|
||
[aCoder encodeValueOfObjCType: @encode(unsigned) at: &_count];
|
||
if (_count > 0)
|
||
{
|
||
[aCoder encodeValueOfObjCType: @encode(int)
|
||
at: &internalEncoding];
|
||
[aCoder encodeArrayOfObjCType: @encode(unsigned char)
|
||
count: _count
|
||
at: _contents.c];
|
||
}
|
||
}
|
||
|
||
- (NSStringEncoding) fastestEncoding
|
||
{
|
||
return internalEncoding;
|
||
}
|
||
|
||
- (float) floatValue
|
||
{
|
||
return doubleValue_c((GSStr)self);
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer
|
||
{
|
||
getCharacters_c((GSStr)self, buffer, (NSRange){0, _count});
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
getCharacters_c((GSStr)self, buffer, aRange);
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
{
|
||
getCString_c((GSStr)self, buffer, NSMaximumStringLength,
|
||
(NSRange){0, _count}, 0);
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
{
|
||
getCString_c((GSStr)self, buffer, maxLength, (NSRange){0, _count}, 0);
|
||
}
|
||
|
||
- (BOOL) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
return getCStringE_c((GSStr)self, buffer, maxLength, encoding);
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
range: (NSRange)aRange
|
||
remainingRange: (NSRange*)leftoverRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
getCString_c((GSStr)self, buffer, maxLength, aRange, leftoverRange);
|
||
}
|
||
|
||
- (int) intValue
|
||
{
|
||
char buf[24];
|
||
|
||
intBuf_c((GSStr)self, buf);
|
||
return strtol(buf, 0, 10);
|
||
}
|
||
|
||
- (NSInteger) integerValue
|
||
{
|
||
char buf[24];
|
||
|
||
intBuf_c((GSStr)self, buf);
|
||
#if GS_SIZEOF_VOIDP == GS_SIZEOF_LONG
|
||
return strtol(buf, 0, 10);
|
||
#else
|
||
return strtoll(buf, 0, 10);
|
||
#endif
|
||
}
|
||
|
||
- (BOOL) isEqual: (id)anObject
|
||
{
|
||
return isEqual_c((GSStr)self, anObject);
|
||
}
|
||
|
||
- (BOOL) isEqualToString: (NSString*)anObject
|
||
{
|
||
return isEqual_c((GSStr)self, anObject);
|
||
}
|
||
|
||
- (NSUInteger) length
|
||
{
|
||
return _count;
|
||
}
|
||
|
||
- (NSUInteger) lengthOfBytesUsingEncoding: (NSStringEncoding)encoding
|
||
{
|
||
return cStringLength_c((GSStr)self, encoding);
|
||
}
|
||
|
||
- (long long) longLongValue
|
||
{
|
||
char buf[24];
|
||
|
||
intBuf_c((GSStr)self, buf);
|
||
return strtoll(buf, 0, 10);
|
||
}
|
||
|
||
- (const char*) lossyCString
|
||
{
|
||
return lossyCString_c((GSStr)self);
|
||
}
|
||
|
||
- (id) mutableCopy
|
||
{
|
||
GSMutableString *obj;
|
||
|
||
obj = (GSMutableString*)NSAllocateObject(GSMutableStringClass, 0,
|
||
NSDefaultMallocZone());
|
||
obj = [obj initWithBytes: (char*)_contents.c
|
||
length: _count
|
||
encoding: internalEncoding];
|
||
return obj;
|
||
}
|
||
|
||
- (id) mutableCopyWithZone: (NSZone*)z
|
||
{
|
||
GSMutableString *obj;
|
||
|
||
obj = (GSMutableString*)NSAllocateObject(GSMutableStringClass, 0, z);
|
||
obj = [obj initWithBytes: (char*)_contents.c
|
||
length: _count
|
||
encoding: internalEncoding];
|
||
return obj;
|
||
}
|
||
|
||
- (NSRange) rangeOfComposedCharacterSequenceAtIndex: (NSUInteger)anIndex
|
||
{
|
||
return rangeOfSequence_c((GSStr)self, anIndex);
|
||
}
|
||
|
||
- (NSRange) rangeOfCharacterFromSet: (NSCharacterSet*)aSet
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
return rangeOfCharacter_c((GSStr)self, aSet, mask, aRange);
|
||
}
|
||
|
||
- (NSStringEncoding) smallestEncoding
|
||
{
|
||
return internalEncoding;
|
||
}
|
||
|
||
- (NSString*) substringFromRange: (NSRange)aRange
|
||
{
|
||
if (!_flags.wide)
|
||
{
|
||
id tinyString;
|
||
|
||
tinyString = createTinyString((char*)_contents.c + aRange.location,
|
||
aRange.length);
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
}
|
||
if (_flags.owned)
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
return substring_c((GSStr)self, aRange);
|
||
}
|
||
return [super substringWithRange: aRange];
|
||
}
|
||
|
||
- (NSString*) substringWithRange: (NSRange)aRange
|
||
{
|
||
if (_flags.owned)
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
return substring_c((GSStr)self, aRange);
|
||
}
|
||
if (!_flags.wide)
|
||
{
|
||
id tinyString;
|
||
|
||
tinyString = createTinyString((char*)_contents.c + aRange.location,
|
||
aRange.length);
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
}
|
||
return [super substringWithRange: aRange];
|
||
}
|
||
|
||
- (const char *) UTF8String
|
||
{
|
||
return UTF8String_c((GSStr)self);
|
||
}
|
||
|
||
// private method for Unicode level 3 implementation
|
||
- (int) _baseLength
|
||
{
|
||
return _count;
|
||
}
|
||
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSCBufferString
|
||
- (void) dealloc
|
||
{
|
||
if (_contents.c != 0)
|
||
{
|
||
if (_flags.owned)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(_contents.c), _contents.c);
|
||
}
|
||
_contents.c = 0;
|
||
}
|
||
[super dealloc];
|
||
}
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSCInlineString
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSCSubString
|
||
|
||
/*
|
||
* Assume that a copy should be a new string, never just a retained substring.
|
||
*/
|
||
- (id) copyWithZone: (NSZone*)z
|
||
{
|
||
GSCInlineString *o;
|
||
|
||
o = newCInline(_count, z);
|
||
memcpy(o->_contents.c, _contents.c, _count);
|
||
return (id)o;
|
||
}
|
||
|
||
- (void) dealloc
|
||
{
|
||
DESTROY(_parent);
|
||
[super dealloc];
|
||
}
|
||
|
||
- (NSString*) substringFromRange: (NSRange)aRange
|
||
{
|
||
id s;
|
||
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
s = createTinyString((char*)_contents.c + aRange.location, aRange.length);
|
||
if (nil == s)
|
||
{
|
||
aRange.location += (_contents.c - _parent->_contents.c);
|
||
s = substring_c((GSStr)_parent, aRange);
|
||
}
|
||
return s;
|
||
}
|
||
|
||
- (NSString*) substringWithRange: (NSRange)aRange
|
||
{
|
||
id s;
|
||
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
s = createTinyString((char*)_contents.c + aRange.location, aRange.length);
|
||
if (nil == s)
|
||
{
|
||
aRange.location += (_contents.c - _parent->_contents.c);
|
||
s = substring_c((GSStr)_parent, aRange);
|
||
}
|
||
return s;
|
||
}
|
||
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSUnicodeString
|
||
- (const char *) UTF8String
|
||
{
|
||
return UTF8String_u((GSStr)self);
|
||
}
|
||
|
||
- (BOOL) boolValue
|
||
{
|
||
return boolValue_u((GSStr)self);
|
||
}
|
||
|
||
- (BOOL) canBeConvertedToEncoding: (NSStringEncoding)enc
|
||
{
|
||
return canBeConvertedToEncoding_u((GSStr)self, enc);
|
||
}
|
||
|
||
- (unichar) characterAtIndex: (NSUInteger)index
|
||
{
|
||
return characterAtIndex_u((GSStr)self, index);
|
||
}
|
||
|
||
- (NSComparisonResult) compare: (NSString*)aString
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (aString == nil)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] nil string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
if (GSObjCIsInstance(aString) == NO)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] not a string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
return compare_u((GSStr)self, aString, mask, aRange);
|
||
}
|
||
|
||
- (const char *) cString
|
||
{
|
||
return cString_u((GSStr)self, externalEncoding);
|
||
}
|
||
|
||
- (const char *) cStringUsingEncoding: (NSStringEncoding)encoding
|
||
{
|
||
return cString_u((GSStr)self, encoding);
|
||
}
|
||
|
||
- (NSUInteger) cStringLength
|
||
{
|
||
return cStringLength_u((GSStr)self, externalEncoding);
|
||
}
|
||
|
||
- (NSData*) dataUsingEncoding: (NSStringEncoding)encoding
|
||
allowLossyConversion: (BOOL)flag
|
||
{
|
||
return dataUsingEncoding_u((GSStr)self, encoding, flag);
|
||
}
|
||
|
||
- (double) doubleValue
|
||
{
|
||
return doubleValue_u((GSStr)self);
|
||
}
|
||
|
||
- (void) encodeWithCoder: (NSCoder*)aCoder
|
||
{
|
||
if ([aCoder allowsKeyedCoding])
|
||
{
|
||
[(NSKeyedArchiver*)aCoder _encodePropertyList: self forKey: @"NS.string"];
|
||
return;
|
||
}
|
||
|
||
[aCoder encodeValueOfObjCType: @encode(unsigned) at: &_count];
|
||
if (_count > 0)
|
||
{
|
||
NSStringEncoding enc = NSUnicodeStringEncoding;
|
||
|
||
[aCoder encodeValueOfObjCType: @encode(int) at: &enc];
|
||
[aCoder encodeArrayOfObjCType: @encode(unichar)
|
||
count: _count
|
||
at: _contents.u];
|
||
}
|
||
}
|
||
|
||
- (NSStringEncoding) fastestEncoding
|
||
{
|
||
return NSUnicodeStringEncoding;
|
||
}
|
||
|
||
- (float) floatValue
|
||
{
|
||
return doubleValue_u((GSStr)self);
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer
|
||
{
|
||
getCharacters_u((GSStr)self, buffer, (NSRange){0, _count});
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
getCharacters_u((GSStr)self, buffer, aRange);
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
{
|
||
getCString_u((GSStr)self, buffer, NSMaximumStringLength,
|
||
(NSRange){0, _count}, 0);
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
{
|
||
getCString_u((GSStr)self, buffer, maxLength, (NSRange){0, _count}, 0);
|
||
}
|
||
|
||
- (BOOL) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
return getCStringE_u((GSStr)self, buffer, maxLength, encoding);
|
||
}
|
||
- (void) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
range: (NSRange)aRange
|
||
remainingRange: (NSRange*)leftoverRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
|
||
getCString_u((GSStr)self, buffer, maxLength, aRange, leftoverRange);
|
||
}
|
||
|
||
- (int) intValue
|
||
{
|
||
char buf[24];
|
||
|
||
intBuf_u((GSStr)self, buf);
|
||
return strtol(buf, 0, 10);
|
||
}
|
||
|
||
- (NSInteger) integerValue
|
||
{
|
||
char buf[24];
|
||
|
||
intBuf_u((GSStr)self, buf);
|
||
#if GS_SIZEOF_VOIDP == GS_SIZEOF_LONG
|
||
return strtol(buf, 0, 10);
|
||
#else
|
||
return strtoll(buf, 0, 10);
|
||
#endif
|
||
}
|
||
|
||
- (BOOL) isEqual: (id)anObject
|
||
{
|
||
return isEqual_u((GSStr)self, anObject);
|
||
}
|
||
|
||
- (BOOL) isEqualToString: (NSString*)anObject
|
||
{
|
||
return isEqual_u((GSStr)self, anObject);
|
||
}
|
||
|
||
- (NSUInteger) length
|
||
{
|
||
return _count;
|
||
}
|
||
|
||
- (NSUInteger) lengthOfBytesUsingEncoding: (NSStringEncoding)encoding
|
||
{
|
||
return cStringLength_u((GSStr)self, encoding);
|
||
}
|
||
|
||
- (long long) longLongValue
|
||
{
|
||
char buf[24];
|
||
|
||
intBuf_u((GSStr)self, buf);
|
||
return strtoll(buf, 0, 10);
|
||
}
|
||
|
||
- (const char*) lossyCString
|
||
{
|
||
return lossyCString_u((GSStr)self);
|
||
}
|
||
|
||
- (id) lowercaseString
|
||
{
|
||
GSUInlineString *o;
|
||
unsigned i;
|
||
|
||
o = [newUInline(_count, [self zone]) autorelease];
|
||
i = _count;
|
||
while (i-- > 0)
|
||
{
|
||
o->_contents.u[i] = uni_tolower(_contents.u[i]);
|
||
}
|
||
return o;
|
||
}
|
||
|
||
- (id) mutableCopy
|
||
{
|
||
GSMutableString *obj;
|
||
|
||
obj = (GSMutableString*)NSAllocateObject(GSMutableStringClass, 0,
|
||
NSDefaultMallocZone());
|
||
obj = [obj initWithBytes: (const void*)_contents.u
|
||
length: _count * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding];
|
||
return obj;
|
||
}
|
||
|
||
- (id) mutableCopyWithZone: (NSZone*)z
|
||
{
|
||
GSMutableString *obj;
|
||
|
||
obj = (GSMutableString*)NSAllocateObject(GSMutableStringClass, 0, z);
|
||
obj = [obj initWithBytes: (const void*)_contents.u
|
||
length: _count * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding];
|
||
return obj;
|
||
}
|
||
|
||
- (NSRange) rangeOfComposedCharacterSequenceAtIndex: (NSUInteger)anIndex
|
||
{
|
||
return rangeOfSequence_u((GSStr)self, anIndex);
|
||
}
|
||
|
||
- (NSRange) rangeOfCharacterFromSet: (NSCharacterSet*)aSet
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
return rangeOfCharacter_u((GSStr)self, aSet, mask, aRange);
|
||
}
|
||
|
||
/*
|
||
- (NSRange) rangeOfString: (NSString*)aString
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (aString == nil)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] nil string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
if (GSObjCIsInstance(aString) == NO)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] not a string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
if ((mask & NSRegularExpressionSearch) == NSRegularExpressionSearch)
|
||
{
|
||
return [super rangeOfString: aString options: mask range: aRange];
|
||
}
|
||
return rangeOfString_u((GSStr)self, aString, mask, aRange);
|
||
}
|
||
*/
|
||
|
||
- (NSStringEncoding) smallestEncoding
|
||
{
|
||
return NSUnicodeStringEncoding;
|
||
}
|
||
|
||
- (NSString*) substringFromRange: (NSRange)aRange
|
||
{
|
||
if (!_flags.wide)
|
||
{
|
||
id tinyString;
|
||
|
||
tinyString = createTinyString((char*)_contents.c + aRange.location,
|
||
aRange.length);
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
}
|
||
if (_flags.owned)
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
return substring_u((GSStr)self, aRange);
|
||
}
|
||
return [super substringWithRange: aRange];
|
||
}
|
||
|
||
- (NSString*) substringWithRange: (NSRange)aRange
|
||
{
|
||
if (!_flags.wide)
|
||
{
|
||
id tinyString;
|
||
|
||
tinyString = createTinyString((char*)_contents.c + aRange.location,
|
||
aRange.length);
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
}
|
||
if (_flags.owned)
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
return substring_u((GSStr)self, aRange);
|
||
}
|
||
return [super substringWithRange: aRange];
|
||
}
|
||
|
||
- (id) uppercaseString
|
||
{
|
||
GSUInlineString *o;
|
||
unsigned i;
|
||
|
||
o = [newUInline(_count, [self zone]) autorelease];
|
||
i = _count;
|
||
while (i-- > 0)
|
||
{
|
||
o->_contents.u[i] = uni_toupper(_contents.u[i]);
|
||
}
|
||
return o;
|
||
}
|
||
|
||
// private method for Unicode level 3 implementation
|
||
- (int) _baseLength
|
||
{
|
||
unsigned int count = 0;
|
||
unsigned int blen = 0;
|
||
|
||
while (count < _count)
|
||
if (!uni_isnonsp(_contents.u[count++]))
|
||
blen++;
|
||
return blen;
|
||
}
|
||
|
||
/*
|
||
Default -copy implementation. Retain if we own the buffer and the zones
|
||
agree, create a new GSUInlineString otherwise.
|
||
*/
|
||
- (id) copyWithZone: (NSZone*)z
|
||
{
|
||
if (!_flags.owned || NSShouldRetainWithZone(self, z) == NO)
|
||
{
|
||
GSUInlineString *o;
|
||
|
||
o = newUInline(_count, z);
|
||
memcpy(o->_contents.u, _contents.u, _count * sizeof(unichar));
|
||
return o;
|
||
}
|
||
else
|
||
{
|
||
return RETAIN(self);
|
||
}
|
||
}
|
||
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSUnicodeBufferString
|
||
- (void) dealloc
|
||
{
|
||
if (_contents.u != 0)
|
||
{
|
||
if (_flags.owned)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(_contents.u), _contents.u);
|
||
}
|
||
_contents.u = 0;
|
||
}
|
||
[super dealloc];
|
||
}
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSUInlineString
|
||
@end
|
||
|
||
|
||
|
||
@implementation GSUnicodeSubString
|
||
|
||
/*
|
||
* Assume that a copy should be a new string, never just a retained substring.
|
||
*/
|
||
- (id) copyWithZone: (NSZone*)z
|
||
{
|
||
GSUInlineString *o;
|
||
|
||
o = newUInline(_count, z);
|
||
memcpy(o->_contents.u, _contents.u, _count * sizeof(unichar));
|
||
return o;
|
||
}
|
||
|
||
- (void) dealloc
|
||
{
|
||
DESTROY(_parent);
|
||
[super dealloc];
|
||
}
|
||
|
||
- (NSString*) substringFromRange: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
aRange.location += (_contents.u - _parent->_contents.u);
|
||
return substring_u((GSStr)_parent, aRange);
|
||
}
|
||
|
||
- (NSString*) substringWithRange: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
aRange.location += (_contents.u - _parent->_contents.u);
|
||
return substring_u((GSStr)_parent, aRange);
|
||
}
|
||
|
||
@end
|
||
|
||
|
||
|
||
/*
|
||
* The GSMutableString class shares a common initial ivar layout with
|
||
* the GSString class, but adds a few of its own. It uses _flags.wide
|
||
* to determine whether it should use 8-bit or 16-bit characters and
|
||
* is capable of changing that flag (and its underlying storage) to
|
||
* move from an 8-bit to a 16-bit representation is that should be
|
||
* necessary because wide characters have been placed in the string.
|
||
*/
|
||
@implementation GSMutableString
|
||
|
||
+ (void) initialize
|
||
{
|
||
setup(NO);
|
||
GSObjCAddClassBehavior(self, [GSString class]);
|
||
}
|
||
|
||
- (void) appendFormat: (NSString*)format, ...
|
||
{
|
||
va_list ap;
|
||
unichar buf[1024];
|
||
unichar *fmt = buf;
|
||
size_t len;
|
||
|
||
va_start(ap, format);
|
||
|
||
/*
|
||
* Make sure we have the format string in a nul terminated array of
|
||
* unichars for passing to GSPrivateFormat. Use on-stack memory for
|
||
* performance unless the size of the format string is really big
|
||
* (a rare occurrence).
|
||
*/
|
||
len = [format length];
|
||
if (len >= 1024)
|
||
{
|
||
fmt = NSZoneMalloc(NSDefaultMallocZone(), (len+1)*sizeof(unichar));
|
||
}
|
||
[format getCharacters: fmt];
|
||
fmt[len] = '\0';
|
||
|
||
/*
|
||
* If no zone is set, make sure we have one so any memory mangement
|
||
* (buffer growth) is done with the correct zone.
|
||
*/
|
||
if (_zone == 0)
|
||
{
|
||
#if GS_WITH_GC
|
||
_zone = GSAtomicMallocZone();
|
||
#else
|
||
_zone = [self zone];
|
||
#endif
|
||
}
|
||
GSPrivateFormat((GSStr)self, fmt, ap, nil);
|
||
_flags.hash = 0; // Invalidate the hash for this string.
|
||
if (fmt != buf)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), fmt);
|
||
}
|
||
va_end(ap);
|
||
}
|
||
|
||
- (BOOL) boolValue
|
||
{
|
||
if (_flags.wide == 1)
|
||
return boolValue_u((GSStr)self);
|
||
else
|
||
return boolValue_c((GSStr)self);
|
||
}
|
||
|
||
- (BOOL) canBeConvertedToEncoding: (NSStringEncoding)enc
|
||
{
|
||
if (_flags.wide == 1)
|
||
return canBeConvertedToEncoding_u((GSStr)self, enc);
|
||
else
|
||
return canBeConvertedToEncoding_c((GSStr)self, enc);
|
||
}
|
||
|
||
- (unichar) characterAtIndex: (NSUInteger)index
|
||
{
|
||
if (_flags.wide == 1)
|
||
return characterAtIndex_u((GSStr)self, index);
|
||
else
|
||
return characterAtIndex_c((GSStr)self, index);
|
||
}
|
||
|
||
- (NSComparisonResult) compare: (NSString*)aString
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (aString == nil)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] nil string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
if (GSObjCIsInstance(aString) == NO)
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"[%@ -%@] not a string argument",
|
||
NSStringFromClass([self class]), NSStringFromSelector(_cmd)];
|
||
if (_flags.wide == 1)
|
||
return compare_u((GSStr)self, aString, mask, aRange);
|
||
else
|
||
return compare_c((GSStr)self, aString, mask, aRange);
|
||
}
|
||
|
||
- (id) copyWithZone: (NSZone*)z
|
||
{
|
||
if (_flags.wide == 1)
|
||
{
|
||
GSUInlineString *o;
|
||
|
||
o = newUInline(_count, z);
|
||
memcpy(o->_contents.u, _contents.u, _count * sizeof(unichar));
|
||
return o;
|
||
}
|
||
else
|
||
{
|
||
GSCInlineString *o;
|
||
|
||
o = newCInline(_count, z);
|
||
memcpy(o->_contents.c, _contents.c, _count);
|
||
return o;
|
||
}
|
||
}
|
||
|
||
- (const char *) cString
|
||
{
|
||
if (_flags.wide == 1)
|
||
return cString_u((GSStr)self, externalEncoding);
|
||
else
|
||
return cString_c((GSStr)self, externalEncoding);
|
||
}
|
||
|
||
- (const char *) cStringUsingEncoding: (NSStringEncoding)encoding
|
||
{
|
||
if (_flags.wide == 1)
|
||
return cString_u((GSStr)self, encoding);
|
||
else
|
||
return cString_c((GSStr)self, encoding);
|
||
}
|
||
|
||
- (NSUInteger) cStringLength
|
||
{
|
||
if (_flags.wide == 1)
|
||
return cStringLength_u((GSStr)self, externalEncoding);
|
||
else
|
||
return cStringLength_c((GSStr)self, externalEncoding);
|
||
}
|
||
|
||
- (NSData*) dataUsingEncoding: (NSStringEncoding)encoding
|
||
allowLossyConversion: (BOOL)flag
|
||
{
|
||
if (_flags.wide == 1)
|
||
return dataUsingEncoding_u((GSStr)self, encoding, flag);
|
||
else
|
||
return dataUsingEncoding_c((GSStr)self, encoding, flag);
|
||
}
|
||
|
||
- (void) dealloc
|
||
{
|
||
if (_contents.c != 0)
|
||
{
|
||
NSAssert(_flags.owned == 1 && _zone != 0, NSInternalInconsistencyException);
|
||
NSZoneFree(self->_zone, self->_contents.c);
|
||
self->_contents.c = 0;
|
||
self->_zone = 0;
|
||
}
|
||
[super dealloc];
|
||
}
|
||
|
||
- (void) deleteCharactersInRange: (NSRange)range
|
||
{
|
||
GS_RANGE_CHECK(range, _count);
|
||
if (range.length > 0)
|
||
{
|
||
fillHole((GSStr)self, range.location, range.length);
|
||
}
|
||
}
|
||
|
||
- (double) doubleValue
|
||
{
|
||
if (_flags.wide == 1)
|
||
return doubleValue_u((GSStr)self);
|
||
else
|
||
return doubleValue_c((GSStr)self);
|
||
}
|
||
|
||
- (void) encodeWithCoder: (NSCoder*)aCoder
|
||
{
|
||
if ([aCoder allowsKeyedCoding])
|
||
{
|
||
[(NSKeyedArchiver*)aCoder _encodePropertyList: self forKey: @"NS.string"];
|
||
return;
|
||
}
|
||
|
||
[aCoder encodeValueOfObjCType: @encode(unsigned) at: &_count];
|
||
if (_count > 0)
|
||
{
|
||
if (_flags.wide == 1)
|
||
{
|
||
NSStringEncoding enc = NSUnicodeStringEncoding;
|
||
|
||
[aCoder encodeValueOfObjCType: @encode(int) at: &enc];
|
||
[aCoder encodeArrayOfObjCType: @encode(unichar)
|
||
count: _count
|
||
at: _contents.u];
|
||
}
|
||
else
|
||
{
|
||
[aCoder encodeValueOfObjCType: @encode(int)
|
||
at: &internalEncoding];
|
||
[aCoder encodeArrayOfObjCType: @encode(unsigned char)
|
||
count: _count
|
||
at: _contents.c];
|
||
}
|
||
}
|
||
}
|
||
|
||
- (NSStringEncoding) fastestEncoding
|
||
{
|
||
if (_flags.wide == 1)
|
||
return NSUnicodeStringEncoding;
|
||
else
|
||
return internalEncoding;
|
||
}
|
||
|
||
- (float) floatValue
|
||
{
|
||
if (_flags.wide == 1)
|
||
return doubleValue_u((GSStr)self);
|
||
else
|
||
return doubleValue_c((GSStr)self);
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer
|
||
{
|
||
if (_flags.wide == 1)
|
||
getCharacters_u((GSStr)self, buffer, (NSRange){0, _count});
|
||
else
|
||
getCharacters_c((GSStr)self, buffer, (NSRange){0, _count});
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (_flags.wide == 1)
|
||
{
|
||
getCharacters_u((GSStr)self, buffer, aRange);
|
||
}
|
||
else
|
||
{
|
||
getCharacters_c((GSStr)self, buffer, aRange);
|
||
}
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
{
|
||
if (_flags.wide == 1)
|
||
getCString_u((GSStr)self, buffer, NSMaximumStringLength,
|
||
(NSRange){0, _count}, 0);
|
||
else
|
||
getCString_c((GSStr)self, buffer, NSMaximumStringLength,
|
||
(NSRange){0, _count}, 0);
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
{
|
||
if (_flags.wide == 1)
|
||
getCString_u((GSStr)self, buffer, maxLength, (NSRange){0, _count}, 0);
|
||
else
|
||
getCString_c((GSStr)self, buffer, maxLength, (NSRange){0, _count}, 0);
|
||
}
|
||
|
||
- (BOOL) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
if (_flags.wide == 1)
|
||
return getCStringE_u((GSStr)self, buffer, maxLength, encoding);
|
||
else
|
||
return getCStringE_c((GSStr)self, buffer, maxLength, encoding);
|
||
}
|
||
|
||
- (void) getCString: (char*)buffer
|
||
maxLength: (NSUInteger)maxLength
|
||
range: (NSRange)aRange
|
||
remainingRange: (NSRange*)leftoverRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (_flags.wide == 1)
|
||
{
|
||
getCString_u((GSStr)self, buffer, maxLength, aRange, leftoverRange);
|
||
}
|
||
else
|
||
{
|
||
getCString_c((GSStr)self, buffer, maxLength, aRange, leftoverRange);
|
||
}
|
||
}
|
||
|
||
- (id) init
|
||
{
|
||
return [self initWithCapacity: 0];
|
||
}
|
||
|
||
- (id) initWithBytes: (const void*)bytes
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
unsigned char *chars = 0;
|
||
BOOL isASCII = NO;
|
||
BOOL isLatin1 = NO;
|
||
BOOL shouldFree = NO;
|
||
|
||
_flags.owned = YES;
|
||
#if GS_WITH_GC
|
||
_zone = GSAtomicMallocZone();
|
||
#else
|
||
_zone = [self zone];
|
||
#endif
|
||
|
||
if (length > 0)
|
||
{
|
||
fixBOM((unsigned char**)&bytes, &length, &shouldFree, encoding);
|
||
chars = (unsigned char*)bytes;
|
||
}
|
||
if (0 == length)
|
||
{
|
||
return [self initWithCapacity: 0];
|
||
}
|
||
if (0 == chars)
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"-initWithBytes:lenth:encoding given nul bytes"];
|
||
}
|
||
|
||
if (encoding == NSUTF8StringEncoding)
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < length; i++)
|
||
{
|
||
if (chars[i] > 127)
|
||
{
|
||
break;
|
||
}
|
||
}
|
||
if (i == length)
|
||
{
|
||
/*
|
||
* This is actually ASCII data ... so we can just store it as if
|
||
* in the internal 8bit encoding scheme.
|
||
*/
|
||
encoding = internalEncoding;
|
||
}
|
||
}
|
||
else if (encoding != internalEncoding && isByteEncoding(encoding) == YES)
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < length; i++)
|
||
{
|
||
if (((unsigned char*)chars)[i] > 127)
|
||
{
|
||
if (encoding == NSASCIIStringEncoding)
|
||
{
|
||
DESTROY(self);
|
||
if (shouldFree == YES)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars), chars);
|
||
}
|
||
return nil; // Invalid data
|
||
}
|
||
break;
|
||
}
|
||
}
|
||
if (i == length)
|
||
{
|
||
/*
|
||
* This is actually ASCII data ... so we can just store it as if
|
||
* in the internal 8bit encoding scheme.
|
||
*/
|
||
encoding = internalEncoding;
|
||
}
|
||
}
|
||
|
||
if (encoding == internalEncoding)
|
||
{
|
||
if (0 != chars)
|
||
{
|
||
if (shouldFree == YES)
|
||
{
|
||
_zone = NSZoneFromPointer(chars);
|
||
_contents.c = chars;
|
||
}
|
||
else
|
||
{
|
||
_contents.c = NSZoneMalloc(_zone, length);
|
||
memcpy(_contents.c, chars, length);
|
||
}
|
||
}
|
||
_count = length;
|
||
_flags.wide = 0;
|
||
return self;
|
||
}
|
||
|
||
/*
|
||
* Any remaining encoding needs to be converted to UTF-16.
|
||
*/
|
||
if (encoding != NSUnicodeStringEncoding)
|
||
{
|
||
unichar *u = 0;
|
||
unsigned l = 0;
|
||
|
||
if (GSToUnicode(&u, &l, (unsigned char*)chars, length, encoding,
|
||
_zone, 0) == NO)
|
||
{
|
||
DESTROY(self);
|
||
if (shouldFree == YES)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars), chars);
|
||
}
|
||
return nil; // Invalid data
|
||
}
|
||
chars = (unsigned char*)u;
|
||
length = l * sizeof(unichar);
|
||
shouldFree = YES;
|
||
}
|
||
|
||
length /= sizeof(unichar);
|
||
if (GSUnicode((unichar*)(void*)chars, length, &isASCII, &isLatin1) != length)
|
||
{
|
||
if (shouldFree == YES && chars != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars), chars);
|
||
}
|
||
return nil; // Invalid data
|
||
}
|
||
|
||
if (isASCII == YES
|
||
|| (internalEncoding == NSISOLatin1StringEncoding && isLatin1 == YES))
|
||
{
|
||
_contents.c = NSZoneMalloc(_zone, length);
|
||
_count = length;
|
||
_flags.wide = 0;
|
||
while (length-- > 0)
|
||
{
|
||
_contents.c[length] = ((unichar*)(void*)chars)[length];
|
||
}
|
||
if (shouldFree == YES && chars != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(chars), chars);
|
||
}
|
||
return self;
|
||
}
|
||
else
|
||
{
|
||
if (shouldFree == YES)
|
||
{
|
||
_zone = NSZoneFromPointer(chars);
|
||
_contents.u = (unichar*)(void*)chars;
|
||
}
|
||
else
|
||
{
|
||
_contents.u = NSZoneMalloc(_zone, length * sizeof(unichar));
|
||
memcpy(_contents.u, chars, length * sizeof(unichar));
|
||
}
|
||
_count = length;
|
||
_flags.wide = 1;
|
||
return self;
|
||
}
|
||
}
|
||
|
||
- (id) initWithBytesNoCopy: (void*)bytes
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
self = [self initWithBytes: bytes
|
||
length: length
|
||
encoding: encoding];
|
||
if (flag == YES && bytes != 0)
|
||
{
|
||
NSZoneFree(NSZoneFromPointer(bytes), bytes);
|
||
}
|
||
return self;
|
||
}
|
||
|
||
- (id) initWithCapacity: (NSUInteger)capacity
|
||
{
|
||
if (capacity < 2)
|
||
{
|
||
capacity = 2;
|
||
}
|
||
_count = 0;
|
||
_capacity = capacity;
|
||
#if GS_WITH_GC
|
||
_zone = GSAtomicMallocZone();
|
||
#else
|
||
_zone = [self zone];
|
||
#endif
|
||
_contents.c = NSZoneMalloc(_zone, capacity + 1);
|
||
_flags.wide = 0;
|
||
_flags.owned = 1;
|
||
return self;
|
||
}
|
||
|
||
- (id) initWithCharactersNoCopy: (unichar*)chars
|
||
length: (NSUInteger)length
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
return [self initWithBytesNoCopy: (void*)chars
|
||
length: length*sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding
|
||
freeWhenDone: flag];
|
||
}
|
||
|
||
- (id) initWithCStringNoCopy: (char*)chars
|
||
length: (NSUInteger)length
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
return [self initWithBytesNoCopy: (void*)chars
|
||
length: length
|
||
encoding: externalEncoding
|
||
freeWhenDone: flag];
|
||
}
|
||
|
||
- (id) initWithFormat: (NSString*)format
|
||
locale: (NSDictionary*)locale
|
||
arguments: (va_list)argList
|
||
{
|
||
unichar fbuf[1024];
|
||
unichar *fmt = fbuf;
|
||
size_t len;
|
||
|
||
/*
|
||
* First we provide an array of unichar characters containing the
|
||
* format string. For performance reasons we try to use an on-stack
|
||
* buffer if the format string is small enough ... it almost always
|
||
* will be.
|
||
*/
|
||
len = [format length];
|
||
if (len >= 1024)
|
||
{
|
||
fmt = NSZoneMalloc(NSDefaultMallocZone(), (len+1)*sizeof(unichar));
|
||
}
|
||
[format getCharacters: fmt];
|
||
fmt[len] = '\0';
|
||
|
||
GSPrivateFormat((GSStr)self, fmt, argList, locale);
|
||
if (fmt != fbuf)
|
||
{
|
||
NSZoneFree(NSDefaultMallocZone(), fmt);
|
||
}
|
||
return self;
|
||
}
|
||
|
||
- (int) intValue
|
||
{
|
||
char buf[24];
|
||
|
||
if (_flags.wide == 1)
|
||
intBuf_u((GSStr)self, buf);
|
||
else
|
||
intBuf_c((GSStr)self, buf);
|
||
return strtol(buf, 0, 10);
|
||
}
|
||
|
||
- (NSInteger) integerValue
|
||
{
|
||
char buf[24];
|
||
|
||
if (_flags.wide == 1)
|
||
intBuf_u((GSStr)self, buf);
|
||
else
|
||
intBuf_c((GSStr)self, buf);
|
||
#if GS_SIZEOF_VOIDP == GS_SIZEOF_LONG
|
||
return strtol(buf, 0, 10);
|
||
#else
|
||
return strtoll(buf, 0, 10);
|
||
#endif
|
||
}
|
||
|
||
- (BOOL) isEqual: (id)anObject
|
||
{
|
||
if (_flags.wide == 1)
|
||
return isEqual_u((GSStr)self, anObject);
|
||
else
|
||
return isEqual_c((GSStr)self, anObject);
|
||
}
|
||
|
||
- (BOOL) isEqualToString: (NSString*)anObject
|
||
{
|
||
if (_flags.wide == 1)
|
||
return isEqual_u((GSStr)self, anObject);
|
||
else
|
||
return isEqual_c((GSStr)self, anObject);
|
||
}
|
||
|
||
- (NSUInteger) length
|
||
{
|
||
return _count;
|
||
}
|
||
|
||
- (NSUInteger) lengthOfBytesUsingEncoding: (NSStringEncoding)encoding
|
||
{
|
||
if (_flags.wide == 1)
|
||
return cStringLength_u((GSStr)self, encoding);
|
||
else
|
||
return cStringLength_c((GSStr)self, encoding);
|
||
}
|
||
|
||
- (long long) longLongValue
|
||
{
|
||
char buf[24];
|
||
|
||
if (_flags.wide == 1)
|
||
intBuf_u((GSStr)self, buf);
|
||
else
|
||
intBuf_c((GSStr)self, buf);
|
||
return strtoll(buf, 0, 10);
|
||
}
|
||
|
||
- (const char*) lossyCString
|
||
{
|
||
if (_flags.wide == 1)
|
||
return lossyCString_u((GSStr)self);
|
||
else
|
||
return lossyCString_c((GSStr)self);
|
||
}
|
||
|
||
- (id) lowercaseString
|
||
{
|
||
if (_flags.wide == 1)
|
||
{
|
||
GSUInlineString *o;
|
||
unsigned i;
|
||
|
||
o = newUInline(_count, [self zone]);
|
||
i = _count;
|
||
while (i-- > 0)
|
||
{
|
||
o->_contents.u[i] = uni_tolower(_contents.u[i]);
|
||
}
|
||
return [o autorelease];
|
||
}
|
||
return [super lowercaseString];
|
||
}
|
||
|
||
- (id) makeImmutableCopyOnFail: (BOOL)force
|
||
{
|
||
NSAssert(_flags.owned == 1 && _zone != 0, NSInternalInconsistencyException);
|
||
if (_flags.wide == 1)
|
||
{
|
||
GSClassSwizzle(self, [GSUnicodeBufferString class]);
|
||
}
|
||
else
|
||
{
|
||
GSClassSwizzle(self, [GSCBufferString class]);
|
||
}
|
||
return self;
|
||
}
|
||
|
||
- (id) mutableCopy
|
||
{
|
||
GSMutableString *obj;
|
||
|
||
obj = (GSMutableString*)NSAllocateObject(GSMutableStringClass, 0,
|
||
NSDefaultMallocZone());
|
||
|
||
if (_flags.wide == 1)
|
||
obj = [obj initWithBytes: (void*)_contents.u
|
||
length: _count * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding];
|
||
else
|
||
obj = [obj initWithBytes: (void*)_contents.c
|
||
length: _count
|
||
encoding: internalEncoding];
|
||
return obj;
|
||
}
|
||
|
||
- (id) mutableCopyWithZone: (NSZone*)z
|
||
{
|
||
GSMutableString *obj;
|
||
|
||
obj = (GSMutableString*)NSAllocateObject(GSMutableStringClass, 0, z);
|
||
|
||
if (_flags.wide == 1)
|
||
obj = [obj initWithBytes: (void*)_contents.u
|
||
length: _count * sizeof(unichar)
|
||
encoding: NSUnicodeStringEncoding];
|
||
else
|
||
obj = [obj initWithBytes: (char*)_contents.c
|
||
length: _count
|
||
encoding: internalEncoding];
|
||
return obj;
|
||
}
|
||
|
||
- (NSRange) rangeOfComposedCharacterSequenceAtIndex: (NSUInteger)anIndex
|
||
{
|
||
if (_flags.wide == 1)
|
||
return rangeOfSequence_u((GSStr)self, anIndex);
|
||
else
|
||
return rangeOfSequence_c((GSStr)self, anIndex);
|
||
}
|
||
|
||
- (NSRange) rangeOfCharacterFromSet: (NSCharacterSet*)aSet
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (_flags.wide == 1)
|
||
return rangeOfCharacter_u((GSStr)self, aSet, mask, aRange);
|
||
else
|
||
return rangeOfCharacter_c((GSStr)self, aSet, mask, aRange);
|
||
}
|
||
|
||
- (void) replaceCharactersInRange: (NSRange)aRange
|
||
withString: (NSString*)aString
|
||
{
|
||
GSStr other = 0;
|
||
int offset;
|
||
unsigned length = 0;
|
||
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
if (aString != nil)
|
||
{
|
||
if (GSObjCIsInstance(aString) == NO)
|
||
{
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"replace characters with non-string"];
|
||
}
|
||
else
|
||
{
|
||
length = (aString == nil) ? 0 : [aString length];
|
||
}
|
||
}
|
||
offset = length - aRange.length;
|
||
|
||
/*
|
||
* We must change into a unicode string (if necessary) *before*
|
||
* adjusting length and capacity, so that the transmute doesn't
|
||
* mess up due to any hole in the string etc.
|
||
*/
|
||
if (length > 0)
|
||
{
|
||
other = transmute((GSStr)self, aString);
|
||
}
|
||
|
||
if (offset < 0)
|
||
{
|
||
fillHole((GSStr)self, NSMaxRange(aRange) + offset, -offset);
|
||
}
|
||
else if (offset > 0)
|
||
{
|
||
makeHole((GSStr)self, NSMaxRange(aRange), (NSUInteger)offset);
|
||
}
|
||
|
||
if (length > 0)
|
||
{
|
||
if (_flags.wide == 1)
|
||
{
|
||
if (other == 0)
|
||
{
|
||
/*
|
||
* Not a cString class - use standard method to get characters.
|
||
*/
|
||
[aString getCharacters: &_contents.u[aRange.location]];
|
||
}
|
||
else
|
||
{
|
||
memcpy(&_contents.u[aRange.location], other->_contents.u,
|
||
length * sizeof(unichar));
|
||
}
|
||
}
|
||
else
|
||
{
|
||
if (other == 0)
|
||
{
|
||
/*
|
||
* Since getCString appends a '\0' terminator, we must handle
|
||
* that problem in copying data into our buffer. Either by
|
||
* saving and restoring the character which would be
|
||
* overwritten by the nul, or by getting a character less,
|
||
* and fetching the last character separately.
|
||
*/
|
||
if (aRange.location + length < _count)
|
||
{
|
||
unsigned char tmp = _contents.c[aRange.location + length];
|
||
|
||
[aString getCString: (char*)&_contents.c[aRange.location]
|
||
maxLength: length+1
|
||
encoding: internalEncoding];
|
||
_contents.c[aRange.location + length] = tmp;
|
||
}
|
||
else
|
||
{
|
||
unsigned int l = length - 1;
|
||
unsigned int size = 1;
|
||
unichar u;
|
||
unsigned char *dst = &_contents.c[aRange.location + l];
|
||
|
||
if (l > 0)
|
||
{
|
||
[aString getCString: (char*)&_contents.c[aRange.location]
|
||
maxLength: l+1
|
||
encoding: internalEncoding];
|
||
}
|
||
u = [aString characterAtIndex: l];
|
||
GSFromUnicode(&dst, &size, &u, 1,
|
||
internalEncoding, 0, GSUniStrict);
|
||
}
|
||
}
|
||
else
|
||
{
|
||
/*
|
||
* Simply copy cString data from other string into self.
|
||
*/
|
||
memcpy(&_contents.c[aRange.location], other->_contents.c, length);
|
||
}
|
||
}
|
||
_flags.hash = 0;
|
||
}
|
||
}
|
||
|
||
- (void) setString: (NSString*)aString
|
||
{
|
||
unsigned int len = (aString == nil) ? 0 : [aString length];
|
||
GSStr other;
|
||
|
||
if (len == 0)
|
||
{
|
||
_count = 0;
|
||
return;
|
||
}
|
||
other = transmute((GSStr)self, aString);
|
||
if (_count < len)
|
||
{
|
||
makeHole((GSStr)self, _count, (NSUInteger)(len - _count));
|
||
}
|
||
else
|
||
{
|
||
_count = len;
|
||
_flags.hash = 0;
|
||
}
|
||
|
||
if (_flags.wide == 1)
|
||
{
|
||
if (other == 0)
|
||
{
|
||
[aString getCharacters: _contents.u];
|
||
}
|
||
else
|
||
{
|
||
memcpy(_contents.u, other->_contents.u, len * sizeof(unichar));
|
||
}
|
||
}
|
||
else
|
||
{
|
||
if (other == 0)
|
||
{
|
||
unsigned l;
|
||
unsigned s = 1;
|
||
unichar u;
|
||
unsigned char *d;
|
||
|
||
/*
|
||
* Since getCString appends a '\0' terminator, we must ask for
|
||
* one character less than we actually want, then get the last
|
||
* character separately.
|
||
*/
|
||
l = len - 1;
|
||
if (l > 0)
|
||
{
|
||
[aString getCString: (char*)_contents.c
|
||
maxLength: l+1
|
||
encoding: internalEncoding];
|
||
}
|
||
u = [aString characterAtIndex: l];
|
||
d = _contents.c + l;
|
||
GSFromUnicode(&d, &s, &u, 1, internalEncoding, 0, GSUniStrict);
|
||
}
|
||
else
|
||
{
|
||
memcpy(_contents.c, other->_contents.c, len);
|
||
}
|
||
}
|
||
}
|
||
|
||
- (NSStringEncoding) smallestEncoding
|
||
{
|
||
if (_flags.wide == 1)
|
||
{
|
||
return NSUnicodeStringEncoding;
|
||
}
|
||
else
|
||
{
|
||
return internalEncoding;
|
||
}
|
||
}
|
||
|
||
- (NSString*) substringFromRange: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
|
||
if (aRange.length == 0)
|
||
{
|
||
return @"";
|
||
}
|
||
if (_flags.wide == 1)
|
||
{
|
||
GSUInlineString *o;
|
||
|
||
o = [newUInline(aRange.length, [self zone]) autorelease];
|
||
memcpy(o->_contents.u, _contents.u + aRange.location,
|
||
aRange.length * sizeof(unichar));
|
||
return o;
|
||
}
|
||
else
|
||
{
|
||
id tinyString;
|
||
|
||
tinyString = createTinyString((char*)_contents.c + aRange.location,
|
||
aRange.length);
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
else
|
||
{
|
||
GSCInlineString *o;
|
||
|
||
o = [newCInline(aRange.length, [self zone]) autorelease];
|
||
memcpy(o->_contents.c, _contents.c + aRange.location, aRange.length);
|
||
return o;
|
||
}
|
||
}
|
||
}
|
||
|
||
- (NSString*) substringWithRange: (NSRange)aRange
|
||
{
|
||
GS_RANGE_CHECK(aRange, _count);
|
||
|
||
if (aRange.length == 0)
|
||
{
|
||
return @"";
|
||
}
|
||
if (_flags.wide == 1)
|
||
{
|
||
GSUInlineString *o;
|
||
|
||
o = [newUInline(aRange.length, [self zone]) autorelease];
|
||
memcpy(o->_contents.u, _contents.u + aRange.location,
|
||
aRange.length * sizeof(unichar));
|
||
return o;
|
||
}
|
||
else
|
||
{
|
||
id tinyString;
|
||
|
||
tinyString = createTinyString((char*)_contents.c + aRange.location,
|
||
aRange.length);
|
||
if (tinyString)
|
||
{
|
||
return tinyString;
|
||
}
|
||
else
|
||
{
|
||
GSCInlineString *o;
|
||
|
||
o = [newCInline(aRange.length, [self zone]) autorelease];
|
||
memcpy(o->_contents.c, _contents.c + aRange.location, aRange.length);
|
||
return o;
|
||
}
|
||
}
|
||
}
|
||
|
||
- (id) uppercaseString
|
||
{
|
||
if (_flags.wide == 1)
|
||
{
|
||
GSUInlineString *o;
|
||
unsigned i;
|
||
|
||
o = [newUInline(_count, [self zone]) autorelease];
|
||
i = _count;
|
||
while (i-- > 0)
|
||
{
|
||
o->_contents.u[i] = uni_toupper(_contents.u[i]);
|
||
}
|
||
return o;
|
||
}
|
||
return [super uppercaseString];
|
||
}
|
||
|
||
- (const char *) UTF8String
|
||
{
|
||
if (_flags.wide == 1)
|
||
return UTF8String_u((GSStr)self);
|
||
return UTF8String_c((GSStr)self);
|
||
}
|
||
|
||
// private method for Unicode level 3 implementation
|
||
- (int) _baseLength
|
||
{
|
||
if (_flags.wide == 1)
|
||
{
|
||
unsigned int count = 0;
|
||
unsigned int blen = 0;
|
||
|
||
while (count < _count)
|
||
if (!uni_isnonsp(_contents.u[count++]))
|
||
blen++;
|
||
return blen;
|
||
}
|
||
else
|
||
return _count;
|
||
}
|
||
|
||
@end
|
||
|
||
|
||
|
||
static BOOL
|
||
literalIsEqual(NXConstantString *self, id anObject)
|
||
{
|
||
Class c;
|
||
|
||
if (anObject == (id)self)
|
||
{
|
||
return YES;
|
||
}
|
||
if (anObject == nil)
|
||
{
|
||
return NO;
|
||
}
|
||
#if defined(OBJC_SMALL_OBJECT_SHIFT) && (OBJC_SMALL_OBJECT_SHIFT == 3)
|
||
if (useTinyStrings)
|
||
{
|
||
uintptr_t s = (uintptr_t)anObject;
|
||
|
||
if (s & TINY_STRING_MASK)
|
||
{
|
||
return tinyEqualToString((uintptr_t)anObject, self);
|
||
}
|
||
}
|
||
#endif
|
||
if (GSObjCIsInstance(anObject) == NO)
|
||
{
|
||
return NO;
|
||
}
|
||
c = object_getClass(anObject);
|
||
if (c == NSConstantStringClass)
|
||
{
|
||
NXConstantString *other = (NXConstantString*)anObject;
|
||
|
||
if (other->nxcslen != self->nxcslen
|
||
|| strcmp(other->nxcsptr, self->nxcsptr) != 0)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
else if (c == GSMutableStringClass || GSObjCIsKindOf(c, GSStringClass) == YES)
|
||
{
|
||
return literalIsEqualInternal(self, (GSStr)anObject);
|
||
}
|
||
else if (YES == [anObject isKindOfClass: NSStringClass]) // may be proxy
|
||
{
|
||
unichar (*imp)(id, SEL, NSUInteger);
|
||
NSUInteger len = [anObject length];
|
||
NSUInteger pos = 0;
|
||
unichar n = 0;
|
||
unsigned i = 0;
|
||
unichar u;
|
||
|
||
if (len > self->nxcslen)
|
||
{
|
||
/* Since UTF-8 is a multibyte character set, it must have at least
|
||
* as many bytes as another string of the same length. So if the
|
||
* UTF-8 string is shorter, the two cannot be equal.
|
||
*/
|
||
return NO;
|
||
}
|
||
|
||
/* Do a character by character comparison using characterAtIndex:
|
||
*/
|
||
imp = (unichar(*)(id,SEL,NSUInteger))[anObject methodForSelector:
|
||
@selector(characterAtIndex:)];
|
||
while (i < self->nxcslen || n > 0)
|
||
{
|
||
u = nextUTF8((const uint8_t *)self->nxcsptr,
|
||
self->nxcslen, &i, &n);
|
||
if (pos >= len
|
||
|| (*imp)(anObject, @selector(characterAtIndex:), pos) != u)
|
||
{
|
||
return NO;
|
||
}
|
||
pos++;
|
||
}
|
||
if (pos != len)
|
||
{
|
||
return NO;
|
||
}
|
||
return YES;
|
||
}
|
||
return NO;
|
||
}
|
||
|
||
/**
|
||
* <p>The NXConstantString class is used by the compiler for constant
|
||
* strings, as such its ivar layout is determined by the compiler
|
||
* and consists of a pointer (_contents.c) and a character count
|
||
* (_count).
|
||
*/
|
||
@implementation NXConstantString
|
||
|
||
+ (void) initialize
|
||
{
|
||
if (self == [NXConstantString class])
|
||
{
|
||
NSConstantStringClass = self;
|
||
}
|
||
}
|
||
|
||
- (const char*) UTF8String
|
||
{
|
||
return nxcsptr;
|
||
}
|
||
|
||
- (unichar) characterAtIndex: (NSUInteger)index
|
||
{
|
||
NSUInteger l = 0;
|
||
unichar u;
|
||
unichar n = 0;
|
||
unsigned i = 0;
|
||
|
||
while (i < nxcslen || n > 0)
|
||
{
|
||
u = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
if (l++ == index)
|
||
{
|
||
return u;
|
||
}
|
||
}
|
||
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"-characterAtIndex: index out of range"];
|
||
return 0;
|
||
}
|
||
|
||
- (BOOL) canBeConvertedToEncoding: (NSStringEncoding)encoding
|
||
{
|
||
/* If the string contains bad (non-utf8) data, the lengthUTF8() function
|
||
* will raise an exception ... we catch it and return NO in that case
|
||
* since this method is not expected to raise exceptions.
|
||
*/
|
||
NS_DURING
|
||
{
|
||
if (NSASCIIStringEncoding == encoding)
|
||
{
|
||
BOOL ascii;
|
||
|
||
lengthUTF8((const uint8_t*)nxcsptr, nxcslen, &ascii, 0);
|
||
NS_VALRETURN(ascii);
|
||
}
|
||
else if (NSISOLatin1StringEncoding == encoding)
|
||
{
|
||
BOOL latin1;
|
||
|
||
lengthUTF8((const uint8_t*)nxcsptr, nxcslen, 0, &latin1);
|
||
NS_VALRETURN(latin1);
|
||
}
|
||
else if (NSUTF8StringEncoding == encoding
|
||
|| NSUnicodeStringEncoding == encoding)
|
||
{
|
||
lengthUTF8((const uint8_t*)nxcsptr, nxcslen, 0, 0);
|
||
NS_VALRETURN(YES);
|
||
}
|
||
else
|
||
{
|
||
id d = [self dataUsingEncoding: encoding allowLossyConversion: NO];
|
||
|
||
NS_VALRETURN(d != nil ? YES : NO);
|
||
}
|
||
}
|
||
NS_HANDLER
|
||
{
|
||
return NO;
|
||
}
|
||
NS_ENDHANDLER
|
||
}
|
||
|
||
- (NSData*) dataUsingEncoding: (NSStringEncoding)encoding
|
||
allowLossyConversion: (BOOL)flag
|
||
{
|
||
BOOL ascii;
|
||
BOOL latin1;
|
||
unsigned length;
|
||
|
||
if (0 == nxcslen)
|
||
{
|
||
return [NSDataClass data];
|
||
}
|
||
|
||
/* Check what is actually in this string ... if it's corrupt an exception
|
||
* is raised.
|
||
*/
|
||
length = lengthUTF8((const uint8_t*)nxcsptr, nxcslen, &ascii, &latin1);
|
||
|
||
if (NSUTF8StringEncoding == encoding)
|
||
{
|
||
/* We want utf-8, so we can just return an object pointing to the
|
||
* constant string data since e just checked that it's UTF8 in
|
||
* lengthUTF8().
|
||
*/
|
||
return [NSDataClass dataWithBytesNoCopy: (void*)nxcsptr
|
||
length: nxcslen
|
||
freeWhenDone: NO];
|
||
}
|
||
|
||
if (YES == ascii && GSPrivateIsByteEncoding(encoding))
|
||
{
|
||
/* The constant string data is just ascii, so we can return a
|
||
* pointer to it directly for any encoding which has ascii as
|
||
* a subset.
|
||
*/
|
||
return [NSDataClass dataWithBytesNoCopy: (void*)nxcsptr
|
||
length: nxcslen
|
||
freeWhenDone: NO];
|
||
}
|
||
|
||
if (YES == latin1 && NSISOLatin1StringEncoding == encoding)
|
||
{
|
||
unsigned i = 0;
|
||
unichar n = 0;
|
||
uint8_t *b;
|
||
|
||
/* If all the characters are latin1 we can copy them efficiently.
|
||
*/
|
||
b = NSAllocateCollectable(length, 0);
|
||
while (i < length)
|
||
{
|
||
b[i] = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
}
|
||
return [NSDataClass dataWithBytesNoCopy: (void*)b
|
||
length: length
|
||
freeWhenDone: YES];
|
||
}
|
||
|
||
return [super dataUsingEncoding: encoding allowLossyConversion: flag];
|
||
}
|
||
|
||
- (void) dealloc
|
||
{
|
||
GSNOSUPERDEALLOC;
|
||
}
|
||
|
||
- (void) getCharacters: (unichar*)buffer
|
||
range: (NSRange)aRange
|
||
{
|
||
unichar n = 0;
|
||
unsigned i = 0;
|
||
NSUInteger max = NSMaxRange(aRange);
|
||
NSUInteger index = 0;
|
||
|
||
if (NSNotFound == aRange.location)
|
||
[NSException raise: NSRangeException format:
|
||
@"in %s, range { %"PRIuPTR", %"PRIuPTR" } extends beyond string",
|
||
GSNameFromSelector(_cmd), aRange.location, aRange.length];
|
||
|
||
while (index < aRange.location && (i < nxcslen || n > 0))
|
||
{
|
||
nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
index++;
|
||
}
|
||
if (index == aRange.location)
|
||
{
|
||
while (index < max && (i < nxcslen || n > 0))
|
||
{
|
||
*buffer++ = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
index++;
|
||
}
|
||
}
|
||
if (index != max)
|
||
{
|
||
[NSException raise: NSRangeException format:
|
||
@"in %s, range { %"PRIuPTR", %"PRIuPTR" } extends beyond string",
|
||
GSNameFromSelector(_cmd), aRange.location, aRange.length];
|
||
}
|
||
}
|
||
|
||
/* Must match the implementation in NSString
|
||
* To avoid allocating memory, we build the hash incrementally.
|
||
*/
|
||
- (NSUInteger) hash
|
||
{
|
||
if (nxcslen > 0)
|
||
{
|
||
uint32_t s0 = 0;
|
||
uint32_t s1 = 0;
|
||
unichar chunk[64];
|
||
uint32_t ret;
|
||
unichar n = 0;
|
||
unsigned i = 0;
|
||
int l = 0;
|
||
uint32_t t = 0;
|
||
|
||
while (i < nxcslen)
|
||
{
|
||
chunk[l++] = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
if (64 == l)
|
||
{
|
||
GSPrivateIncrementalHash(&s0, &s1, chunk, l * sizeof(unichar));
|
||
t += l;
|
||
l = 0;
|
||
}
|
||
}
|
||
if (0 != n)
|
||
{
|
||
chunk[l++] = n; // Add final character
|
||
}
|
||
if (l > 0)
|
||
{
|
||
GSPrivateIncrementalHash(&s0, &s1, chunk, l * sizeof(unichar));
|
||
t += l;
|
||
}
|
||
ret = GSPrivateFinishHash(s0, s1, t * sizeof(unichar));
|
||
ret &= 0x0fffffff;
|
||
if (ret == 0)
|
||
{
|
||
ret = 0x0fffffff;
|
||
}
|
||
return ret;
|
||
}
|
||
else
|
||
{
|
||
return 0x0ffffffe; /* Hash for an empty string. */
|
||
}
|
||
}
|
||
|
||
- (id) initWithBytes: (const void*)bytes
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
{
|
||
[NSException raise: NSGenericException
|
||
format: @"Attempt to init a constant string"];
|
||
return nil;
|
||
}
|
||
|
||
- (id) initWithBytesNoCopy: (void*)bytes
|
||
length: (NSUInteger)length
|
||
encoding: (NSStringEncoding)encoding
|
||
freeWhenDone: (BOOL)flag
|
||
{
|
||
[NSException raise: NSGenericException
|
||
format: @"Attempt to init a constant string"];
|
||
return nil;
|
||
}
|
||
|
||
- (BOOL) isEqual: (id)anObject
|
||
{
|
||
return literalIsEqual(self, anObject);
|
||
}
|
||
|
||
- (BOOL) isEqualToString: (NSString*)other
|
||
{
|
||
return literalIsEqual(self, other);
|
||
}
|
||
|
||
- (int) intValue
|
||
{
|
||
return strtol((const char*)nxcsptr, 0, 10);
|
||
}
|
||
|
||
- (NSInteger) integerValue
|
||
{
|
||
#if GS_SIZEOF_VOIDP == GS_SIZEOF_LONG
|
||
return strtol((const char*)nxcsptr, 0, 10);
|
||
#else
|
||
return strtoll((const char*)nxcsptr, 0, 10);
|
||
#endif
|
||
}
|
||
|
||
- (NSUInteger) length
|
||
{
|
||
return lengthUTF8((const uint8_t*)nxcsptr, nxcslen, 0, 0);
|
||
}
|
||
|
||
- (long long) longLongValue
|
||
{
|
||
return strtoll((const char*)nxcsptr, 0, 10);
|
||
}
|
||
|
||
- (NSRange) rangeOfCharacterFromSet: (NSCharacterSet*)aSet
|
||
options: (NSUInteger)mask
|
||
range: (NSRange)aRange
|
||
{
|
||
NSUInteger index;
|
||
NSUInteger start;
|
||
NSUInteger stop;
|
||
NSRange range;
|
||
BOOL ascii;
|
||
|
||
index = lengthUTF8((const uint8_t*)nxcsptr, nxcslen, &ascii, 0);
|
||
GS_RANGE_CHECK(aRange, index);
|
||
|
||
start = aRange.location;
|
||
stop = NSMaxRange(aRange);
|
||
|
||
range.location = NSNotFound;
|
||
range.length = 0;
|
||
|
||
if (stop > start)
|
||
{
|
||
BOOL (*mImp)(id, SEL, unichar);
|
||
unichar n = 0;
|
||
unsigned i = 0;
|
||
|
||
mImp = (BOOL(*)(id,SEL,unichar))
|
||
[aSet methodForSelector: @selector(characterIsMember:)];
|
||
|
||
for (index = 0; index < start; index++)
|
||
{
|
||
nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
}
|
||
if ((mask & NSBackwardsSearch) == NSBackwardsSearch)
|
||
{
|
||
unichar buf[stop - start];
|
||
NSUInteger pos = 0;
|
||
|
||
for (pos = 0; pos + start < stop; pos++)
|
||
{
|
||
buf[pos] = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
}
|
||
index = stop;
|
||
while (index-- > start)
|
||
{
|
||
if ((*mImp)(aSet, @selector(characterIsMember:), buf[--pos]))
|
||
{
|
||
range = NSMakeRange(index, 1);
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
else
|
||
{
|
||
while (index < stop)
|
||
{
|
||
unichar letter;
|
||
|
||
letter = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
if ((*mImp)(aSet, @selector(characterIsMember:), letter))
|
||
{
|
||
range = NSMakeRange(index, 1);
|
||
break;
|
||
}
|
||
index++;
|
||
}
|
||
}
|
||
}
|
||
|
||
return range;
|
||
}
|
||
|
||
- (NSRange) rangeOfComposedCharacterSequenceAtIndex: (NSUInteger)anIndex
|
||
{
|
||
NSUInteger start = 0;
|
||
NSUInteger pos = 0;
|
||
unichar n = 0;
|
||
unsigned i = 0;
|
||
unichar u;
|
||
|
||
/* A composed character sequence consists of a single base character
|
||
* followed by zero or more non-base characters.
|
||
*/
|
||
while (i < nxcslen || n > 0)
|
||
{
|
||
u = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
if (!uni_isnonsp(u))
|
||
{
|
||
/* This may be the base character at the start of the sequence.
|
||
*/
|
||
start = pos;
|
||
}
|
||
if (pos++ == anIndex)
|
||
{
|
||
/* Look ahead to see if the character at the specified index is
|
||
* followed by one or more non-base characters. If it is, we
|
||
* make the range longer before returning it.
|
||
*/
|
||
while (i < nxcslen || n > 0)
|
||
{
|
||
u = nextUTF8((const uint8_t *)nxcsptr, nxcslen, &i, &n);
|
||
if (!uni_isnonsp(u))
|
||
{
|
||
break;
|
||
}
|
||
pos++;
|
||
}
|
||
return NSMakeRange(start, pos - start);
|
||
}
|
||
}
|
||
|
||
[NSException raise: NSInvalidArgumentException
|
||
format: @"-rangeOfComposedCharacterSequenceAtIndex: index out of range"];
|
||
return NSMakeRange(NSNotFound, 0);
|
||
}
|
||
|
||
- (id) retain
|
||
{
|
||
return self;
|
||
}
|
||
|
||
- (oneway void) release
|
||
{
|
||
return;
|
||
}
|
||
|
||
- (id) autorelease
|
||
{
|
||
return self;
|
||
}
|
||
|
||
- (id) copyWithZone: (NSZone*)z
|
||
{
|
||
return self;
|
||
}
|
||
|
||
- (NSZone*) zone
|
||
{
|
||
return NSDefaultMallocZone();
|
||
}
|
||
|
||
- (NSStringEncoding) fastestEncoding
|
||
{
|
||
return NSUTF8StringEncoding;
|
||
}
|
||
|
||
- (NSStringEncoding) smallestEncoding
|
||
{
|
||
return NSUTF8StringEncoding;
|
||
}
|
||
|
||
@end
|
||
|
||
|
||
/**
|
||
* Append characters to a string.
|
||
*/
|
||
void
|
||
GSPrivateStrAppendUnichars(GSStr s, const unichar *u, unsigned l)
|
||
{
|
||
/*
|
||
* Make the string wide if necessary.
|
||
*/
|
||
if (s->_flags.wide == 0)
|
||
{
|
||
BOOL widen = NO;
|
||
|
||
if (internalEncoding == NSISOLatin1StringEncoding)
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < l; i++)
|
||
{
|
||
if (u[i] > 255)
|
||
{
|
||
widen = YES;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < l; i++)
|
||
{
|
||
if (u[i] > 127)
|
||
{
|
||
widen = YES;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
if (widen == YES)
|
||
{
|
||
GSStrWiden(s);
|
||
}
|
||
}
|
||
|
||
/*
|
||
* Make room for the characters we are appending.
|
||
*/
|
||
if (s->_count + l + 1 >= s->_capacity)
|
||
{
|
||
GSStrMakeSpace(s, l);
|
||
}
|
||
|
||
/*
|
||
* Copy the characters into place.
|
||
*/
|
||
if (s->_flags.wide == 1)
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < l; i++)
|
||
{
|
||
s->_contents.u[s->_count++] = u[i];
|
||
}
|
||
}
|
||
else
|
||
{
|
||
unsigned i;
|
||
|
||
for (i = 0; i < l; i++)
|
||
{
|
||
s->_contents.c[s->_count++] = u[i];
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
void
|
||
GSPrivateStrExternalize(GSStr s)
|
||
{
|
||
if (s->_flags.wide == 0 && internalEncoding != externalEncoding)
|
||
{
|
||
GSStrWiden(s);
|
||
}
|
||
}
|
||
|