/** * This file is part of the DOM implementation for KDE. * * Copyright (C) 1999 Lars Knoll (knoll@kde.org) * (C) 1999 Antti Koivisto (koivisto@kde.org) * (C) 2001 Dirk Mueller ( mueller@kde.org ) * Copyright (C) 2003 Apple Computer, Inc. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public License * along with this library; see the file COPYING.LIB. If not, write to * the Free Software Foundation, Inc., 59 Temple Place - Suite 330, * Boston, MA 02111-1307, USA. * */ #include "dom_stringimpl.h" #include #include #include "dom_atomicstring.h" using namespace khtml; namespace DOM { using khtml::Fixed; DOMStringImpl* DOMStringImpl::empty() { static WithOneRef w; static DOMStringImpl e(w); return &e; } DOMStringImpl::DOMStringImpl(const QChar *str, unsigned int len) { _hash = 0; _inTable = false; bool havestr = str && len; s = QT_ALLOC_QCHAR_VEC( havestr ? len : 1 ); if(str && len) { memcpy( s, str, len * sizeof(QChar) ); l = len; } else { // crash protection s[0] = 0x0; l = 0; } } DOMStringImpl::DOMStringImpl(const char *str) { _hash = 0; _inTable = false; if(str && *str) { l = strlen(str); s = QT_ALLOC_QCHAR_VEC( l ); int i = l; QChar* ptr = s; while( i-- ) *ptr++ = *str++; } else { s = QT_ALLOC_QCHAR_VEC( 1 ); // crash protection s[0] = 0x0; // == QChar::null; l = 0; } } DOMStringImpl::DOMStringImpl(const char *str, unsigned int len) { _hash = 0; _inTable = false; l = len; if (!l || !str) return; s = QT_ALLOC_QCHAR_VEC(l); int i = l; QChar* ptr = s; while( i-- ) *ptr++ = *str++; } DOMStringImpl::DOMStringImpl(const QChar &ch) { _hash = 0; _inTable = false; s = QT_ALLOC_QCHAR_VEC( 1 ); s[0] = ch; l = 1; } DOMStringImpl::~DOMStringImpl() { if (_inTable) AtomicString::remove(this); if (s) QT_DELETE_QCHAR_VEC(s); } void DOMStringImpl::append(DOMStringImpl *str) { assert(!_inTable); if(str && str->l != 0) { int newlen = l+str->l; QChar *c = QT_ALLOC_QCHAR_VEC(newlen); memcpy(c, s, l*sizeof(QChar)); memcpy(c+l, str->s, str->l*sizeof(QChar)); if(s) QT_DELETE_QCHAR_VEC(s); s = c; l = newlen; } } void DOMStringImpl::insert(DOMStringImpl *str, uint pos) { assert(!_inTable); if(pos > l) { append(str); return; } if(str && str->l != 0) { int newlen = l+str->l; QChar *c = QT_ALLOC_QCHAR_VEC(newlen); memcpy(c, s, pos*sizeof(QChar)); memcpy(c+pos, str->s, str->l*sizeof(QChar)); memcpy(c+pos+str->l, s+pos, (l-pos)*sizeof(QChar)); if(s) QT_DELETE_QCHAR_VEC(s); s = c; l = newlen; } } void DOMStringImpl::truncate(int len) { assert(!_inTable); if(len > (int)l) return; int nl = len < 1 ? 1 : len; QChar *c = QT_ALLOC_QCHAR_VEC(nl); memcpy(c, s, nl*sizeof(QChar)); if(s) QT_DELETE_QCHAR_VEC(s); s = c; l = len; } void DOMStringImpl::remove(uint pos, int len) { assert(!_inTable); if(len <= 0) return; if(pos >= l ) return; if((unsigned)len > l - pos) len = l - pos; uint newLen = l-len; QChar *c = QT_ALLOC_QCHAR_VEC(newLen); memcpy(c, s, pos*sizeof(QChar)); memcpy(c+pos, s+pos+len, (l-len-pos)*sizeof(QChar)); if(s) QT_DELETE_QCHAR_VEC(s); s = c; l = newLen; } DOMStringImpl *DOMStringImpl::split(uint pos) { assert(!_inTable); if( pos >=l ) return new DOMStringImpl(); uint newLen = l-pos; QChar *c = QT_ALLOC_QCHAR_VEC(newLen); memcpy(c, s+pos, newLen*sizeof(QChar)); DOMStringImpl *str = new DOMStringImpl(s + pos, newLen); truncate(pos); return str; } bool DOMStringImpl::containsOnlyWhitespace() const { return containsOnlyWhitespace(0, l); } bool DOMStringImpl::containsOnlyWhitespace(unsigned int from, unsigned int len) const { if (!s) return true; for (uint i = from; i < len; i++) { QChar c = s[i]; if (c.unicode() <= 0x7F) { if (!isspace(c.unicode())) return false; } else return false; } return true; } DOMStringImpl *DOMStringImpl::substring(uint pos, uint len) { if (pos >=l) return new DOMStringImpl(); if (len > l - pos) len = l - pos; return new DOMStringImpl(s + pos, len); } static Length parseLength(QChar *s, unsigned int l) { const QChar* last = s+l-1; if ( *last == QChar('%')) { // CSS allows one decimal after the point, like // 42.2%, but not 42.22% // we ignore the non-integer part for speed/space reasons int i = QConstString(s, l).string().findRev('.'); if ( i >= 0 && i < (int)l-1 ) l = i + 1; return Length(QConstString(s, l-1).string().toInt(), Percent); } if ( *last == QChar('*')) { if(l == 1) return Length(1, Relative); else return Length(QConstString(s, l-1).string().toInt(), Relative); } // should we strip of the non-integer part here also? // CSS says no, all important browsers do so, including Mozilla. sigh. bool ok; // this ugly construct helps in case someone specifies a length as "100." int v = (int) QConstString(s, l).string().toFloat(&ok); if(ok) { return Length(v, Fixed); } return Length(0, Variable); } Length DOMStringImpl::toLength() const { return parseLength(s,l); } khtml::Length* DOMStringImpl::toLengthArray(int& len) const { #if !APPLE_CHANGES QString str(s, l); #endif /* APPLE_CHANGES not defined */ int pos = 0; int pos2; // web authors are so stupid. This is a workaround // to fix lists like "1,2px 3 ,4" // make sure not to break percentage or relative widths // ### what about "auto" ? #if APPLE_CHANGES // This alternate version works around a limitation in our QString implementation. QChar spacified[l]; QChar space(' '); for(unsigned int i=0; i < l; i++) { QChar cc = s[i]; if ( cc > '9' || ( cc < '0' && cc != '-' && cc != '*' && cc != '%' && cc != '.') ){ spacified[i] = space; } else { spacified[i] = cc; } } QString str(spacified, l); #else /* APPLE_CHANGES not defined */ QChar space(' '); for(unsigned int i=0; i < l; i++) { char cc = str[i].latin1(); if ( cc > '9' || ( cc < '0' && cc != '-' && cc != '*' && cc != '%' && cc != '.') ) str[i] = space; } #endif /* APPLE_CHANGES not defined */ str = str.simplifyWhiteSpace(); len = str.contains(' ') + 1; khtml::Length* r = new khtml::Length[len]; int i = 0; while((pos2 = str.find(' ', pos)) != -1) { r[i++] = parseLength((QChar *) str.unicode()+pos, pos2-pos); pos = pos2+1; } r[i] = parseLength((QChar *) str.unicode()+pos, str.length()-pos); return r; } bool DOMStringImpl::isLower() const { unsigned int i; for (i = 0; i < l; i++) if (s[i].lower() != s[i]) return false; return true; } DOMStringImpl *DOMStringImpl::lower() const { DOMStringImpl *c = new DOMStringImpl; if(!l) return c; c->s = QT_ALLOC_QCHAR_VEC(l); c->l = l; for (unsigned int i = 0; i < l; i++) c->s[i] = s[i].lower(); return c; } DOMStringImpl *DOMStringImpl::upper() const { DOMStringImpl *c = new DOMStringImpl; if(!l) return c; c->s = QT_ALLOC_QCHAR_VEC(l); c->l = l; for (unsigned int i = 0; i < l; i++) c->s[i] = s[i].upper(); return c; } DOMStringImpl *DOMStringImpl::capitalize() const { DOMStringImpl *c = new DOMStringImpl; if(!l) return c; c->s = QT_ALLOC_QCHAR_VEC(l); c->l = l; if ( l ) c->s[0] = s[0].upper(); for (unsigned int i = 1; i < l; i++) c->s[i] = s[i-1].isLetterOrNumber() ? s[i] : s[i].upper(); return c; } int DOMStringImpl::toInt(bool *ok) const { unsigned i = 0; // Allow leading spaces. for (; i != l; ++i) { if (!s[i].isSpace()) { break; } } // Allow sign. if (i != l) { if (s[i] == '+' || s[i] == '-') { ++i; } } // Allow digits. for (; i != l; ++i) { if (!s[i].isDigit()) { break; } } return QConstString(s, i).string().toInt(ok); } DOMStringImpl *DOMStringImpl::replace(QChar oldC, QChar newC) { if (oldC == newC) return this; unsigned i; for (i = 0; i != l; ++i) if (s[i] == oldC) break; if (i == l) return this; DOMStringImpl *c = new DOMStringImpl; c->s = QT_ALLOC_QCHAR_VEC(l); c->l = l; for (i = 0; i != l; ++i) { QChar ch = s[i]; if (ch == oldC) ch = newC; c->s[i] = ch; } return c; } // Golden ratio - arbitrary start value to avoid mapping all 0's to all 0's // or anything like that. const unsigned PHI = 0x9e3779b9U; // This hash algorithm comes from: // http://burtleburtle.net/bob/hash/hashfaq.html // http://burtleburtle.net/bob/hash/doobs.html unsigned DOMStringImpl::computeHash(const QChar *s, int length) { int prefixLength = length < 8 ? length : 8; int suffixPosition = length < 16 ? 8 : length - 8; unsigned h = PHI; h += length; h += (h << 10); h ^= (h << 6); for (int i = 0; i < prefixLength; i++) { h += s[i].unicode(); h += (h << 10); h ^= (h << 6); } for (int i = suffixPosition; i < length; i++){ h += s[i].unicode(); h += (h << 10); h ^= (h << 6); } h += (h << 3); h ^= (h >> 11); h += (h << 15); if (h == 0) h = 0x80000000; return h; } // This hash algorithm comes from: // http://burtleburtle.net/bob/hash/hashfaq.html // http://burtleburtle.net/bob/hash/doobs.html unsigned DOMStringImpl::computeHash(const char *s) { int length = strlen(s); int prefixLength = length < 8 ? length : 8; int suffixPosition = length < 16 ? 8 : length - 8; unsigned h = PHI; h += length; h += (h << 10); h ^= (h << 6); for (int i = 0; i < prefixLength; i++) { h += (unsigned char)s[i]; h += (h << 10); h ^= (h << 6); } for (int i = suffixPosition; i < length; i++) { h += (unsigned char)s[i]; h += (h << 10); h ^= (h << 6); } h += (h << 3); h ^= (h >> 11); h += (h << 15); if (h == 0) h = 0x80000000; return h; } const char *DOMStringImpl::ascii() const { char *buffer = new char[l + 1]; char *p = buffer; for (unsigned i = 0; i != l; ++i) { unsigned short c = s[i].unicode(); if (c >= 0x20 && c < 0x7F) *p++ = c; else *p++ = '?'; } *p++ = '\0'; return buffer; } } // namespace DOM