blob: ab75b264e2b6e66843f831e3bdddad05f46c8a2c [file] [log] [blame]
/*
* Copyright (C) 2003 Lars Knoll (knoll@kde.org)
* Copyright (C) 2005 Allan Sandfeld Jensen (kde@carewolf.com)
* Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012 Apple Inc. All rights reserved.
* Copyright (C) 2007 Nicholas Shanks <webkit@nickshanks.com>
* Copyright (C) 2008 Eric Seidel <eric@webkit.org>
* Copyright (C) 2009 Torch Mobile Inc. All rights reserved. (http://www.torchmobile.com/)
* Copyright (C) 2012 Adobe Systems Incorporated. All rights reserved.
* Copyright (C) 2012 Intel Corporation. All rights reserved.
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Library General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Library General Public License for more details.
*
* You should have received a copy of the GNU Library General Public License
* along with this library; see the file COPYING.LIB. If not, write to
* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
* Boston, MA 02110-1301, USA.
*/
#include "sky/engine/core/css/CSSMarkup.h"
#include "sky/engine/wtf/HexNumber.h"
#include "sky/engine/wtf/text/StringBuffer.h"
namespace blink {
template <typename CharacterType>
static inline bool isCSSTokenizerIdentifier(const CharacterType* characters, unsigned length)
{
const CharacterType* end = characters + length;
// -?
if (characters != end && characters[0] == '-')
++characters;
// {nmstart}
if (characters == end || !(characters[0] == '_' || characters[0] >= 128 || isASCIIAlpha(characters[0])))
return false;
++characters;
// {nmchar}*
for (; characters != end; ++characters) {
if (!(characters[0] == '_' || characters[0] == '-' || characters[0] >= 128 || isASCIIAlphanumeric(characters[0])))
return false;
}
return true;
}
// "ident" from the CSS tokenizer, minus backslash-escape sequences
static bool isCSSTokenizerIdentifier(const String& string)
{
unsigned length = string.length();
if (!length)
return false;
if (string.is8Bit())
return isCSSTokenizerIdentifier(string.characters8(), length);
return isCSSTokenizerIdentifier(string.characters16(), length);
}
template <typename CharacterType>
static inline bool isCSSTokenizerURL(const CharacterType* characters, unsigned length)
{
const CharacterType* end = characters + length;
for (; characters != end; ++characters) {
CharacterType c = characters[0];
switch (c) {
case '!':
case '#':
case '$':
case '%':
case '&':
break;
default:
if (c < '*')
return false;
if (c <= '~')
break;
if (c < 128)
return false;
}
}
return true;
}
// "url" from the CSS tokenizer, minus backslash-escape sequences
static bool isCSSTokenizerURL(const String& string)
{
unsigned length = string.length();
if (!length)
return true;
if (string.is8Bit())
return isCSSTokenizerURL(string.characters8(), length);
return isCSSTokenizerURL(string.characters16(), length);
}
template <typename CharacterType>
static inline String quoteCSSStringInternal(const CharacterType* characters, unsigned length)
{
// For efficiency, we first pre-calculate the length of the quoted string, then we build the actual one.
// Please see below for the actual logic.
unsigned quotedStringSize = 2; // Two quotes surrounding the entire string.
bool afterEscape = false;
for (unsigned i = 0; i < length; ++i) {
CharacterType ch = characters[i];
if (ch == '\\' || ch == '\'') {
quotedStringSize += 2;
afterEscape = false;
} else if (ch < 0x20 || ch == 0x7F) {
quotedStringSize += 2 + (ch >= 0x10);
afterEscape = true;
} else {
quotedStringSize += 1 + (afterEscape && (isASCIIHexDigit(ch) || ch == ' '));
afterEscape = false;
}
}
StringBuffer<CharacterType> buffer(quotedStringSize);
unsigned index = 0;
buffer[index++] = '\'';
afterEscape = false;
for (unsigned i = 0; i < length; ++i) {
CharacterType ch = characters[i];
if (ch == '\\' || ch == '\'') {
buffer[index++] = '\\';
buffer[index++] = ch;
afterEscape = false;
} else if (ch < 0x20 || ch == 0x7F) { // Control characters.
buffer[index++] = '\\';
placeByteAsHexCompressIfPossible(ch, buffer, index, Lowercase);
afterEscape = true;
} else {
// Space character may be required to separate backslash-escape sequence and normal characters.
if (afterEscape && (isASCIIHexDigit(ch) || ch == ' '))
buffer[index++] = ' ';
buffer[index++] = ch;
afterEscape = false;
}
}
buffer[index++] = '\'';
ASSERT(quotedStringSize == index);
return String::adopt(buffer);
}
// We use single quotes for now because markup.cpp uses double quotes.
String quoteCSSString(const String& string)
{
// This function expands each character to at most 3 characters ('\u0010' -> '\' '1' '0') as well as adds
// 2 quote characters (before and after). Make sure the resulting size (3 * length + 2) will not overflow unsigned.
unsigned length = string.length();
if (!length)
return String("\'\'");
if (length > std::numeric_limits<unsigned>::max() / 3 - 2)
return emptyString();
if (string.is8Bit())
return quoteCSSStringInternal(string.characters8(), length);
return quoteCSSStringInternal(string.characters16(), length);
}
String quoteCSSStringIfNeeded(const String& string)
{
return isCSSTokenizerIdentifier(string) ? string : quoteCSSString(string);
}
String quoteCSSURLIfNeeded(const String& string)
{
return isCSSTokenizerURL(string) ? string : quoteCSSString(string);
}
} // namespace blink