LineEnding.cpp   [plain text]


/*
 * Copyright (C) 2005-2017 Apple Inc. All rights reserved.
 * Copyright (C) 2010 Google Inc. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met:
 *
 *     * Redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer.
 *     * Redistributions in binary form must reproduce the above
 * copyright notice, this list of conditions and the following disclaimer
 * in the documentation and/or other materials provided with the
 * distribution.
 *     * Neither the name of Google Inc. nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "config.h"
#include "LineEnding.h"

#include <wtf/Vector.h>

namespace WTF {

// Converts every CR and CRLF sequence in the buffer to a single LF.
// The conversion happens in place: the output is never longer than the input,
// so the write cursor can never overtake the read cursor. The buffer is then
// shrunk to the number of bytes written and handed back to the caller.
Vector<uint8_t> normalizeLineEndingsToLF(Vector<uint8_t>&& vector)
{
    auto bytes = vector.data();
    const size_t inputLength = vector.size();

    size_t writeIndex = 0;
    size_t readIndex = 0;
    while (readIndex < inputLength) {
        auto byte = bytes[readIndex++];

        // Anything that is not a CR is copied through unchanged (this includes bare LF).
        if (byte != '\r') {
            bytes[writeIndex++] = byte;
            continue;
        }

        // A CR followed directly by an LF is one line ending; swallow the LF too.
        if (readIndex < inputLength && bytes[readIndex] == '\n')
            ++readIndex;
        bytes[writeIndex++] = '\n';
    }

    vector.shrink(writeIndex);
    return WTFMove(vector);
}

// Converts every line ending in the buffer (bare CR, bare LF, or CRLF) to CRLF.
// Works in two passes: the first computes the size of the normalized output,
// the second writes it into a freshly sized vector. If the computed size equals
// the input size, nothing needs rewriting and the input is returned as is.
Vector<uint8_t> normalizeLineEndingsToCRLF(Vector<uint8_t>&& source)
{
    auto input = source.data();
    const size_t inputLength = source.size();

    // Pass 1: measure the normalized length.
    size_t resultLength = 0;
    for (size_t readIndex = 0; readIndex < inputLength; ) {
        auto byte = input[readIndex++];
        const bool isCarriageReturn = byte == '\r';

        // A CR immediately followed by an LF counts as a single line ending.
        if (isCarriageReturn && readIndex < inputLength && input[readIndex] == '\n')
            ++readIndex;

        // Every line ending occupies two bytes in the output; everything else one.
        resultLength += (isCarriageReturn || byte == '\n') ? 2 : 1;
    }

    // Each bare CR or bare LF grows the output by one byte, while CRLF and
    // ordinary bytes keep their size, so equal lengths mean nothing changes.
    if (resultLength == inputLength)
        return WTFMove(source);

    // Pass 2: emit the normalized bytes.
    Vector<uint8_t> result(resultLength);
    auto output = result.data();
    size_t writeIndex = 0;
    for (size_t readIndex = 0; readIndex < inputLength; ) {
        auto byte = input[readIndex++];

        // Ordinary bytes are copied through untouched.
        if (byte != '\r' && byte != '\n') {
            output[writeIndex++] = byte;
            continue;
        }

        // For CRLF, skip the LF so the pair is emitted only once.
        if (byte == '\r' && readIndex < inputLength && input[readIndex] == '\n')
            ++readIndex;
        output[writeIndex++] = '\r';
        output[writeIndex++] = '\n';
    }
    ASSERT(writeIndex == resultLength);
    return result;
}

// Normalizes line endings to the convention selected at compile time:
// CRLF when building for Windows, LF for every other target.
Vector<uint8_t> normalizeLineEndingsToNative(Vector<uint8_t>&& from)
{
#if !OS(WINDOWS)
    return normalizeLineEndingsToLF(WTFMove(from));
#else
    return normalizeLineEndingsToCRLF(WTFMove(from));
#endif
}

} // namespace WTF