Source/WebCore/platform/network/FormDataBuilder.cpp - WebKit - Git at Google

 /*
  * Copyright (C) 1999 Lars Knoll (knoll@kde.org)
  *           (C) 1999 Antti Koivisto (koivisto@kde.org)
  *           (C) 2001 Dirk Mueller (mueller@kde.org)
  * Copyright (C) 2004-2017 Apple Inc. All rights reserved.
  *           (C) 2006 Alexey Proskuryakov (ap@nypop.com)
  * Copyright (C) 2008 Torch Mobile Inc. All rights reserved. (http://www.torchmobile.com/)
  *
  * This library is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Library General Public
  * License as published by the Free Software Foundation; either
  * version 2 of the License, or (at your option) any later version.
  *
  * This library is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Library General Public License for more details.
  *
  * You should have received a copy of the GNU Library General Public License
  * along with this library; see the file COPYING.LIB.  If not, write to
  * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
  * Boston, MA 02110-1301, USA.
  */

 #include "config.h"
 #include "FormDataBuilder.h"

 #include "Blob.h"
 #include "TextEncoding.h"
 #include <limits>
 #include <wtf/Assertions.h>
 #include <wtf/HexNumber.h>
 #include <wtf/RandomNumber.h>
 #include <wtf/text/CString.h>
 #include <wtf/text/StringView.h>

 namespace WebCore {

 namespace FormDataBuilder {

 static inline void append(Vector<char>& buffer, char string)
 {
     buffer.append(string);
 }

 static inline void append(Vector<char>& buffer, const char* string)
 {
     buffer.append(string, strlen(string));
 }

 static inline void append(Vector<char>& buffer, const CString& string)
 {
     buffer.append(string.data(), string.length());
 }

 static inline void append(Vector<char>& buffer, const Vector<uint8_t>& string)
 {
     buffer.appendVector(string);
 }

 static void appendQuoted(Vector<char>& buffer, const Vector<uint8_t>& string)
 {
     // Append a string as a quoted value, escaping quotes and line breaks.
     // FIXME: Is it correct to use percent escaping here? When this code was originally written,
     // other browsers were not encoding these characters, so someone should test servers or do
     // research to find out if there is an encoding form that works well.
     // FIXME: If we want to use percent escaping sensibly, we need to escape "%" characters too.
     size_t size = string.size();
     for (size_t i = 0; i < size; ++i) {
         auto character = string[i];
         switch (character) {
         case 0xA:
             append(buffer, "%0A");
             break;
         case 0xD:
             append(buffer, "%0D");
             break;
         case '"':
             append(buffer, "%22");
             break;
         default:
             append(buffer, character);
         }
     }
 }

 // https://url.spec.whatwg.org/#concept-urlencoded-byte-serializer
 static void appendFormURLEncoded(Vector<char>& buffer, const uint8_t* string, size_t length)
 {
     static const char safeCharacters[] = "-._*";
     for (size_t i = 0; i < length; ++i) {
         auto character = string[i];
         if (isASCIIAlphanumeric(character) || strchr(safeCharacters, character))
             append(buffer, character);
         else if (character == ' ')
             append(buffer, '+');
         else if (character == '\n' || (character == '\r' && (i + 1 >= length || string[i + 1] != '\n')))
             append(buffer, "%0D%0A"); // FIXME: Unclear exactly where this rule about normalizing line endings to CRLF comes from.
         else if (character != '\r') {
             append(buffer, '%');
             auto hexBuffer = hex(character, 2);
             append(buffer, hexBuffer.characters()[0]);
             append(buffer, hexBuffer.characters()[1]);
         }
     }
 }

 static void appendFormURLEncoded(Vector<char>& buffer, const Vector<uint8_t>& string)
 {
     appendFormURLEncoded(buffer, string.data(), string.size());
 }

 Vector<char> generateUniqueBoundaryString()
 {
     Vector<char> boundary;

     // The RFC 2046 spec says the alphanumeric characters plus the
     // following characters are legal for boundaries:  '()+_,-./:=?
     // However the following characters, though legal, cause some sites
     // to fail: (),./:=+
     // Note that our algorithm makes it twice as much likely for 'A' or 'B'
     // to appear in the boundary string, because 0x41 and 0x42 are present in
     // the below array twice.
     static const char alphaNumericEncodingMap[64] = {
         0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48,
         0x49, 0x4A, 0x4B, 0x4C, 0x4D, 0x4E, 0x4F, 0x50,
         0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58,
         0x59, 0x5A, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66,
         0x67, 0x68, 0x69, 0x6A, 0x6B, 0x6C, 0x6D, 0x6E,
         0x6F, 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76,
         0x77, 0x78, 0x79, 0x7A, 0x30, 0x31, 0x32, 0x33,
         0x34, 0x35, 0x36, 0x37, 0x38, 0x39, 0x41, 0x42
     };

     // Start with an informative prefix.
     append(boundary, "----WebKitFormBoundary");

     // Append 16 random 7bit ascii AlphaNumeric characters.
     Vector<char> randomBytes;

     for (unsigned i = 0; i < 4; ++i) {
         unsigned randomness = static_cast<unsigned>(randomNumber() * (std::numeric_limits<unsigned>::max() + 1.0));
         randomBytes.append(alphaNumericEncodingMap[(randomness >> 24) & 0x3F]);
         randomBytes.append(alphaNumericEncodingMap[(randomness >> 16) & 0x3F]);
         randomBytes.append(alphaNumericEncodingMap[(randomness >> 8) & 0x3F]);
         randomBytes.append(alphaNumericEncodingMap[randomness & 0x3F]);
     }

     boundary.appendVector(randomBytes);
     boundary.append(0); // Add a 0 at the end so we can use this as a C-style string.
     return boundary;
 }

 void beginMultiPartHeader(Vector<char>& buffer, const CString& boundary, const Vector<uint8_t>& name)
 {
     addBoundaryToMultiPartHeader(buffer, boundary);

     // FIXME: This loses data irreversibly if the input name includes characters you can't encode
     // in the website's character set.
     append(buffer, "Content-Disposition: form-data; name=\"");
     appendQuoted(buffer, name);
     append(buffer, '"');
 }

 void addBoundaryToMultiPartHeader(Vector<char>& buffer, const CString& boundary, bool isLastBoundary)
 {
     append(buffer, "--");
     append(buffer, boundary);

     if (isLastBoundary)
         append(buffer, "--");

     append(buffer, "\r\n");
 }

 void addFilenameToMultiPartHeader(Vector<char>& buffer, const TextEncoding& encoding, const String& filename)
 {
     // FIXME: This loses data irreversibly if the filename includes characters you can't encode
     // in the website's character set.
     append(buffer, "; filename=\"");
     appendQuoted(buffer, encoding.encode(filename, UnencodableHandling::QuestionMarks));
     append(buffer, '"');
 }

 void addContentTypeToMultiPartHeader(Vector<char>& buffer, const CString& mimeType)
 {
     ASSERT(Blob::isNormalizedContentType(mimeType));
     append(buffer, "\r\nContent-Type: ");
     append(buffer, mimeType);
 }

 void finishMultiPartHeader(Vector<char>& buffer)
 {
     append(buffer, "\r\n\r\n");
 }

 void addKeyValuePairAsFormData(Vector<char>& buffer, const Vector<uint8_t>& key, const Vector<uint8_t>& value, FormData::EncodingType encodingType)
 {
     if (encodingType == FormData::TextPlain) {
         if (!buffer.isEmpty())
             append(buffer, "\r\n");
         append(buffer, key);
         append(buffer, '=');
         append(buffer, value);
     } else {
         if (!buffer.isEmpty())
             append(buffer, '&');
         appendFormURLEncoded(buffer, key);
         append(buffer, '=');
         appendFormURLEncoded(buffer, value);
     }
 }

 void encodeStringAsFormData(Vector<char>& buffer, const CString& string)
 {
     appendFormURLEncoded(buffer, reinterpret_cast<const uint8_t*>(string.data()), string.length());
 }

 }

 }
	/*
	* Copyright (C) 1999 Lars Knoll (knoll@kde.org)
	* (C) 1999 Antti Koivisto (koivisto@kde.org)
	* (C) 2001 Dirk Mueller (mueller@kde.org)
	* Copyright (C) 2004-2017 Apple Inc. All rights reserved.
	* (C) 2006 Alexey Proskuryakov (ap@nypop.com)
	* Copyright (C) 2008 Torch Mobile Inc. All rights reserved. (http://www.torchmobile.com/)
	*
	* This library is free software; you can redistribute it and/or
	* modify it under the terms of the GNU Library General Public
	* License as published by the Free Software Foundation; either
	* version 2 of the License, or (at your option) any later version.
	*
	* This library is distributed in the hope that it will be useful,
	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	* Library General Public License for more details.
	*
	* You should have received a copy of the GNU Library General Public License
	* along with this library; see the file COPYING.LIB. If not, write to
	* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
	* Boston, MA 02110-1301, USA.
	*/

	#include "config.h"
	#include "FormDataBuilder.h"

	#include "Blob.h"
	#include "TextEncoding.h"
	#include <limits>
	#include <wtf/Assertions.h>
	#include <wtf/HexNumber.h>
	#include <wtf/RandomNumber.h>
	#include <wtf/text/CString.h>
	#include <wtf/text/StringView.h>

	namespace WebCore {

	namespace FormDataBuilder {

	static inline void append(Vector<char>& buffer, char string)
	{
	buffer.append(string);
	}

	static inline void append(Vector<char>& buffer, const char* string)
	{
	buffer.append(string, strlen(string));
	}

	static inline void append(Vector<char>& buffer, const CString& string)
	{
	buffer.append(string.data(), string.length());
	}

	static inline void append(Vector<char>& buffer, const Vector<uint8_t>& string)
	{
	buffer.appendVector(string);
	}

	static void appendQuoted(Vector<char>& buffer, const Vector<uint8_t>& string)
	{
	// Append a string as a quoted value, escaping quotes and line breaks.
	// FIXME: Is it correct to use percent escaping here? When this code was originally written,
	// other browsers were not encoding these characters, so someone should test servers or do
	// research to find out if there is an encoding form that works well.
	// FIXME: If we want to use percent escaping sensibly, we need to escape "%" characters too.
	size_t size = string.size();
	for (size_t i = 0; i < size; ++i) {
	auto character = string[i];
	switch (character) {
	case 0xA:
	append(buffer, "%0A");
	break;
	case 0xD:
	append(buffer, "%0D");
	break;
	case '"':
	append(buffer, "%22");
	break;
	default:
	append(buffer, character);
	}
	}
	}

	// https://url.spec.whatwg.org/#concept-urlencoded-byte-serializer
	static void appendFormURLEncoded(Vector<char>& buffer, const uint8_t* string, size_t length)
	{
	static const char safeCharacters[] = "-._*";
	for (size_t i = 0; i < length; ++i) {
	auto character = string[i];
	if (isASCIIAlphanumeric(character) \|\| strchr(safeCharacters, character))
	append(buffer, character);
	else if (character == ' ')
	append(buffer, '+');
	else if (character == '\n' \|\| (character == '\r' && (i + 1 >= length \|\| string[i + 1] != '\n')))
	append(buffer, "%0D%0A"); // FIXME: Unclear exactly where this rule about normalizing line endings to CRLF comes from.
	else if (character != '\r') {
	append(buffer, '%');
	auto hexBuffer = hex(character, 2);
	append(buffer, hexBuffer.characters()[0]);
	append(buffer, hexBuffer.characters()[1]);
	}
	}
	}

	static void appendFormURLEncoded(Vector<char>& buffer, const Vector<uint8_t>& string)
	{
	appendFormURLEncoded(buffer, string.data(), string.size());
	}

	Vector<char> generateUniqueBoundaryString()
	{
	Vector<char> boundary;

	// The RFC 2046 spec says the alphanumeric characters plus the
	// following characters are legal for boundaries: '()+_,-./:=?
	// However the following characters, though legal, cause some sites
	// to fail: (),./:=+
	// Note that our algorithm makes it twice as much likely for 'A' or 'B'
	// to appear in the boundary string, because 0x41 and 0x42 are present in
	// the below array twice.
	static const char alphaNumericEncodingMap[64] = {
	0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48,
	0x49, 0x4A, 0x4B, 0x4C, 0x4D, 0x4E, 0x4F, 0x50,
	0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58,
	0x59, 0x5A, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66,
	0x67, 0x68, 0x69, 0x6A, 0x6B, 0x6C, 0x6D, 0x6E,
	0x6F, 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76,
	0x77, 0x78, 0x79, 0x7A, 0x30, 0x31, 0x32, 0x33,
	0x34, 0x35, 0x36, 0x37, 0x38, 0x39, 0x41, 0x42
	};

	// Start with an informative prefix.
	append(boundary, "----WebKitFormBoundary");

	// Append 16 random 7bit ascii AlphaNumeric characters.
	Vector<char> randomBytes;

	for (unsigned i = 0; i < 4; ++i) {
	unsigned randomness = static_cast<unsigned>(randomNumber() * (std::numeric_limits<unsigned>::max() + 1.0));
	randomBytes.append(alphaNumericEncodingMap[(randomness >> 24) & 0x3F]);
	randomBytes.append(alphaNumericEncodingMap[(randomness >> 16) & 0x3F]);
	randomBytes.append(alphaNumericEncodingMap[(randomness >> 8) & 0x3F]);
	randomBytes.append(alphaNumericEncodingMap[randomness & 0x3F]);
	}

	boundary.appendVector(randomBytes);
	boundary.append(0); // Add a 0 at the end so we can use this as a C-style string.
	return boundary;
	}

	void beginMultiPartHeader(Vector<char>& buffer, const CString& boundary, const Vector<uint8_t>& name)
	{
	addBoundaryToMultiPartHeader(buffer, boundary);

	// FIXME: This loses data irreversibly if the input name includes characters you can't encode
	// in the website's character set.
	append(buffer, "Content-Disposition: form-data; name=\"");
	appendQuoted(buffer, name);
	append(buffer, '"');
	}

	void addBoundaryToMultiPartHeader(Vector<char>& buffer, const CString& boundary, bool isLastBoundary)
	{
	append(buffer, "--");
	append(buffer, boundary);

	if (isLastBoundary)
	append(buffer, "--");

	append(buffer, "\r\n");
	}

	void addFilenameToMultiPartHeader(Vector<char>& buffer, const TextEncoding& encoding, const String& filename)
	{
	// FIXME: This loses data irreversibly if the filename includes characters you can't encode
	// in the website's character set.
	append(buffer, "; filename=\"");
	appendQuoted(buffer, encoding.encode(filename, UnencodableHandling::QuestionMarks));
	append(buffer, '"');
	}

	void addContentTypeToMultiPartHeader(Vector<char>& buffer, const CString& mimeType)
	{
	ASSERT(Blob::isNormalizedContentType(mimeType));
	append(buffer, "\r\nContent-Type: ");
	append(buffer, mimeType);
	}

	void finishMultiPartHeader(Vector<char>& buffer)
	{
	append(buffer, "\r\n\r\n");
	}

	void addKeyValuePairAsFormData(Vector<char>& buffer, const Vector<uint8_t>& key, const Vector<uint8_t>& value, FormData::EncodingType encodingType)
	{
	if (encodingType == FormData::TextPlain) {
	if (!buffer.isEmpty())
	append(buffer, "\r\n");
	append(buffer, key);
	append(buffer, '=');
	append(buffer, value);
	} else {
	if (!buffer.isEmpty())
	append(buffer, '&');
	appendFormURLEncoded(buffer, key);
	append(buffer, '=');
	appendFormURLEncoded(buffer, value);
	}
	}

	void encodeStringAsFormData(Vector<char>& buffer, const CString& string)
	{
	appendFormURLEncoded(buffer, reinterpret_cast<const uint8_t*>(string.data()), string.length());
	}

	}

	}