| /* |
| * Copyright (C) 2006-2017 Apple Inc. All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * 1. Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * 2. Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in the |
| * documentation and/or other materials provided with the distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY |
| * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
| * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR |
| * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
| * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY |
| * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #import "config.h" |
| #import "WebContentReader.h" |
| |
| #import "ArchiveResource.h" |
| #import "Blob.h" |
| #import "BlobURL.h" |
| #import "CachedResourceLoader.h" |
| #import "CustomHeaderFields.h" |
| #import "DOMURL.h" |
| #import "Document.h" |
| #import "DocumentFragment.h" |
| #import "DocumentLoader.h" |
| #import "Editor.h" |
| #import "EditorClient.h" |
| #import "File.h" |
| #import "Frame.h" |
| #import "FrameLoader.h" |
| #import "FrameLoaderClient.h" |
| #import "HTMLAnchorElement.h" |
| #import "HTMLAttachmentElement.h" |
| #import "HTMLBRElement.h" |
| #import "HTMLBodyElement.h" |
| #import "HTMLDivElement.h" |
| #import "HTMLIFrameElement.h" |
| #import "HTMLImageElement.h" |
| #import "HTMLObjectElement.h" |
| #import "LegacyWebArchive.h" |
| #import "MIMETypeRegistry.h" |
| #import "Page.h" |
| #import "PublicURLManager.h" |
| #import "RenderView.h" |
| #import "RuntimeEnabledFeatures.h" |
| #import "SerializedAttachmentData.h" |
| #import "Settings.h" |
| #import "SocketProvider.h" |
| #import "TypedElementDescendantIterator.h" |
| #import "UTIUtilities.h" |
| #import "WebArchiveResourceFromNSAttributedString.h" |
| #import "WebArchiveResourceWebResourceHandler.h" |
| #import "WebNSAttributedStringExtras.h" |
| #import "markup.h" |
| #import <pal/spi/cocoa/NSAttributedStringSPI.h> |
| #import <wtf/FileSystem.h> |
| #import <wtf/SoftLinking.h> |
| #import <wtf/URLParser.h> |
| |
| #if PLATFORM(MAC) |
| #include "LocalDefaultSystemAppearance.h" |
| #endif |
| |
| #if (PLATFORM(IOS_FAMILY) && __IPHONE_OS_VERSION_MIN_REQUIRED >= 110000) || PLATFORM(MAC) |
| @interface NSAttributedString () |
| - (NSString *)_htmlDocumentFragmentString:(NSRange)range documentAttributes:(NSDictionary *)dict subresources:(NSArray **)subresources; |
| @end |
| #elif PLATFORM(IOS_FAMILY) |
| SOFT_LINK_PRIVATE_FRAMEWORK(WebKitLegacy) |
| #elif PLATFORM(MAC) |
| SOFT_LINK_FRAMEWORK_IN_UMBRELLA(WebKit, WebKitLegacy) |
| #endif |
| |
| #if (PLATFORM(IOS_FAMILY) && __IPHONE_OS_VERSION_MIN_REQUIRED < 110000) |
| SOFT_LINK(WebKitLegacy, _WebCreateFragment, void, (WebCore::Document& document, NSAttributedString *string, WebCore::FragmentAndResources& result), (document, string, result)) |
| #endif |
| |
| namespace WebCore { |
| |
| #if PLATFORM(MACCATALYST) |
| |
| static FragmentAndResources createFragment(Frame&, NSAttributedString *) |
| { |
| return { }; |
| } |
| |
| #elif (PLATFORM(IOS_FAMILY) && __IPHONE_OS_VERSION_MIN_REQUIRED >= 110000) || PLATFORM(MAC) |
| |
| static NSDictionary *attributesForAttributedStringConversion() |
| { |
| // This function needs to be kept in sync with identically named one in WebKitLegacy, which is used on older OS versions. |
| RetainPtr<NSMutableArray> excludedElements = adoptNS([[NSMutableArray alloc] initWithObjects: |
| // Omit style since we want style to be inline so the fragment can be easily inserted. |
| @"style", |
| // Omit xml so the result is not XHTML. |
| @"xml", |
| // Omit tags that will get stripped when converted to a fragment anyway. |
| @"doctype", @"html", @"head", @"body", |
| // Omit deprecated tags. |
| @"applet", @"basefont", @"center", @"dir", @"font", @"menu", @"s", @"strike", @"u", |
| #if !ENABLE(ATTACHMENT_ELEMENT) |
| // Omit object so no file attachments are part of the fragment. |
| @"object", |
| #endif |
| nil]); |
| |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| if (!RuntimeEnabledFeatures::sharedFeatures().attachmentElementEnabled()) |
| [excludedElements addObject:@"object"]; |
| #endif |
| |
| #if PLATFORM(IOS_FAMILY) |
| static NSString * const NSExcludedElementsDocumentAttribute = @"ExcludedElements"; |
| #endif |
| |
| NSURL *baseURL = URL::fakeURLWithRelativePart(emptyString()); |
| |
| // The output base URL needs +1 refcount to work around the fact that NSHTMLReader over-releases it. |
| CFRetain((__bridge CFTypeRef)baseURL); |
| |
| return @{ |
| NSExcludedElementsDocumentAttribute: excludedElements.get(), |
| @"InterchangeNewline": @YES, |
| @"CoalesceTabSpans": @YES, |
| @"OutputBaseURL": baseURL, |
| @"WebResourceHandler": [[WebArchiveResourceWebResourceHandler new] autorelease], |
| }; |
| } |
| |
| static FragmentAndResources createFragment(Frame& frame, NSAttributedString *string) |
| { |
| FragmentAndResources result; |
| Document& document = *frame.document(); |
| |
| #if PLATFORM(MAC) |
| auto* view = frame.view(); |
| LocalDefaultSystemAppearance localAppearance(view ? view->useDarkAppearance() : false); |
| #endif |
| |
| NSArray *subresources = nil; |
| NSString *fragmentString = [string _htmlDocumentFragmentString:NSMakeRange(0, [string length]) documentAttributes:attributesForAttributedStringConversion() subresources:&subresources]; |
| auto fragment = DocumentFragment::create(document); |
| fragment->parseHTML(fragmentString, document.body(), DisallowScriptingAndPluginContent); |
| |
| result.fragment = WTFMove(fragment); |
| for (WebArchiveResourceFromNSAttributedString *resource in subresources) |
| result.resources.append(*resource->resource); |
| |
| return result; |
| } |
| |
| #else |
| |
| static FragmentAndResources createFragment(Frame& frame, NSAttributedString *string) |
| { |
| FragmentAndResources result; |
| _WebCreateFragment(*frame.document(), string, result); |
| return result; |
| } |
| |
| #endif |
| |
| class DeferredLoadingScope { |
| public: |
| DeferredLoadingScope(Frame& frame) |
| : m_frame(frame) |
| , m_cachedResourceLoader(frame.document()->cachedResourceLoader()) |
| { |
| if (!frame.page()->defersLoading()) { |
| frame.page()->setDefersLoading(true); |
| m_didEnabledDeferredLoading = true; |
| } |
| |
| if (m_cachedResourceLoader->imagesEnabled()) { |
| m_cachedResourceLoader->setImagesEnabled(false); |
| m_didDisableImage = true; |
| } |
| } |
| |
| ~DeferredLoadingScope() |
| { |
| if (m_didDisableImage) |
| m_cachedResourceLoader->setImagesEnabled(true); |
| if (m_didEnabledDeferredLoading) |
| m_frame->page()->setDefersLoading(false); |
| } |
| |
| private: |
| Ref<Frame> m_frame; |
| Ref<CachedResourceLoader> m_cachedResourceLoader; |
| bool m_didEnabledDeferredLoading { false }; |
| bool m_didDisableImage { false }; |
| }; |
| |
| |
| static bool shouldReplaceSubresourceURL(const URL& url) |
| { |
| return !(url.protocolIsInHTTPFamily() || url.protocolIsData()); |
| } |
| |
| static bool shouldReplaceRichContentWithAttachments() |
| { |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| return RuntimeEnabledFeatures::sharedFeatures().attachmentElementEnabled(); |
| #else |
| return false; |
| #endif |
| } |
| |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| |
| static String mimeTypeFromContentType(const String& contentType) |
| { |
| if (contentType == String(kUTTypeVCard)) { |
| // CoreServices erroneously reports that "public.vcard" maps to "text/directory", rather |
| // than either "text/vcard" or "text/x-vcard". Work around this by special casing the |
| // "public.vcard" UTI type. See <rdar://problem/49478229> for more detail. |
| return "text/vcard"_s; |
| } |
| return isDeclaredUTI(contentType) ? MIMETypeFromUTI(contentType) : contentType; |
| } |
| |
| static bool contentTypeIsSuitableForInlineImageRepresentation(const String& contentType) |
| { |
| return MIMETypeRegistry::isSupportedImageMIMEType(mimeTypeFromContentType(contentType)); |
| } |
| |
| static bool supportsClientSideAttachmentData(const Frame& frame) |
| { |
| if (auto* client = frame.editor().client()) |
| return client->supportsClientSideAttachmentData(); |
| |
| return false; |
| } |
| |
| #endif |
| |
| static Ref<DocumentFragment> createFragmentForImageAttachment(Frame& frame, Document& document, Ref<SharedBuffer>&& buffer, const String& contentType, PresentationSize preferredSize) |
| { |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| auto attachment = HTMLAttachmentElement::create(HTMLNames::attachmentTag, document); |
| // FIXME: This fallback image name needs to be a localized string. |
| String defaultImageAttachmentName { "image"_s }; |
| |
| auto fragment = document.createDocumentFragment(); |
| if (supportsClientSideAttachmentData(frame)) { |
| frame.editor().registerAttachmentIdentifier(attachment->ensureUniqueIdentifier(), contentType, defaultImageAttachmentName, WTFMove(buffer)); |
| if (contentTypeIsSuitableForInlineImageRepresentation(contentType)) { |
| auto image = HTMLImageElement::create(document); |
| image->setAttributeWithoutSynchronization(HTMLNames::srcAttr, DOMURL::createObjectURL(document, Blob::create(buffer.get(), contentType))); |
| image->setAttachmentElement(WTFMove(attachment)); |
| if (preferredSize.width) |
| image->setAttributeWithoutSynchronization(HTMLNames::widthAttr, AtomString::number(*preferredSize.width)); |
| if (preferredSize.height) |
| image->setAttributeWithoutSynchronization(HTMLNames::heightAttr, AtomString::number(*preferredSize.height)); |
| fragment->appendChild(WTFMove(image)); |
| } else { |
| attachment->updateAttributes(buffer->size(), contentType, defaultImageAttachmentName); |
| fragment->appendChild(WTFMove(attachment)); |
| } |
| } else { |
| attachment->setFile(File::create(Blob::create(buffer.get(), contentType), defaultImageAttachmentName), HTMLAttachmentElement::UpdateDisplayAttributes::Yes); |
| fragment->appendChild(WTFMove(attachment)); |
| } |
| return fragment; |
| #else |
| UNUSED_PARAM(blob); |
| return document.createDocumentFragment(); |
| #endif |
| } |
| |
| static void replaceRichContentWithAttachments(Frame& frame, DocumentFragment& fragment, const Vector<Ref<ArchiveResource>>& subresources) |
| { |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| struct AttachmentInsertionInfo { |
| String fileName; |
| String contentType; |
| Ref<SharedBuffer> data; |
| Ref<Element> originalElement; |
| }; |
| |
| ASSERT(RuntimeEnabledFeatures::sharedFeatures().attachmentElementEnabled()); |
| if (subresources.isEmpty()) |
| return; |
| |
| // FIXME: Handle resources in subframe archives. |
| HashMap<AtomString, Ref<ArchiveResource>> urlToResourceMap; |
| for (auto& subresource : subresources) { |
| auto& url = subresource->url(); |
| if (shouldReplaceSubresourceURL(url)) |
| urlToResourceMap.set(url.string(), subresource.copyRef()); |
| } |
| |
| Vector<SerializedAttachmentData> serializedAttachmentData; |
| for (auto& attachment : descendantsOfType<HTMLAttachmentElement>(fragment)) { |
| auto resourceURL = HTMLAttachmentElement::archiveResourceURL(attachment.uniqueIdentifier()); |
| auto resourceEntry = urlToResourceMap.find(resourceURL.string()); |
| if (resourceEntry == urlToResourceMap.end()) |
| continue; |
| |
| auto& resource = resourceEntry->value; |
| serializedAttachmentData.append({ attachment.uniqueIdentifier(), resource->mimeType(), resource->data() }); |
| } |
| |
| if (!serializedAttachmentData.isEmpty()) |
| frame.editor().registerAttachments(WTFMove(serializedAttachmentData)); |
| |
| Vector<Ref<Element>> elementsToRemove; |
| Vector<AttachmentInsertionInfo> attachmentInsertionInfo; |
| for (auto& image : descendantsOfType<HTMLImageElement>(fragment)) { |
| auto resourceURLString = image.attributeWithoutSynchronization(HTMLNames::srcAttr); |
| if (resourceURLString.isEmpty()) |
| continue; |
| |
| auto resource = urlToResourceMap.find(resourceURLString); |
| if (resource == urlToResourceMap.end()) |
| continue; |
| |
| auto name = image.attributeWithoutSynchronization(HTMLNames::altAttr); |
| if (name.isEmpty()) |
| name = URL({ }, resourceURLString).lastPathComponent(); |
| if (name.isEmpty()) |
| name = AtomString("media"); |
| |
| attachmentInsertionInfo.append({ name, resource->value->mimeType(), resource->value->data(), image }); |
| } |
| |
| for (auto& object : descendantsOfType<HTMLObjectElement>(fragment)) { |
| auto resourceURLString = object.attributeWithoutSynchronization(HTMLNames::dataAttr); |
| if (resourceURLString.isEmpty()) { |
| elementsToRemove.append(object); |
| continue; |
| } |
| |
| auto resource = urlToResourceMap.find(resourceURLString); |
| if (resource == urlToResourceMap.end()) |
| continue; |
| |
| auto name = URL({ }, resourceURLString).lastPathComponent(); |
| if (name.isEmpty()) |
| name = AtomString("file"); |
| |
| attachmentInsertionInfo.append({ name, resource->value->mimeType(), resource->value->data(), object }); |
| } |
| |
| for (auto& info : attachmentInsertionInfo) { |
| auto originalElement = WTFMove(info.originalElement); |
| auto parent = makeRefPtr(originalElement->parentNode()); |
| if (!parent) |
| continue; |
| |
| auto attachment = HTMLAttachmentElement::create(HTMLNames::attachmentTag, fragment.document()); |
| if (supportsClientSideAttachmentData(frame)) { |
| if (is<HTMLImageElement>(originalElement.get()) && contentTypeIsSuitableForInlineImageRepresentation(info.contentType)) { |
| auto& image = downcast<HTMLImageElement>(originalElement.get()); |
| image.setAttributeWithoutSynchronization(HTMLNames::srcAttr, DOMURL::createObjectURL(*frame.document(), Blob::create(info.data, info.contentType))); |
| image.setAttachmentElement(attachment.copyRef()); |
| } else { |
| attachment->updateAttributes(info.data->size(), info.contentType, info.fileName); |
| parent->replaceChild(attachment, WTFMove(originalElement)); |
| } |
| frame.editor().registerAttachmentIdentifier(attachment->ensureUniqueIdentifier(), WTFMove(info.contentType), WTFMove(info.fileName), WTFMove(info.data)); |
| } else { |
| attachment->setFile(File::create(Blob::create(WTFMove(info.data), WTFMove(info.contentType)), WTFMove(info.fileName)), HTMLAttachmentElement::UpdateDisplayAttributes::Yes); |
| parent->replaceChild(WTFMove(attachment), WTFMove(originalElement)); |
| } |
| } |
| |
| for (auto& elementToRemove : elementsToRemove) |
| elementToRemove->remove(); |
| #else |
| UNUSED_PARAM(fragment); |
| UNUSED_PARAM(subresources); |
| #endif |
| } |
| |
| RefPtr<DocumentFragment> createFragmentAndAddResources(Frame& frame, NSAttributedString *string) |
| { |
| if (!frame.page() || !frame.document()) |
| return nullptr; |
| |
| auto& document = *frame.document(); |
| if (!document.isHTMLDocument() || !string) |
| return nullptr; |
| |
| DeferredLoadingScope scope(frame); |
| auto fragmentAndResources = createFragment(frame, string); |
| if (!fragmentAndResources.fragment) |
| return nullptr; |
| |
| if (!RuntimeEnabledFeatures::sharedFeatures().customPasteboardDataEnabled()) { |
| if (DocumentLoader* loader = frame.loader().documentLoader()) { |
| for (auto& resource : fragmentAndResources.resources) |
| loader->addArchiveResource(resource.copyRef()); |
| } |
| return WTFMove(fragmentAndResources.fragment); |
| } |
| |
| if (shouldReplaceRichContentWithAttachments()) { |
| replaceRichContentWithAttachments(frame, *fragmentAndResources.fragment, fragmentAndResources.resources); |
| return WTFMove(fragmentAndResources.fragment); |
| } |
| |
| HashMap<AtomString, AtomString> blobURLMap; |
| for (const Ref<ArchiveResource>& subresource : fragmentAndResources.resources) { |
| auto blob = Blob::create(subresource->data(), subresource->mimeType()); |
| String blobURL = DOMURL::createObjectURL(document, blob); |
| blobURLMap.set(subresource->url().string(), blobURL); |
| } |
| |
| replaceSubresourceURLs(*fragmentAndResources.fragment, WTFMove(blobURLMap)); |
| return WTFMove(fragmentAndResources.fragment); |
| } |
| |
| struct MarkupAndArchive { |
| String markup; |
| Ref<ArchiveResource> mainResource; |
| Ref<Archive> archive; |
| }; |
| |
| static Optional<MarkupAndArchive> extractMarkupAndArchive(SharedBuffer& buffer, const std::function<bool(const String)>& canShowMIMETypeAsHTML) |
| { |
| auto archive = LegacyWebArchive::create(URL(), buffer); |
| if (!archive) |
| return WTF::nullopt; |
| |
| RefPtr<ArchiveResource> mainResource = archive->mainResource(); |
| if (!mainResource) |
| return WTF::nullopt; |
| |
| auto type = mainResource->mimeType(); |
| if (!canShowMIMETypeAsHTML(type)) |
| return WTF::nullopt; |
| |
| return MarkupAndArchive { String::fromUTF8(mainResource->data().data(), mainResource->data().size()), mainResource.releaseNonNull(), archive.releaseNonNull() }; |
| } |
| |
| static String sanitizeMarkupWithArchive(Frame& frame, Document& destinationDocument, MarkupAndArchive& markupAndArchive, MSOListQuirks msoListQuirks, const std::function<bool(const String)>& canShowMIMETypeAsHTML) |
| { |
| auto page = createPageForSanitizingWebContent(); |
| Document* stagingDocument = page->mainFrame().document(); |
| ASSERT(stagingDocument); |
| auto fragment = createFragmentFromMarkup(*stagingDocument, markupAndArchive.markup, markupAndArchive.mainResource->url(), DisallowScriptingAndPluginContent); |
| |
| if (shouldReplaceRichContentWithAttachments()) { |
| replaceRichContentWithAttachments(frame, fragment, markupAndArchive.archive->subresources()); |
| return sanitizedMarkupForFragmentInDocument(WTFMove(fragment), *stagingDocument, msoListQuirks, markupAndArchive.markup); |
| } |
| |
| HashMap<AtomString, AtomString> blobURLMap; |
| for (const Ref<ArchiveResource>& subresource : markupAndArchive.archive->subresources()) { |
| auto& subresourceURL = subresource->url(); |
| if (!shouldReplaceSubresourceURL(subresourceURL)) |
| continue; |
| auto blob = Blob::create(subresource->data(), subresource->mimeType()); |
| String blobURL = DOMURL::createObjectURL(destinationDocument, blob); |
| blobURLMap.set(subresourceURL.string(), blobURL); |
| } |
| |
| auto contentOrigin = SecurityOrigin::create(markupAndArchive.mainResource->url()); |
| for (const Ref<Archive>& subframeArchive : markupAndArchive.archive->subframeArchives()) { |
| RefPtr<ArchiveResource> subframeMainResource = subframeArchive->mainResource(); |
| if (!subframeMainResource) |
| continue; |
| |
| auto type = subframeMainResource->mimeType(); |
| if (!canShowMIMETypeAsHTML(type)) |
| continue; |
| |
| auto subframeURL = subframeMainResource->url(); |
| if (!shouldReplaceSubresourceURL(subframeURL)) |
| continue; |
| |
| MarkupAndArchive subframeContent = { String::fromUTF8(subframeMainResource->data().data(), subframeMainResource->data().size()), |
| subframeMainResource.releaseNonNull(), subframeArchive.copyRef() }; |
| auto subframeMarkup = sanitizeMarkupWithArchive(frame, destinationDocument, subframeContent, MSOListQuirks::Disabled, canShowMIMETypeAsHTML); |
| |
| CString utf8 = subframeMarkup.utf8(); |
| Vector<uint8_t> blobBuffer; |
| blobBuffer.reserveCapacity(utf8.length()); |
| blobBuffer.append(reinterpret_cast<const uint8_t*>(utf8.data()), utf8.length()); |
| auto blob = Blob::create(WTFMove(blobBuffer), type); |
| |
| String subframeBlobURL = DOMURL::createObjectURL(destinationDocument, blob); |
| blobURLMap.set(subframeURL.string(), subframeBlobURL); |
| } |
| |
| replaceSubresourceURLs(fragment.get(), WTFMove(blobURLMap)); |
| |
| return sanitizedMarkupForFragmentInDocument(WTFMove(fragment), *stagingDocument, msoListQuirks, markupAndArchive.markup); |
| } |
| |
| bool WebContentReader::readWebArchive(SharedBuffer& buffer) |
| { |
| if (frame.settings().preferMIMETypeForImages() || !frame.document()) |
| return false; |
| |
| DeferredLoadingScope scope(frame); |
| auto result = extractMarkupAndArchive(buffer, [&] (const String& type) { |
| return frame.loader().client().canShowMIMETypeAsHTML(type); |
| }); |
| if (!result) |
| return false; |
| |
| if (!RuntimeEnabledFeatures::sharedFeatures().customPasteboardDataEnabled()) { |
| fragment = createFragmentFromMarkup(*frame.document(), result->markup, result->mainResource->url(), DisallowScriptingAndPluginContent); |
| if (DocumentLoader* loader = frame.loader().documentLoader()) |
| loader->addAllArchiveResources(result->archive.get()); |
| return true; |
| } |
| |
| if (!shouldSanitize()) { |
| fragment = createFragmentFromMarkup(*frame.document(), result->markup, result->mainResource->url(), DisallowScriptingAndPluginContent); |
| return true; |
| } |
| |
| String sanitizedMarkup = sanitizeMarkupWithArchive(frame, *frame.document(), *result, msoListQuirksForMarkup(), [&] (const String& type) { |
| return frame.loader().client().canShowMIMETypeAsHTML(type); |
| }); |
| fragment = createFragmentFromMarkup(*frame.document(), sanitizedMarkup, WTF::blankURL(), DisallowScriptingAndPluginContent); |
| |
| if (!fragment) |
| return false; |
| |
| return true; |
| } |
| |
| bool WebContentMarkupReader::readWebArchive(SharedBuffer& buffer) |
| { |
| if (!frame.document()) |
| return false; |
| |
| auto result = extractMarkupAndArchive(buffer, [&] (const String& type) { |
| return frame.loader().client().canShowMIMETypeAsHTML(type); |
| }); |
| if (!result) |
| return false; |
| |
| if (!shouldSanitize()) { |
| markup = result->markup; |
| return true; |
| } |
| |
| markup = sanitizeMarkupWithArchive(frame, *frame.document(), *result, msoListQuirksForMarkup(), [&] (const String& type) { |
| return frame.loader().client().canShowMIMETypeAsHTML(type); |
| }); |
| |
| return true; |
| } |
| |
| static String stripMicrosoftPrefix(const String& string) |
| { |
| #if PLATFORM(MAC) |
| // This code was added to make HTML paste from Microsoft Word on Mac work, back in 2004. |
| // It's a simple-minded way to ignore the CF_HTML clipboard format, just skipping over the |
| // description part and parsing the entire context plus fragment. |
| if (string.startsWith("Version:")) { |
| size_t location = string.findIgnoringASCIICase("<html"); |
| if (location != notFound) |
| return string.substring(location); |
| } |
| #endif |
| return string; |
| } |
| |
| bool WebContentReader::readHTML(const String& string) |
| { |
| if (frame.settings().preferMIMETypeForImages() || !frame.document()) |
| return false; |
| Document& document = *frame.document(); |
| |
| String stringOmittingMicrosoftPrefix = stripMicrosoftPrefix(string); |
| if (stringOmittingMicrosoftPrefix.isEmpty()) |
| return false; |
| |
| String markup; |
| if (RuntimeEnabledFeatures::sharedFeatures().customPasteboardDataEnabled() && shouldSanitize()) { |
| markup = sanitizeMarkup(stringOmittingMicrosoftPrefix, msoListQuirksForMarkup(), WTF::Function<void (DocumentFragment&)> { [] (DocumentFragment& fragment) { |
| removeSubresourceURLAttributes(fragment, [] (const URL& url) { |
| return shouldReplaceSubresourceURL(url); |
| }); |
| } }); |
| } else |
| markup = stringOmittingMicrosoftPrefix; |
| |
| addFragment(createFragmentFromMarkup(document, markup, emptyString(), DisallowScriptingAndPluginContent)); |
| return true; |
| } |
| |
| bool WebContentMarkupReader::readHTML(const String& string) |
| { |
| if (!frame.document()) |
| return false; |
| |
| String rawHTML = stripMicrosoftPrefix(string); |
| if (shouldSanitize()) { |
| markup = sanitizeMarkup(rawHTML, msoListQuirksForMarkup(), WTF::Function<void (DocumentFragment&)> { [] (DocumentFragment& fragment) { |
| removeSubresourceURLAttributes(fragment, [] (const URL& url) { |
| return shouldReplaceSubresourceURL(url); |
| }); |
| } }); |
| } else |
| markup = rawHTML; |
| |
| return !markup.isEmpty(); |
| } |
| |
| bool WebContentReader::readRTFD(SharedBuffer& buffer) |
| { |
| if (frame.settings().preferMIMETypeForImages() || !frame.document()) |
| return false; |
| |
| auto string = adoptNS([[NSAttributedString alloc] initWithRTFD:buffer.createNSData().get() documentAttributes:nullptr]); |
| auto fragment = createFragmentAndAddResources(frame, string.get()); |
| if (!fragment) |
| return false; |
| addFragment(fragment.releaseNonNull()); |
| |
| return true; |
| } |
| |
| bool WebContentMarkupReader::readRTFD(SharedBuffer& buffer) |
| { |
| if (!frame.document()) |
| return false; |
| auto string = adoptNS([[NSAttributedString alloc] initWithRTFD:buffer.createNSData().get() documentAttributes:nullptr]); |
| auto fragment = createFragmentAndAddResources(frame, string.get()); |
| if (!fragment) |
| return false; |
| |
| markup = serializeFragment(*fragment, SerializedNodes::SubtreeIncludingNode); |
| return true; |
| } |
| |
| bool WebContentReader::readRTF(SharedBuffer& buffer) |
| { |
| if (frame.settings().preferMIMETypeForImages()) |
| return false; |
| |
| auto string = adoptNS([[NSAttributedString alloc] initWithRTF:buffer.createNSData().get() documentAttributes:nullptr]); |
| auto fragment = createFragmentAndAddResources(frame, string.get()); |
| if (!fragment) |
| return false; |
| addFragment(fragment.releaseNonNull()); |
| |
| return true; |
| } |
| |
| bool WebContentMarkupReader::readRTF(SharedBuffer& buffer) |
| { |
| if (!frame.document()) |
| return false; |
| auto string = adoptNS([[NSAttributedString alloc] initWithRTF:buffer.createNSData().get() documentAttributes:nullptr]); |
| auto fragment = createFragmentAndAddResources(frame, string.get()); |
| if (!fragment) |
| return false; |
| markup = serializeFragment(*fragment, SerializedNodes::SubtreeIncludingNode); |
| return true; |
| } |
| |
| bool WebContentReader::readPlainText(const String& text) |
| { |
| if (!allowPlainText) |
| return false; |
| |
| addFragment(createFragmentFromText(context, [text precomposedStringWithCanonicalMapping])); |
| |
| madeFragmentFromPlainText = true; |
| return true; |
| } |
| |
| bool WebContentReader::readImage(Ref<SharedBuffer>&& buffer, const String& type, PresentationSize preferredPresentationSize) |
| { |
| ASSERT(frame.document()); |
| auto& document = *frame.document(); |
| if (shouldReplaceRichContentWithAttachments()) |
| addFragment(createFragmentForImageAttachment(frame, document, WTFMove(buffer), type, preferredPresentationSize)); |
| else |
| addFragment(createFragmentForImageAndURL(document, DOMURL::createObjectURL(document, Blob::create(buffer.get(), type)), preferredPresentationSize)); |
| |
| return fragment; |
| } |
| |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| |
| static String typeForAttachmentElement(const String& contentType) |
| { |
| if (contentType.isEmpty()) |
| return { }; |
| |
| auto mimeType = mimeTypeFromContentType(contentType); |
| return mimeType.isEmpty() ? contentType : mimeType; |
| } |
| |
| static Ref<HTMLElement> attachmentForFilePath(Frame& frame, const String& path, PresentationSize preferredSize, const String& explicitContentType) |
| { |
| auto document = makeRef(*frame.document()); |
| auto attachment = HTMLAttachmentElement::create(HTMLNames::attachmentTag, document); |
| if (!supportsClientSideAttachmentData(frame)) { |
| attachment->setFile(File::create(path), HTMLAttachmentElement::UpdateDisplayAttributes::Yes); |
| return attachment; |
| } |
| |
| bool isDirectory = FileSystem::fileIsDirectory(path, FileSystem::ShouldFollowSymbolicLinks::Yes); |
| String contentType = typeForAttachmentElement(explicitContentType); |
| if (contentType.isEmpty()) { |
| if (isDirectory) |
| contentType = kUTTypeDirectory; |
| else { |
| contentType = File::contentTypeForFile(path); |
| if (contentType.isEmpty()) |
| contentType = kUTTypeData; |
| } |
| } |
| |
| Optional<uint64_t> fileSizeForDisplay; |
| if (!isDirectory) { |
| long long fileSize; |
| FileSystem::getFileSize(path, fileSize); |
| fileSizeForDisplay = fileSize; |
| } |
| |
| frame.editor().registerAttachmentIdentifier(attachment->ensureUniqueIdentifier(), contentType, path); |
| |
| if (contentTypeIsSuitableForInlineImageRepresentation(contentType)) { |
| auto image = HTMLImageElement::create(document); |
| image->setAttributeWithoutSynchronization(HTMLNames::srcAttr, DOMURL::createObjectURL(document, File::create(path))); |
| image->setAttachmentElement(WTFMove(attachment)); |
| if (preferredSize.width) |
| image->setAttributeWithoutSynchronization(HTMLNames::widthAttr, AtomString::number(*preferredSize.width)); |
| if (preferredSize.height) |
| image->setAttributeWithoutSynchronization(HTMLNames::heightAttr, AtomString::number(*preferredSize.height)); |
| return image; |
| } |
| |
| attachment->updateAttributes(WTFMove(fileSizeForDisplay), contentType, FileSystem::pathGetFileName(path)); |
| return attachment; |
| } |
| |
| static Ref<HTMLElement> attachmentForData(Frame& frame, SharedBuffer& buffer, const String& contentType, const String& name, PresentationSize preferredSize) |
| { |
| auto document = makeRef(*frame.document()); |
| auto attachment = HTMLAttachmentElement::create(HTMLNames::attachmentTag, document); |
| auto attachmentType = typeForAttachmentElement(contentType); |
| |
| // FIXME: We should instead ask CoreServices for a preferred name corresponding to the given content type. |
| static const char* defaultAttachmentName = "file"; |
| |
| String fileName; |
| if (name.isEmpty()) |
| fileName = defaultAttachmentName; |
| else |
| fileName = name; |
| |
| if (!supportsClientSideAttachmentData(frame)) { |
| attachment->setFile(File::create(Blob::create(buffer, WTFMove(attachmentType)), fileName)); |
| return attachment; |
| } |
| |
| frame.editor().registerAttachmentIdentifier(attachment->ensureUniqueIdentifier(), attachmentType, fileName, buffer); |
| |
| if (contentTypeIsSuitableForInlineImageRepresentation(attachmentType)) { |
| auto image = HTMLImageElement::create(document); |
| image->setAttributeWithoutSynchronization(HTMLNames::srcAttr, DOMURL::createObjectURL(document, File::create(Blob::create(buffer, WTFMove(attachmentType)), WTFMove(fileName)))); |
| image->setAttachmentElement(WTFMove(attachment)); |
| if (preferredSize.width) |
| image->setAttributeWithoutSynchronization(HTMLNames::widthAttr, AtomString::number(*preferredSize.width)); |
| if (preferredSize.height) |
| image->setAttributeWithoutSynchronization(HTMLNames::heightAttr, AtomString::number(*preferredSize.height)); |
| return image; |
| } |
| |
| attachment->updateAttributes({ buffer.size() }, WTFMove(attachmentType), WTFMove(fileName)); |
| return attachment; |
| } |
| |
| #endif // ENABLE(ATTACHMENT_ELEMENT) |
| |
| bool WebContentReader::readFilePath(const String& path, PresentationSize preferredPresentationSize, const String& contentType) |
| { |
| if (path.isEmpty() || !frame.document()) |
| return false; |
| |
| auto& document = *frame.document(); |
| if (!fragment) |
| fragment = document.createDocumentFragment(); |
| |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| if (RuntimeEnabledFeatures::sharedFeatures().attachmentElementEnabled()) |
| fragment->appendChild(attachmentForFilePath(frame, path, preferredPresentationSize, contentType)); |
| #endif |
| |
| return true; |
| } |
| |
| bool WebContentReader::readFilePaths(const Vector<String>& paths) |
| { |
| if (paths.isEmpty() || !frame.document()) |
| return false; |
| |
| for (auto& path : paths) |
| readFilePath(path); |
| |
| return true; |
| } |
| |
| bool WebContentReader::readURL(const URL& url, const String& title) |
| { |
| if (url.isEmpty()) |
| return false; |
| |
| #if PLATFORM(IOS_FAMILY) |
| // FIXME: This code shouldn't be accessing selection and changing the behavior. |
| if (!frame.editor().client()->hasRichlyEditableSelection()) { |
| if (readPlainText([(NSURL *)url absoluteString])) |
| return true; |
| } |
| |
| if ([(NSURL *)url isFileURL]) |
| return false; |
| #endif // PLATFORM(IOS_FAMILY) |
| |
| auto document = makeRef(*frame.document()); |
| auto anchor = HTMLAnchorElement::create(document.get()); |
| anchor->setAttributeWithoutSynchronization(HTMLNames::hrefAttr, url.string()); |
| |
| NSString *linkText = title.isEmpty() ? [(NSURL *)url absoluteString] : (NSString *)title; |
| anchor->appendChild(document->createTextNode([linkText precomposedStringWithCanonicalMapping])); |
| |
| auto newFragment = document->createDocumentFragment(); |
| if (fragment) |
| newFragment->appendChild(HTMLBRElement::create(document.get())); |
| newFragment->appendChild(anchor); |
| addFragment(WTFMove(newFragment)); |
| return true; |
| } |
| |
| bool WebContentReader::readDataBuffer(SharedBuffer& buffer, const String& type, const String& name, PresentationSize preferredPresentationSize) |
| { |
| if (buffer.isEmpty()) |
| return false; |
| |
| if (!shouldReplaceRichContentWithAttachments()) |
| return false; |
| |
| auto document = makeRefPtr(frame.document()); |
| if (!document) |
| return false; |
| |
| if (!fragment) |
| fragment = document->createDocumentFragment(); |
| |
| #if ENABLE(ATTACHMENT_ELEMENT) |
| fragment->appendChild(attachmentForData(frame, buffer, type, name, preferredPresentationSize)); |
| #else |
| UNUSED_PARAM(type); |
| UNUSED_PARAM(name); |
| #endif |
| return true; |
| } |
| |
| } |