summaryrefslogtreecommitdiffstats
path: root/src/core/clipboard_util_win.cpp
blob: ae615b3b6ae5e2f81abfc7676dbf29532546946f (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
/*
 * Copyright (C) 2007, 2008 Apple Inc. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY APPLE COMPUTER, INC. ``AS IS'' AND ANY
 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL APPLE COMPUTER, INC. OR
 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
 * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE.Chromium file.

#include <cstdlib>
#include <cstring>
#include <string>

#include "base/strings/string_util.h"
#include "base/strings/stringprintf.h"

// These functions are copied from ui/base/clipboard/clipboard_util_win.cc

namespace QtWebEngineCore {

// Helper method for converting from text/html to MS CF_HTML.
// Documentation for the CF_HTML format is available at
// http://msdn.microsoft.com/en-us/library/aa767917(VS.85).aspx
// HtmlToCFHtml is based on similar method in
// WebCore/platform/win/ClipboardUtilitiesWin.cpp.
//
// |html| is the markup to wrap; an empty |html| yields an empty string.
// |base_url|, when non-empty, is emitted as a "SourceURL:" header line.
//
// Returns the CF_HTML text: a header holding four byte offsets (StartHTML,
// EndHTML, StartFragment, EndFragment), the optional SourceURL line, and
// |html| wrapped in <html>/<body> plus the Start/EndFragment comment markers.
std::string HtmlToCFHtml(const std::string &html, const std::string &base_url)
{
    if (html.empty())
        return std::string();

    // Offsets are written zero-padded to a fixed width so that the header
    // length is known before the offsets themselves have been computed.
    static constexpr size_t kOffsetDigits = 10;

    static constexpr char kVersionLine[] = "Version:0.9\r\n";
    static constexpr char kStartHtmlKey[] = "StartHTML:";
    static constexpr char kEndHtmlKey[] = "EndHTML:";
    static constexpr char kStartFragmentKey[] = "StartFragment:";
    static constexpr char kEndFragmentKey[] = "EndFragment:";
    static constexpr char kSourceUrlKey[] = "SourceURL:";
    static constexpr char kLineBreak[] = "\r\n";

    static constexpr char kStartMarkup[] = "<html>\r\n<body>\r\n<!--StartFragment-->";
    static constexpr char kEndMarkup[] = "<!--EndFragment-->\r\n</body>\r\n</html>";

    // Calculate offsets. sizeof() counts the terminating NUL, hence the "- 1".
    size_t start_html_offset = (sizeof(kVersionLine) - 1)
            + (sizeof(kStartHtmlKey) - 1) + (sizeof(kEndHtmlKey) - 1)
            + (sizeof(kStartFragmentKey) - 1) + (sizeof(kEndFragmentKey) - 1)
            + 4 * (kOffsetDigits + (sizeof(kLineBreak) - 1));
    if (!base_url.empty()) {
        start_html_offset += (sizeof(kSourceUrlKey) - 1) + base_url.length()
                + (sizeof(kLineBreak) - 1);
    }
    const size_t start_fragment_offset = start_html_offset + (sizeof(kStartMarkup) - 1);
    const size_t end_fragment_offset = start_fragment_offset + html.length();
    const size_t end_html_offset = end_fragment_offset + (sizeof(kEndMarkup) - 1);

    std::string result;
    result.reserve(end_html_offset);

    // Appends "<key><zero-padded offset>\r\n". std::to_string is used instead
    // of a printf-style "%u" conversion because the offsets are size_t, which
    // does not match "%u" when passed through varargs.
    const auto append_offset_line = [&result](const char *key, size_t offset) {
        const std::string digits = std::to_string(offset);
        result += key;
        if (digits.length() < kOffsetDigits)
            result.append(kOffsetDigits - digits.length(), '0');
        result += digits;
        result += kLineBreak;
    };

    result += kVersionLine;
    append_offset_line(kStartHtmlKey, start_html_offset);
    append_offset_line(kEndHtmlKey, end_html_offset);
    append_offset_line(kStartFragmentKey, start_fragment_offset);
    append_offset_line(kEndFragmentKey, end_fragment_offset);

    if (!base_url.empty()) {
        result += kSourceUrlKey;
        result += base_url;
        result += kLineBreak;
    }
    result += kStartMarkup;
    result += html;
    result += kEndMarkup;

    return result;
}

// Extracts the source URL and the markup/fragment offsets from CF_HTML text.
//
// |cf_html| is the complete CF_HTML payload. Every output pointer is optional;
// passing null skips that output.
//   |base_url|       receives the whitespace-trimmed text following
//                    "SourceURL:" up to the next '\n'. It is left untouched
//                    when that key or the terminating '\n' is missing.
//   |html_start|     receives the offset of the first "<html" (matched ASCII
//                    case-insensitively), or std::string::npos if absent.
//   |fragment_start| receives the offset at which the fragment begins.
//   |fragment_end|   receives the offset at which the fragment ends.
//
// When the "<!--StartFragment" comment is not found, the fragment offsets come
// from the "StartFragment:"/"EndFragment:" header values, and an output whose
// header key is missing is left untouched.
void CFHtmlExtractMetadata(const std::string &cf_html, std::string *base_url, size_t *html_start,
                           size_t *fragment_start, size_t *fragment_end)
{
    // Obtain base_url if present.
    if (base_url) {
        static constexpr char kSrcUrlStr[] = "SourceURL:";
        const size_t line_start = cf_html.find(kSrcUrlStr);
        if (line_start != std::string::npos) {
            const size_t src_start = line_start + (sizeof(kSrcUrlStr) - 1);
            const size_t src_end = cf_html.find('\n', src_start);
            if (src_end != std::string::npos) {
                *base_url = cf_html.substr(src_start, src_end - src_start);
                base::TrimWhitespaceASCII(*base_url, base::TRIM_ALL, base_url);
            }
        }
    }

    // Find the markup between "<!--StartFragment-->" and "<!--EndFragment-->".
    // If the comments cannot be found, like copying from OpenOffice Writer,
    // we simply fall back to using StartFragment/EndFragment bytecount values
    // to determine the fragment indexes.
    const std::string cf_html_lower = base::ToLowerASCII(cf_html);
    const size_t markup_start = cf_html_lower.find("<html", 0);
    if (html_start) {
        *html_start = markup_start;
    }

    // The marker is only searched for at or after the "<html" position, so a
    // payload without "<html" always takes the bytecount fallback.
    const size_t tag_start = cf_html.find("<!--StartFragment", markup_start);
    if (tag_start == std::string::npos) {
        // Parses the decimal value following |key| into |*out|. strtoll is
        // used because atoi has undefined behavior when the value overflows.
        // A negative value converts to a very large size_t, so "-1" yields
        // std::string::npos.
        const auto read_header_offset = [&cf_html](const char *key, size_t key_length,
                                                   size_t *out) {
            if (!out)
                return;
            const size_t key_pos = cf_html.find(key);
            if (key_pos == std::string::npos)
                return; // Key missing: leave |*out| untouched.
            *out = static_cast<size_t>(
                    std::strtoll(cf_html.c_str() + key_pos + key_length, nullptr, 10));
        };

        static constexpr char kStartFragmentStr[] = "StartFragment:";
        static constexpr char kEndFragmentStr[] = "EndFragment:";
        read_header_offset(kStartFragmentStr, sizeof(kStartFragmentStr) - 1, fragment_start);
        read_header_offset(kEndFragmentStr, sizeof(kEndFragmentStr) - 1, fragment_end);
    } else {
        if (fragment_start) {
            // The fragment begins right after the '>' closing the start
            // marker. Report npos for an unterminated marker; adding 1 to
            // npos would wrap around to offset 0.
            const size_t tag_close = cf_html.find('>', tag_start);
            *fragment_start =
                    tag_close == std::string::npos ? std::string::npos : tag_close + 1;
        }
        if (fragment_end) {
            // If the end marker is missing, |tag_end| is npos and the second
            // rfind yields the last '<' in the payload (npos if there is none).
            const size_t tag_end = cf_html.rfind("<!--EndFragment", std::string::npos);
            *fragment_end = cf_html.rfind('<', tag_end);
        }
    }
}

} // namespace QtWebEngineCore