// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include <string>

#include "base/basictypes.h"
#include "net/base/data_url.h"
#include "testing/gtest/include/gtest/gtest.h"
#include "url/gurl.h"

namespace {

// One row of the table-driven DataURLTest.Parse test: a URL to parse and the
// results the parse is expected to produce.
//
// This is a plain aggregate initialized positionally, so the order of the
// fields below must not change.
struct ParseTestData {
  // The URL string handed to the parser (wrapped in a GURL by the test).
  const char* url;
  // Whether parsing |url| is expected to succeed.
  bool is_valid;
  // Expected results. The test only compares these when |is_valid| is true;
  // rows for invalid URLs leave them as empty strings.
  const char* mime_type;
  const char* charset;
  const char* data;
};

}  // namespace

225821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)TEST(DataURLTest, Parse) {
235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  const ParseTestData tests[] = {
245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:",
255821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)       false,
265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)       "",
275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)       "",
285821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)       "" },
295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:,",
315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
325821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
335821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
345821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "" },
355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
365821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:;base64,",
375821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
385821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
395821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "" },
415821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:;charset=,test",
435821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
445821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
455821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
465821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "test" },
475821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
485821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:TeXt/HtMl,<b>x</b>",
495821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
505821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/html",
515821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
525821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "<b>x</b>" },
535821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
545821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:,foo",
555821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
565821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
575821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
585821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "foo" },
595821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
605821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:;base64,aGVsbG8gd29ybGQ=",
615821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
625821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
635821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
645821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "hello world" },
655821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
665821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:foo/bar;baz=1;charset=kk,boo",
675821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
685821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "foo/bar",
695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "kk",
705821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "boo" },
715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:foo/bar;charset=kk;baz=1,boo",
735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "foo/bar",
755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "kk",
765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "boo" },
775821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
785821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:text/html,%3Chtml%3E%3Cbody%3E%3Cb%3Ehello%20world"
795821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)          "%3C%2Fb%3E%3C%2Fbody%3E%3C%2Fhtml%3E",
805821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
815821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/html",
825821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
835821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "<html><body><b>hello world</b></body></html>" },
845821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
855821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:text/html,<html><body><b>hello world</b></body></html>",
865821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
875821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/html",
885821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
895821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "<html><body><b>hello world</b></body></html>" },
905821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
91cedac228d2dd51db4b79ea1e72c7f249408ee061Torne (Richard Coles)    // Bad mime type
92cedac228d2dd51db4b79ea1e72c7f249408ee061Torne (Richard Coles)    { "data:f(oo/bar;baz=1;charset=kk,boo",
93cedac228d2dd51db4b79ea1e72c7f249408ee061Torne (Richard Coles)      false,
94cedac228d2dd51db4b79ea1e72c7f249408ee061Torne (Richard Coles)      "",
95cedac228d2dd51db4b79ea1e72c7f249408ee061Torne (Richard Coles)      "",
96cedac228d2dd51db4b79ea1e72c7f249408ee061Torne (Richard Coles)      "" },
97cedac228d2dd51db4b79ea1e72c7f249408ee061Torne (Richard Coles)
985821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // the comma cannot be url-escaped!
995821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:%2Cblah",
1005821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      false,
1015821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "",
1025821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "",
1035821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "" },
1045821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1055821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // invalid base64 content
1065821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:;base64,aGVs_-_-",
1075821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      false,
1085821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "",
1095821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "",
1105821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "" },
1115821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1125821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Spaces should be removed from non-text data URLs (we already tested
1135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // spaces above).
1145821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { " bG8gd2  9ybGQ=",
1225821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
1235821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
1245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
1255821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "hello world" },
1265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Other whitespace should also be removed from anything base-64 encoded.
1285821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:;base64,aGVs bG8gd2  \n9ybGQ=",
1295821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
1305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
1315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
1325821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "hello world" },
1335821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1345821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // In base64 encoding, escaped whitespace should be stripped.
1355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // (This test was taken from acid3)
1365821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // http://b/1054495
1375821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:text/javascript;base64,%20ZD%20Qg%0D%0APS%20An%20Zm91cic%0D%0A%207"
1385821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)          "%20",
1395821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
1405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/javascript",
1415821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
1425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "d4 = 'four';" },
1435821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1445821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Only unescaped whitespace should be stripped in non-base64.
1455821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // http://b/1157796
1465821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:img/png,A  B  %20  %0A  C",
1475821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
1485821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "img/png",
1495821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
1505821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "AB \nC" },
1515821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1525821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:text/plain;charset=utf-8;base64,SGVsbMO2",
1535821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
1545821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
1555821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "utf-8",
1565821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "Hell\xC3\xB6" },
1575821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1585821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Not sufficiently padded.
1595821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:;base64,aGVsbG8gd29ybGQ",
1605821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      true,
1615821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "text/plain",
1625821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "US-ASCII",
1635821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "hello world" },
1645821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1655821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // Bad encoding (truncated).
1665821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    { "data:;base64,aGVsbG8gd29yb",
1675821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      false,
1685821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "",
1695821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "",
1705821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      "" },
1715821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1725821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    // TODO(darin): add more interesting tests
1735821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  };
1745821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
1755821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  for (size_t i = 0; i < arraysize(tests); ++i) {
1765821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    std::string mime_type;
1775821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    std::string charset;
1785821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    std::string data;
1795821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    bool ok =
1805821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)        net::DataURL::Parse(GURL(tests[i].url), &mime_type, &charset, &data);
1815821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    EXPECT_EQ(ok, tests[i].is_valid);
1825821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    if (tests[i].is_valid) {
1835821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      EXPECT_EQ(tests[i].mime_type, mime_type);
1845821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      EXPECT_EQ(tests[i].charset, charset);
1855821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)      EXPECT_EQ(tests[i].data, data);
1865821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    }
1875821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  }
1885821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
189