[SCM] jsoup HTML parser branch, master, updated. debian/1.6.2-1-9-ge68369a
Emmanuel Bourg
ebourg at apache.org
Mon May 13 09:32:12 UTC 2013
The following commit has been merged in the master branch:
commit bcfcab61acf1ea8b3d882c595dcd5261ffb4b916
Author: Emmanuel Bourg <ebourg at apache.org>
Date: Mon May 13 10:32:06 2013 +0200
Refreshed the patch
diff --git a/debian/patches/dfsg-free-test-data.patch b/debian/patches/dfsg-free-test-data.patch
index b5a645f..266ceec 100644
--- a/debian/patches/dfsg-free-test-data.patch
+++ b/debian/patches/dfsg-free-test-data.patch
@@ -8,11 +8,17 @@ Subject: dfsg-free-test-data
2 files changed, 1192 insertions(+), 85 deletions(-)
create mode 100644 src/test/resources/htmltests/wikipedia-article-1.html
-diff --git a/src/test/java/org/jsoup/integration/ParseTest.java b/src/test/java/org/jsoup/integration/ParseTest.java
-index dc03973..d49e3e5 100644
--- a/src/test/java/org/jsoup/integration/ParseTest.java
+++ b/src/test/java/org/jsoup/integration/ParseTest.java
-@@ -19,50 +19,41 @@ import java.net.URISyntaxException;
+@@ -6,6 +6,7 @@
+ import org.jsoup.select.Elements;
+ import static org.junit.Assert.*;
+ import org.junit.Test;
++import org.junit.Ignore;
+
+ import java.io.File;
+ import java.io.IOException;
+@@ -19,50 +20,41 @@
public class ParseTest {
@Test
@@ -86,49 +92,23 @@ index dc03973..d49e3e5 100644
}
@Test
-@@ -74,41 +65,6 @@ public class ParseTest {
+@@ -74,6 +66,7 @@
}
@Test
-- public void testYahooJp() throws IOException {
-- File in = getFile("/htmltests/yahoo-jp.html");
-- Document doc = Jsoup.parse(in, "UTF-8", "http://www.yahoo.co.jp/index.html"); // http charset is utf-8.
-- assertEquals("Yahoo! JAPAN", doc.title());
-- Element a = doc.select("a[href=t/2322m2]").first();
-- assertEquals("http://www.yahoo.co.jp/_ylh=X3oDMTB0NWxnaGxsBF9TAzIwNzcyOTYyNjUEdGlkAzEyBHRtcGwDZ2Ex/t/2322m2",
-- a.attr("abs:href")); // session put into <base>
-- assertEquals("全国、人気の駅ランキング", a.text());
-- }
--
-- @Test
-- public void testBaidu() throws IOException {
-- // tests <meta http-equiv="Content-Type" content="text/html;charset=gb2312">
-- File in = getFile("/htmltests/baidu-cn-home.html");
-- Document doc = Jsoup.parse(in, null,
-- "http://www.baidu.com/"); // http charset is gb2312, but NOT specifying it, to test http-equiv parse
-- Element submit = doc.select("#su").first();
-- assertEquals("百度一下", submit.attr("value"));
--
-- // test from attribute match
-- submit = doc.select("input[value=百度一下]").first();
-- assertEquals("su", submit.id());
-- Element newsLink = doc.select("a:contains(新)").first();
-- assertEquals("http://news.baidu.com", newsLink.absUrl("href"));
--
-- // check auto-detect from meta
-- assertEquals("GB2312", doc.outputSettings().charset().displayName());
-- assertEquals("<title>百度一下,你就知道 </title>", doc.select("title").outerHtml());
--
-- doc.outputSettings().charset("ascii");
-- assertEquals("<title>&#30334;&#24230;&#19968;&#19979;&#65292;&#20320;&#23601;&#30693;&#36947; </title>",
-- doc.select("title").outerHtml());
-- }
--
-- @Test
- public void testBaiduVariant() throws IOException {
- // tests <meta charset> when preceded by another <meta>
- File in = getFile("/htmltests/baidu-variant.html");
-@@ -140,24 +96,6 @@ public class ParseTest {
++ @Ignore
+ public void testYahooJp() throws IOException {
+ File in = getFile("/htmltests/yahoo-jp.html");
+ Document doc = Jsoup.parse(in, "UTF-8", "http://www.yahoo.co.jp/index.html"); // http charset is utf-8.
+@@ -85,6 +78,7 @@
+ }
+
+ @Test
++ @Ignore
+ public void testBaidu() throws IOException {
+ // tests <meta http-equiv="Content-Type" content="text/html;charset=gb2312">
+ File in = getFile("/htmltests/baidu-cn-home.html");
+@@ -140,24 +134,6 @@
assertEquals("新", doc.text());
}
@@ -153,9 +133,6 @@ index dc03973..d49e3e5 100644
File getFile(String resourceName) {
try {
File file = new File(ParseTest.class.getResource(resourceName).toURI());
-diff --git a/src/test/resources/htmltests/wikipedia-article-1.html b/src/test/resources/htmltests/wikipedia-article-1.html
-new file mode 100644
-index 0000000..14e7758
--- /dev/null
+++ b/src/test/resources/htmltests/wikipedia-article-1.html
@@ -0,0 +1,1169 @@
--
jsoup HTML parser
More information about the pkg-java-commits
mailing list