// tablecontentbyhtmlparse.java
// (Code-viewer residue: "Font size:" control; not part of the program.)
package test;
import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.List;
import net.htmlparser.jericho.Element;
import net.htmlparser.jericho.HTMLElementName;
import net.htmlparser.jericho.Source;
/**
 * Looks up individual cells of HTML tables using the Jericho HTML parser
 * ({@code net.htmlparser.jericho}).
 * <ol>
 * <li>Cells are located by zero-based row and column index.</li>
 * <li>Every {@code <table>} element of a document can be processed.</li>
 * <li>Nested tables are not handled specially: rows and cells are collected
 * with {@code findAllElements}, so rows of an inner table are presumably
 * counted together with those of the outer one; nested tables may need
 * further changes (original author's note).</li>
 * </ol>
 *
 * @author Administrator
 */
public class TableContentByHtmlParse {

    /**
     * Returns the {@code <td>} element at the given position inside a table.
     * <p>
     * Only {@code <td>} elements are considered when counting columns. The
     * method has no side effects; callers decide what to do with the cell.
     *
     * @param element the table element to search; may be {@code null}
     * @param rows    zero-based index of the {@code <tr>} within {@code element}
     * @param cols    zero-based index of the {@code <td>} within that row
     * @return the matching cell, or {@code null} when {@code element} is
     *         {@code null} or either index is negative or out of range
     */
    public Element getTableContent(Element element, int rows, int cols) {
        // Negative indices used to reach List.get() and throw; treat them
        // like any other out-of-range position.
        if (element == null || rows < 0 || cols < 0) {
            return null;
        }
        List<Element> trList = element.findAllElements(HTMLElementName.TR);
        if (rows >= trList.size()) {
            return null;
        }
        List<Element> tdList = trList.get(rows).findAllElements(
                HTMLElementName.TD);
        if (cols >= tdList.size()) {
            return null;
        }
        return tdList.get(cols);
    }

    /**
     * Loads the document at {@code url} and prints, for every table in it,
     * the content of the cell at row index 2, column index 2 (when present).
     * <p>
     * If the URL is malformed or the document cannot be read, the stack
     * trace is printed and the method returns without processing anything.
     *
     * @param url address of the HTML document to load
     */
    public static void test(String url) {
        Source source;
        try {
            source = new Source(new URL(url));
        } catch (MalformedURLException e) {
            e.printStackTrace();
            // Nothing was loaded; continuing would dereference null.
            return;
        } catch (IOException e) {
            e.printStackTrace();
            return;
        }
        TableContentByHtmlParse parser = new TableContentByHtmlParse();
        for (Element table : source.findAllElements(HTMLElementName.TABLE)) {
            Element cell = parser.getTableContent(table, 2, 2);
            if (cell != null) {
                System.out.println(cell.getContent().toString());
            }
        }
    }

    /**
     * Runs {@link #test(String)} against a fixed sample page.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        test("http://www.akae.cn/study/resourceShareC.html");
    }
}
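/*
 * Code-viewer residue (keyboard shortcut help); not part of the program:
 *   Copy code:          Ctrl + C
 *   Search code:        Ctrl + F
 *   Full-screen mode:   F11
 *   Switch theme:       Ctrl + Shift + D
 *   Show shortcuts:     ?
 *   Increase font size: Ctrl + =
 *   Decrease font size: Ctrl + -
 */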