锘??xml version="1.0" encoding="utf-8" standalone="yes"?>在线观看av网站,国产精品久久久久久久龚玥菲 ,蜜桃一区二区http://www.aygfsteel.com/xiaolitnt/category/43901.html鏀瑰彉涓嶄簡鐜板疄錛岄偅灝卞幓鏀瑰彉浣犵殑蹇冩?/description>zh-cnFri, 05 Feb 2010 01:59:44 GMTFri, 05 Feb 2010 01:59:44 GMT60HtmlParser鎶撳彇鐧懼害鏂版瓕TOP100http://www.aygfsteel.com/xiaolitnt/archive/2010/02/05/312050.html闃挎媺紲炵伅闃挎媺紲炵伅Fri, 05 Feb 2010 01:41:00 GMThttp://www.aygfsteel.com/xiaolitnt/archive/2010/02/05/312050.htmlhttp://www.aygfsteel.com/xiaolitnt/comments/312050.htmlhttp://www.aygfsteel.com/xiaolitnt/archive/2010/02/05/312050.html#Feedback0http://www.aygfsteel.com/xiaolitnt/comments/commentRss/312050.htmlhttp://www.aygfsteel.com/xiaolitnt/services/trackbacks/312050.html 

import org.htmlparser.NodeFilter;
import
 org.htmlparser.Parser;
import
 org.htmlparser.filters.HasAttributeFilter;
import
 org.htmlparser.filters.NodeClassFilter;
import
 org.htmlparser.filters.TagNameFilter;
import
 org.htmlparser.tags.LinkTag;
import
 org.htmlparser.tags.Span;
import
 org.htmlparser.tags.TableColumn;
import
 org.htmlparser.tags.TableRow;
import
 org.htmlparser.tags.TableTag;
import
 org.htmlparser.util.NodeList;
import
 org.htmlparser.util.ParserException;

public class
 test3 {
    
public static void main(String[] args) throws
 ParserException {
        String url 
= "http://list.mp3.baidu.com/top/top100.html"
;
        Parser parser 
= new
 Parser(url);
        NodeFilter filter_table 
= new NodeClassFilter(TableTag.class
);
        NodeFilter filter_span 
= new NodeClassFilter(Span.class
);
        NodeFilter filter_link 
= new TagNameFilter("A"
);
        NodeFilter filter_search 
= new HasAttributeFilter("class","search"
);
        NodeList nodelist 
=
 parser.extractAllNodesThatMatch(filter_table);
        
for(int i = 0  ; i < nodelist.size() ; i++
){
            TableTag table 
=
 (TableTag) nodelist.elementAt(i);
            
for(int j = 0 ; j < table.getRowCount() ; j++
){
                TableRow row 
=
 table.getRow(j);
                TableColumn[] column 
=
 row.getColumns();
                
for(int m = 0 ; m < row.getColumnCount() ; m++
){
                    String tempstr 
=
 column[m].getStringText() ;
                    parser 
= Parser.createParser(tempstr,"utf-8"
);
                    NodeList list_span 
=
 parser.extractAllNodesThatMatch(filter_span);
                    
if(list_span.size() > 0
){
                        
for(int i1 = 0 ; i1 < list_span.size() ; i1++
){
                            System.out.print(list_span.elementAt(i1).toPlainTextString() 
+ "  "
);
                        }
                    }
                    parser.reset();
                    NodeList list_link 
=
 parser.extractAllNodesThatMatch(filter_link);
                    
if(list_link.size() > 0
){
                        
for(int i1 = 0 ; i1 < list_link.size() ; i1++
){    
                            String content 
=
 ((LinkTag)list_link.elementAt(i1)).getLinkText() ;
                            
if(!content.equals(null
)){
                                System.out.print(content 
+ "  "
);
                            }
                        }
                    }
                    parser.reset();
                    NodeList list_search 
=
 parser.extractAllNodesThatMatch(filter_search);
                    
if(list_search.size() > 0
){
                        
for(int i1 = 0 ; i1 < list_search.size() ; i1++
){    
                            String link 
=
 ((LinkTag)list_search.elementAt(i1)).getLink() ;
                            
if(!link.equals(null
)){
                                System.out.print(link 
+ "  "
);
                            }
                        }
                    }
                }
                System.out.println();
            }
        }    
    }
}


]]>
主站蜘蛛池模板: 九江县| 嘉祥县| 绥宁县| 油尖旺区| 清苑县| 马龙县| 浙江省| 民县| 泽库县| 鄯善县| 涿鹿县| 桐乡市| 安丘市| 醴陵市| 来宾市| 永春县| 虎林市| 呼伦贝尔市| 新田县| 枣阳市| 蚌埠市| 阜康市| 略阳县| 高安市| 鄂托克前旗| 同德县| 阳东县| 无锡市| 旬邑县| 如皋市| 张家界市| 沽源县| 宜兴市| 德江县| 西盟| 晋江市| 新野县| 炎陵县| 安陆市| 石首市| 琼结县|