正则表达式(根据Tag查询Html内容)

使用正则表达式查询一段Html中的Title标签,包括内容!!


import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

public class Test {

    public static void main(String args[]) {
        String html = "<title fdsafdsa>ABCD<hrf></title>gsdggas<title>ggds</title>jkll<title fdfdsa>005</title>";
        List resultList = getContextByTag(html,"title");
        for (Iterator iterator = resultList.iterator(); iterator.hasNext();) {
            String context = (String) iterator.next();
            System.out.println(context);
        }
    }
    
    public static List getContextByTag(String html,String tag) {
    	String reg="<"+tag+"(([^<|^>|.]*>)|( >)).*?</"+tag+">";
        List resultList = new ArrayList();
        Pattern p = Pattern.compile(reg);
        Matcher m = p.matcher(html );
        while (m.find()) {
            resultList.add(m.group());
        }
        return resultList;
    }
}


结果:
<title fdsafdsa>ABCD<hrf></title>
<title>ggds</title>
<title fdfdsa>005</title>

你可能感兴趣的:(java,html,正则表达式)