[Regular Expression] regular expressions application

JavaScript form validation

<!DOCTYPE html>
<html>
<head>
<meta charset="UTF-8">
<title>Insert title here</title>
</head>
<body>
    <form action="#" method="post" id="frmInfo">
        <div id="err" style="color: red"></div>
        <div>
            姓名:<input id="name" name="name" />
        </div>
        <div>
            身份证:<input id="idno" name="idno" />
        </div>
        <div>
            <input type="submit" />
        </div>
    </form>
    <script type="text/javascript">
        document.getElementById("frmInfo").onsubmit = function() {
            //在JS中定义正则表达式对象只需要在/正则表达式/
            var regex1 = /^[\u4e00-\u9fa5]{2,8}$/; //全字匹配2-8个中文字符
            var regex2 = /^[1234568]\d{16}[0-9xX]$/; 
            var name = document.getElementById("name").value;
            var idno = document.getElementById("idno").value;
            if (regex1.test(name) == false) { //利用正则校验数据,true代表匹配成功,false代表匹配失败
                document.getElementById("err").innerHTML = "无效姓名";
                return false; //不提交表单数据
            }else if(regex2.test(idno) == false) {
                document.getElementById("err").innerHTML = "无效身份证号";
                return false;
            }else {
                alert("验证通过,准备提交");
                return true;
            }
        }
    </script>
</body>
</html>

Java, Web page information extraction

Extraction of Web pages and urban Chinese name English name

Web page

<!DOCTYPE html>
<html>
<head>
<meta charset="UTF-8">
<title>国际主要城市</title>
</head>
<body>
    <h1>国际主要城市</h1>
    <ul>
        <li>纽约NewYork</li>
        <li>伦敦London</li>
        <li>东京Tokyo</li>
        <li>巴黎Paris</li>
        <li>香港HongKong</li>
        <li>新加坡Singapore</li>
        <li>悉尼Sydney</li>
        <li>米兰Milano</li>
        <li>上海Shanghai</li>
        <li>北京Beijing</li>
        <li>马德里Madrid</li>
        <li>莫斯科Moscow</li>
        <li>首尔Seoul</li>
        <li>曼谷Bangkok</li>
        <li>多伦多Toronto</li>
        <li>布鲁塞尔Brussels</li>
        <li>芝加哥Chicago</li>
        <li>吉隆坡KualaLumpur</li>
    </ul>
</body>
</html>

Information extraction

package com.imooc.regex;

import java.io.BufferedReader;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.InputStreamReader;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

public class RegexSample {
    public static void main(String[] args) {
        StringBuilder content = new StringBuilder();
        try {
            FileInputStream fis = new FileInputStream("D:/workspace/regex/WebContent/sample.html"); //原始的文件输入流,擅长处理二进制数据
            InputStreamReader isr = new InputStreamReader(fis,"UTF-8"); //转换为可读的字符串流
            BufferedReader bufferedReader = new BufferedReader(isr); //从缓冲流读取,提高读取效率
            String lineText = "";
            while((lineText = bufferedReader.readLine()) != null) {
//              System.out.println(lineText);
                content.append(lineText + "\n");
            }
            bufferedReader.close();
            System.out.println(content);
        
        } catch (Exception e) {
            // TODO Auto-generated catch block
            e.printStackTrace();
        }
        
        //1.创建正则表达式对象
        Pattern p = Pattern.compile("<li>([\\u4e00-\\u9fa5]{2,10})([a-zA-Z]+)</li>");
        //2.匹配正则表达式
        Matcher m = p.matcher(content);
        //3.查找匹配的结果
        while(m.find()) {
//          System.out.println(m.group(0)); //完整匹配信息
            String chs = m.group(1); //分组1
            String eng = m.group(2); //分组2
            System.out.println(chs + "-" + eng);
        }
    }
}

Guess you like

Origin www.cnblogs.com/huowuyan/p/11300745.html