美文网首页正则表达式
日期区间正则表达式生成模块

日期区间正则表达式生成模块

作者: 白杨春晓 | 来源:发表于2017-06-23 14:06 被阅读5次

    功能:给定开始日期和结束日期,返回匹配该段日期区间的正则表达式。生成的正则表达式假定了每个月都有39天,即01-39,所以不要使用该模块来判断日期的合法性。该模块生成的正则表达式的使用场景是从一组合法日期中提取给定区间内的日期。源码如下,使用scala实现。

    def genRegexp(start:String,end:String): String = {
            //s:开始e:结束y:年m:月d:日o:个位t:十位
            //sy:开始年em:结束月,其他变量命名规则相同
            val sy = start.substring(0, 4)
            val sm = start.substring(4, 6)
            val sd = start.substring(6, 8)
            val ey = end.substring(0, 4)
            val em = end.substring(4, 6)
            val ed = end.substring(6, 8)
            val sdo = sd.substring(1, 2)
            val sdt = sd.substring(0, 1)
            val smo = sm.substring(1, 2)
            val smt = sm.substring(0, 1)
            val syo = sy.substring(3, 4)
            val syt = sy.substring(2, 3)
            val edo = ed.substring(1, 2)
            val edt = ed.substring(0, 1)
            val emo = em.substring(1, 2)
            val emt = em.substring(0, 1)
            val eyo = ey.substring(3, 4)
            val eyt = ey.substring(2, 3)
            var PAL = ""
            var PAR = ""
            var PA = ""
            var PB = ""
            var PC = ""
            var PCL = ""
            var PCR = ""
            var pattern = ""
            var PL = ""
            var PR = ""
            var PRT = ""
            if (sy == ey) {
                if (sm == em) {
                    if (sdt == edt) {
                        pattern = "(^%s%s%s[%s-%s]$)".format(sy, sm, sdt, sdo, edo)
                    }
                    else {
                        if (sdt.toInt + 1 == edt.toInt) {
                            pattern = "(^%s%s((%s[%s-9])|(%s[0-%s]))$)".format(sy, sm, sdt, sdo, edt, edo)
                        }
                        else {
                            pattern = "(^%s%s((%s[%s-9])|(%s[0-%s])|([%d-%d]\\d))$)".format(sy, sm, sdt, sdo,
                                edt, edo, sdt.toInt + 1, edt.toInt - 1)
                        }
                    }
                }
                else {
                    if (sdt == "3") {
                        PL = "(%s3[%s-9])".format(sm, sdo)
                    }
                    else {
                        PL = "(%s((%s[%s-9])|([%d-3]\\d)))".format(sm, sdt, sdo, sdt.toInt + 1)
                    }
                    if (edt == "0") {
                        PR = "(%s0[0-%s])".format(em, edo)
                    }
                    else {
                        PR = "(%s(([0-%d]\\d)|(%s[0-%s])))".format(em, edt.toInt - 1, edt, edo)
                    }
                    PRT = "(pass)"
                    if (sm.toInt + 1 != em.toInt) {
                        val sma = sm.toInt + 1
                        val emr = em.toInt - 1
                        if (sma < 10) {
                            if (emr < 10) {
                                PRT = "(0[%d-%d]\\d{2})".format(sma, emr)
                            }
                            else {
                                PRT = "(((0[%d-9])|(1[0-%d]))\\d{2})".format(smo.toInt + 1, emo.toInt - 1)
                            }
                        }
                        else {
                            PRT = "((1[%s-%s])\\d{2})".format((sma.toString).substring(1,2),
                                (emr.toString).substring(1,2))
                        }
                    }
                    pattern = "(^%s(%s|%s|%s)$)".format(sy, PL, PR, PRT)
                }
            }
            else {
                //构造PA
                if (sdt == "3") {
                    PAL = "%s(%s[%s-9])".format(sm, sdt, sdo)
                }
                else {
                    PAL = "(%s((%s[%s-9])|([%d-3]\\d)))".format(sm, sdt, sdo, sdt.toInt + 1)
                }
                if (sm.toInt == 12) {
                    PAR = "(pass)"
                }
                else if (sm.toInt >= 9) {
                    var sm2 = (sm.toInt + 1).toString
                    var smo2 = sm2.substring(1,2)
                    PAR = "(1[%s-2]\\d\\d)".format(smo2)
                }
                else {
                    PAR = "(((0[%d-9])|(1[0-2]))\\d{2})".format(smo.toInt + 1)
                }
                PA = "(^%s(%s|%s)$)".format(sy, PAL, PAR)
                //构造PB,已知问题,结束年不可为2000
                if (sy.toInt + 1 != ey.toInt) {
                    var sy2 = (sy.toInt + 1).toString
                    var syt2 = sy2.substring(2,3)
                    var syo2 = sy2.substring(3,4)
                    var ey2 = (ey.toInt - 1).toString
                    var eyt2 = ey2.substring(2,3)
                    var eyo2 = ey2.substring(3,4)
                    if (syt2 == eyt2) {
                        PB = "(^20%s[%s-%s]\\d{4}$)".format(syt2, syo2, eyo2)
                    }
                    else {
                        if (syt2.toInt + 1 != eyt2.toInt) {
                            PB = "(^20((%s[%d-9])|([%d-%d]\\d)|(%s[0-%s]))\\d{4}$)".format(syt2, syo2.toInt,
                                syt2.toInt + 1, eyt2.toInt - 1, eyt2, eyo2)
                        }
                        else {
                            PB = "(^20((%s[%d-9])|(%s[0-%s]))\\d{4}$)".format(syt2, syo2.toInt,
                                eyt2, eyo2)
                        }
                    }
                }
                else {
                    PB = "(pass)"
                }
                //构造PC
                if (edt == "0") {
                    PCR = "(%s%s[0-%s])".format(em, edt, edo)
                }
                else {
                    PCR = "(%s(([0-%d]\\d)|(%s[0-%s])))".format(em, edt.toInt - 1, edt, edo)
                }
                if (em.toInt >= 11) {
                    PCL = "(((0[1-9])|(1[0-%d]))\\d{2})".format( emo.toInt - 1)
                }
                else if (em.toInt == 10) {
                    PCL = "(0[1-9]\\d{2})"
                }
                else {
                    PCL = "(0[0-%d]\\d{2})".format(emo.toInt - 1)
                }
                PC = "(^%s(%s|%s)$)".format(ey, PCL, PCR)
                pattern = "%s|%s|%s".format(PA, PB, PC)
            }
            pattern
        }
    

    相关文章

      网友评论

        本文标题:日期区间正则表达式生成模块

        本文链接:https://www.haomeiwen.com/subject/jelccxtx.html