Go Home Page
The Go Programming Language

Source file src/pkg/testing/regexp_test.go

// Copyright 2009 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

package testing

var good_re = []string{
    ``,
    `.`,
    `^.$`,
    `a`,
    `a*`,
    `a+`,
    `a?`,
    `a|b`,
    `a*|b*`,
    `(a*|b)(c*|d)`,
    `[a-z]`,
    `[a-abc-c\-\]\[]`,
    `[a-z]+`,
    `[]`,
    `[abc]`,
    `[^1234]`,
    `[^\n]`,
}

// TODO: nice to do this with a map
type stringError struct {
    re  string
    err string
}

var bad_re = []stringError{
    stringError{`*`, ErrBareClosure},
    stringError{`(abc`, ErrUnmatchedLpar},
    stringError{`abc)`, ErrUnmatchedRpar},
    stringError{`x[a-z`, ErrUnmatchedLbkt},
    stringError{`abc]`, ErrUnmatchedRbkt},
    stringError{`[z-a]`, ErrBadRange},
    stringError{`abc\`, ErrExtraneousBackslash},
    stringError{`a**`, ErrBadClosure},
    stringError{`a*+`, ErrBadClosure},
    stringError{`a??`, ErrBadClosure},
    stringError{`*`, ErrBareClosure},
    stringError{`\x`, ErrBadBackslash},
}

type vec []int

type tester struct {
    re    string
    text  string
    match vec
}

var matches = []tester{
    tester{``, "", vec{0, 0}},
    tester{`a`, "a", vec{0, 1}},
    tester{`x`, "y", vec{}},
    tester{`b`, "abc", vec{1, 2}},
    tester{`.`, "a", vec{0, 1}},
    tester{`.*`, "abcdef", vec{0, 6}},
    tester{`^abcd$`, "abcd", vec{0, 4}},
    tester{`^bcd'`, "abcdef", vec{}},
    tester{`^abcd$`, "abcde", vec{}},
    tester{`a+`, "baaab", vec{1, 4}},
    tester{`a*`, "baaab", vec{0, 0}},
    tester{`[a-z]+`, "abcd", vec{0, 4}},
    tester{`[^a-z]+`, "ab1234cd", vec{2, 6}},
    tester{`[a\-\]z]+`, "az]-bcz", vec{0, 4}},
    tester{`[^\n]+`, "abcd\n", vec{0, 4}},
    tester{`[日本語]+`, "日本語日本語", vec{0, 18}},
    tester{`()`, "", vec{0, 0, 0, 0}},
    tester{`(a)`, "a", vec{0, 1, 0, 1}},
    tester{`(.)(.)`, "日a", vec{0, 4, 0, 3, 3, 4}},
    tester{`(.*)`, "", vec{0, 0, 0, 0}},
    tester{`(.*)`, "abcd", vec{0, 4, 0, 4}},
    tester{`(..)(..)`, "abcd", vec{0, 4, 0, 2, 2, 4}},
    tester{`(([^xyz]*)(d))`, "abcd", vec{0, 4, 0, 4, 0, 3, 3, 4}},
    tester{`((a|b|c)*(d))`, "abcd", vec{0, 4, 0, 4, 2, 3, 3, 4}},
    tester{`(((a|b|c)*)(d))`, "abcd", vec{0, 4, 0, 4, 0, 3, 2, 3, 3, 4}},
    tester{`a*(|(b))c*`, "aacc", vec{0, 4, 2, 2, -1, -1}},
}

func compileTest(t *T, expr string, error string) *Regexp {
    re, err := CompileRegexp(expr)
    if err != error {
        t.Error("compiling `", expr, "`; unexpected error: ", err)
    }
    return re
}

func TestGoodCompile(t *T) {
    for i := 0; i < len(good_re); i++ {
        compileTest(t, good_re[i], "")
    }
}

func TestBadCompile(t *T) {
    for i := 0; i < len(bad_re); i++ {
        compileTest(t, bad_re[i].re, bad_re[i].err)
    }
}

func matchTest(t *T, expr string, str string, match []int) {
    re := compileTest(t, expr, "")
    if re == nil {
        return
    }
    m := re.MatchString(str)
    if m != (len(match) > 0) {
        t.Error("MatchString failure on `", expr, "` matching `", str, "`:", m, "should be", len(match) > 0)
    }
    // now try bytes
    m = re.Match([]byte(str))
    if m != (len(match) > 0) {
        t.Error("Match failure on `", expr, "` matching `", str, "`:", m, "should be", len(match) > 0)
    }
}

func TestMatch(t *T) {
    for i := 0; i < len(matches); i++ {
        test := &matches[i]
        matchTest(t, test.re, test.text, test.match)
    }
}

func matchFunctionTest(t *T, expr string, str string, match []int) {
    m, err := MatchString(expr, str)
    if err == "" {
        return
    }
    if m != (len(match) > 0) {
        t.Error("function Match failure on `", expr, "` matching `", str, "`:", m, "should be", len(match) > 0)
    }
}

func TestMatchFunction(t *T) {
    for i := 0; i < len(matches); i++ {
        test := &matches[i]
        matchFunctionTest(t, test.re, test.text, test.match)
    }
}