// Copyright 2016 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. //go:build go1.10 package bidirule import ( "golang.org/x/text/transform" "golang.org/x/text/unicode/bidi" ) var testCases = [][]ruleTest{ // Go-specific rules. // Invalid UTF-8 is invalid. 0: []ruleTest{{ in: "", dir: bidi.LeftToRight, }, { in: "\x80", dir: bidi.LeftToRight, err: ErrInvalid, n: 0, }, { in: "\xcc", dir: bidi.LeftToRight, err: ErrInvalid, n: 0, }, { in: "abc\x80", dir: bidi.LeftToRight, err: ErrInvalid, n: 3, }, { in: "abc\xcc", dir: bidi.LeftToRight, err: ErrInvalid, n: 3, }, { in: "abc\xccdef", dir: bidi.LeftToRight, err: ErrInvalid, n: 3, }, { in: "\xccdef", dir: bidi.LeftToRight, err: ErrInvalid, n: 0, }, { in: strR + "\x80", dir: bidi.RightToLeft, err: ErrInvalid, n: len(strR), }, { in: strR + "\xcc", dir: bidi.RightToLeft, err: ErrInvalid, n: len(strR), }, { in: strAL + "\xcc" + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: len(strAL), }, { in: "\xcc" + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 0, }}, // Rule 2.1: The first character must be a character with Bidi property L, // R, or AL. If it has the R or AL property, it is an RTL label; if it has // the L property, it is an LTR label. 1: []ruleTest{{ in: strL, dir: bidi.LeftToRight, }, { in: strR, dir: bidi.RightToLeft, }, { in: strAL, dir: bidi.RightToLeft, }, { in: strAN, dir: bidi.RightToLeft, err: ErrInvalid, }, { in: strEN, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strEN), }, { in: strES, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strES), }, { in: strET, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strET), }, { in: strCS, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strCS), }, { in: strNSM, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strNSM), }, { in: strBN, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strBN), }, { in: strB, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strB), }, { in: strS, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strS), }, { in: strWS, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strWS), }, { in: strON, dir: bidi.LeftToRight, err: ErrInvalid, n: len(strON), }, { in: strEN + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 3, }, { in: strES + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 2, }, { in: strET + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 1, }, { in: strCS + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 1, }, { in: strNSM + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 2, }, { in: strBN + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 3, }, { in: strB + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 3, }, { in: strS + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 1, }, { in: strWS + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 1, }, { in: strON + strR, dir: bidi.RightToLeft, err: ErrInvalid, n: 1, }}, // Rule 2.2: In an RTL label, only characters with the Bidi properties R, // AL, AN, EN, ES, CS, ET, ON, BN, or NSM are allowed. 2: []ruleTest{{ in: strR + strR + strAL, dir: bidi.RightToLeft, }, { in: strR + strAL + strR, dir: bidi.RightToLeft, }, { in: strR + strAN + strAL, dir: bidi.RightToLeft, }, { in: strR + strEN + strR, dir: bidi.RightToLeft, }, { in: strR + strES + strR, dir: bidi.RightToLeft, }, { in: strR + strCS + strR, dir: bidi.RightToLeft, }, { in: strR + strET + strAL, dir: bidi.RightToLeft, }, { in: strR + strON + strR, dir: bidi.RightToLeft, }, { in: strR + strBN + strR, dir: bidi.RightToLeft, }, { in: strR + strNSM + strAL, dir: bidi.RightToLeft, }, { in: strR + strL + strR, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strR + strB + strR, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strR + strS + strAL, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strR + strWS + strAL, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strAL + strR + strAL, dir: bidi.RightToLeft, }, { in: strAL + strAL + strR, dir: bidi.RightToLeft, }, { in: strAL + strAN + strAL, dir: bidi.RightToLeft, }, { in: strAL + strEN + strR, dir: bidi.RightToLeft, }, { in: strAL + strES + strR, dir: bidi.RightToLeft, }, { in: strAL + strCS + strR, dir: bidi.RightToLeft, }, { in: strAL + strET + strAL, dir: bidi.RightToLeft, }, { in: strAL + strON + strR, dir: bidi.RightToLeft, }, { in: strAL + strBN + strR, dir: bidi.RightToLeft, }, { in: strAL + strNSM + strAL, dir: bidi.RightToLeft, }, { in: strAL + strL + strR, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }, { in: strAL + strB + strR, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }, { in: strAL + strS + strAL, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }, { in: strAL + strWS + strAL, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }}, // Rule 2.3: In an RTL label, the end of the label must be a character with // Bidi property R, AL, EN, or AN, followed by zero or more characters with // Bidi property NSM. 3: []ruleTest{{ in: strR + strNSM, dir: bidi.RightToLeft, }, { in: strR + strR, dir: bidi.RightToLeft, }, { in: strR + strAL + strNSM, dir: bidi.RightToLeft, }, { in: strR + strEN + strNSM + strNSM, dir: bidi.RightToLeft, }, { in: strR + strAN, dir: bidi.RightToLeft, }, { in: strR + strES + strNSM, dir: bidi.RightToLeft, n: len(strR + strES + strNSM), err: ErrInvalid, }, { in: strR + strCS + strNSM + strNSM, dir: bidi.RightToLeft, n: len(strR + strCS + strNSM + strNSM), err: ErrInvalid, }, { in: strR + strET, dir: bidi.RightToLeft, n: len(strR + strET), err: ErrInvalid, }, { in: strR + strON + strNSM, dir: bidi.RightToLeft, n: len(strR + strON + strNSM), err: ErrInvalid, }, { in: strR + strBN + strNSM + strNSM, dir: bidi.RightToLeft, n: len(strR + strBN + strNSM + strNSM), err: ErrInvalid, }, { in: strR + strL + strNSM, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strR + strB + strNSM + strNSM, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strR + strS, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strR + strWS, dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, }, { in: strAL + strNSM, dir: bidi.RightToLeft, }, { in: strAL + strR, dir: bidi.RightToLeft, }, { in: strAL + strAL + strNSM, dir: bidi.RightToLeft, }, { in: strAL + strEN + strNSM + strNSM, dir: bidi.RightToLeft, }, { in: strAL + strAN, dir: bidi.RightToLeft, }, { in: strAL + strES + strNSM, dir: bidi.RightToLeft, n: len(strAL + strES + strNSM), err: ErrInvalid, }, { in: strAL + strCS + strNSM + strNSM, dir: bidi.RightToLeft, n: len(strAL + strCS + strNSM + strNSM), err: ErrInvalid, }, { in: strAL + strET, dir: bidi.RightToLeft, n: len(strAL + strET), err: ErrInvalid, }, { in: strAL + strON + strNSM, dir: bidi.RightToLeft, n: len(strAL + strON + strNSM), err: ErrInvalid, }, { in: strAL + strBN + strNSM + strNSM, dir: bidi.RightToLeft, n: len(strAL + strBN + strNSM + strNSM), err: ErrInvalid, }, { in: strAL + strL + strNSM, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }, { in: strAL + strB + strNSM + strNSM, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }, { in: strAL + strS, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }, { in: strAL + strWS, dir: bidi.RightToLeft, n: len(strAL), err: ErrInvalid, }}, // Rule 2.4: In an RTL label, if an EN is present, no AN may be present, // and vice versa. 4: []ruleTest{{ in: strR + strEN + strAN, dir: bidi.RightToLeft, n: len(strR + strEN), err: ErrInvalid, }, { in: strR + strAN + strEN + strNSM, dir: bidi.RightToLeft, n: len(strR + strAN), err: ErrInvalid, }, { in: strAL + strEN + strAN, dir: bidi.RightToLeft, n: len(strAL + strEN), err: ErrInvalid, }, { in: strAL + strAN + strEN + strNSM, dir: bidi.RightToLeft, n: len(strAL + strAN), err: ErrInvalid, }}, // Rule 2.5: In an LTR label, only characters with the Bidi properties L, // EN, ES, CS, ET, ON, BN, or NSM are allowed. 5: []ruleTest{{ in: strL + strL + strL, dir: bidi.LeftToRight, }, { in: strL + strEN + strL, dir: bidi.LeftToRight, }, { in: strL + strES + strL, dir: bidi.LeftToRight, }, { in: strL + strCS + strL, dir: bidi.LeftToRight, }, { in: strL + strET + strL, dir: bidi.LeftToRight, }, { in: strL + strON + strL, dir: bidi.LeftToRight, }, { in: strL + strBN + strL, dir: bidi.LeftToRight, }, { in: strL + strNSM + strL, dir: bidi.LeftToRight, }, { in: strL + strR + strL, dir: bidi.RightToLeft, n: len(strL), err: ErrInvalid, }, { in: strL + strAL + strL, dir: bidi.RightToLeft, n: len(strL), err: ErrInvalid, }, { in: strL + strAN + strL, dir: bidi.RightToLeft, n: len(strL), err: ErrInvalid, }, { in: strL + strB + strL, dir: bidi.LeftToRight, n: len(strL + strB + strL), err: ErrInvalid, }, { in: strL + strB + strL + strR, dir: bidi.RightToLeft, n: len(strL + strB + strL), err: ErrInvalid, }, { in: strL + strS + strL, dir: bidi.LeftToRight, n: len(strL + strS + strL), err: ErrInvalid, }, { in: strL + strS + strL + strR, dir: bidi.RightToLeft, n: len(strL + strS + strL), err: ErrInvalid, }, { in: strL + strWS + strL, dir: bidi.LeftToRight, n: len(strL + strWS + strL), err: ErrInvalid, }, { in: strL + strWS + strL + strR, dir: bidi.RightToLeft, n: len(strL + strWS + strL), err: ErrInvalid, }}, // Rule 2.6: In an LTR label, the end of the label must be a character with // Bidi property L or EN, followed by zero or more characters with Bidi // property NSM. 6: []ruleTest{{ in: strL, dir: bidi.LeftToRight, }, { in: strL + strNSM, dir: bidi.LeftToRight, }, { in: strL + strNSM + strNSM, dir: bidi.LeftToRight, }, { in: strL + strEN, dir: bidi.LeftToRight, }, { in: strL + strEN + strNSM, dir: bidi.LeftToRight, }, { in: strL + strEN + strNSM + strNSM, dir: bidi.LeftToRight, }, { in: strL + strES, dir: bidi.LeftToRight, n: len(strL + strES), err: ErrInvalid, }, { in: strL + strES + strR, dir: bidi.RightToLeft, n: len(strL + strES), err: ErrInvalid, }, { in: strL + strCS, dir: bidi.LeftToRight, n: len(strL + strCS), err: ErrInvalid, }, { in: strL + strCS + strR, dir: bidi.RightToLeft, n: len(strL + strCS), err: ErrInvalid, }, { in: strL + strET, dir: bidi.LeftToRight, n: len(strL + strET), err: ErrInvalid, }, { in: strL + strET + strR, dir: bidi.RightToLeft, n: len(strL + strET), err: ErrInvalid, }, { in: strL + strON, dir: bidi.LeftToRight, n: len(strL + strON), err: ErrInvalid, }, { in: strL + strON + strR, dir: bidi.RightToLeft, n: len(strL + strON), err: ErrInvalid, }, { in: strL + strBN, dir: bidi.LeftToRight, n: len(strL + strBN), err: ErrInvalid, }, { in: strL + strBN + strR, dir: bidi.RightToLeft, n: len(strL + strBN), err: ErrInvalid, }, { in: strL + strR, dir: bidi.RightToLeft, n: len(strL), err: ErrInvalid, }, { in: strL + strAL, dir: bidi.RightToLeft, n: len(strL), err: ErrInvalid, }, { in: strL + strAN, dir: bidi.RightToLeft, n: len(strL), err: ErrInvalid, }, { in: strL + strB, dir: bidi.LeftToRight, n: len(strL + strB), err: ErrInvalid, }, { in: strL + strB + strR, dir: bidi.RightToLeft, n: len(strL + strB), err: ErrInvalid, }, { in: strL + strS, dir: bidi.LeftToRight, n: len(strL + strS), err: ErrInvalid, }, { in: strL + strS + strR, dir: bidi.RightToLeft, n: len(strL + strS), err: ErrInvalid, }, { in: strL + strWS, dir: bidi.LeftToRight, n: len(strL + strWS), err: ErrInvalid, }, { in: strL + strWS + strR, dir: bidi.RightToLeft, n: len(strL + strWS), err: ErrInvalid, }}, // Incremental processing. 9: []ruleTest{{ in: "e\u0301", // é dir: bidi.LeftToRight, pSrc: 2, nSrc: 1, err0: transform.ErrShortSrc, }, { in: "e\u1000f", // é dir: bidi.LeftToRight, pSrc: 3, nSrc: 1, err0: transform.ErrShortSrc, }, { // Remain invalid once invalid. in: strR + "ab", dir: bidi.RightToLeft, n: len(strR), err: ErrInvalid, pSrc: len(strR) + 1, nSrc: len(strR), err0: ErrInvalid, }, { // Short destination in: "abcdefghij", dir: bidi.LeftToRight, pSrc: 10, szDst: 5, nSrc: 5, err0: transform.ErrShortDst, }, { in: "\U000102f7", dir: bidi.LeftToRight, n: len("\U000102f7"), err: ErrInvalid, }, { // Short destination splitting input rune in: "e\u0301", dir: bidi.LeftToRight, pSrc: 3, szDst: 2, nSrc: 1, err0: transform.ErrShortDst, }, { // Unicode 10.0.0 IDNA test string. in: "FAX\u2a77\U0001d186", dir: bidi.LeftToRight, n: len("FAX\u2a77\U0001d186"), err: ErrInvalid, }, { in: "\x80\u0660", dir: bidi.RightToLeft, n: 0, err: ErrInvalid, }}, }