ceph-csi/vendor/github.com/google/cel-go/parser/unescape.go

// Copyright 2018 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package parser

import (
	"fmt"
	"strings"
	"unicode/utf8"
)

// Unescape takes a quoted string, unquotes, and unescapes it.
//
// This function performs escaping compatible with GoogleSQL.
func unescape(value string, isBytes bool) (string, error) {
	// All strings normalize newlines to the \n representation.
	value = newlineNormalizer.Replace(value)
	n := len(value)

	// Nothing to unescape / decode.
	if n < 2 {
		return value, fmt.Errorf("unable to unescape string")
	}

	// Raw string preceded by the 'r|R' prefix.
	isRawLiteral := false
	if value[0] == 'r' || value[0] == 'R' {
		value = value[1:]
		n = len(value)
		isRawLiteral = true
	}

	// Quoted string of some form, must have same first and last char.
	if value[0] != value[n-1] || (value[0] != '"' && value[0] != '\'') {
		return value, fmt.Errorf("unable to unescape string")
	}

	// Normalize the multi-line CEL string representation to a standard
	// Go quoted string.
	if n >= 6 {
		if strings.HasPrefix(value, "'''") {
			if !strings.HasSuffix(value, "'''") {
				return value, fmt.Errorf("unable to unescape string")
			}
			value = "\"" + value[3:n-3] + "\""
		} else if strings.HasPrefix(value, `"""`) {
			if !strings.HasSuffix(value, `"""`) {
				return value, fmt.Errorf("unable to unescape string")
			}
			value = "\"" + value[3:n-3] + "\""
		}
		n = len(value)
	}
	value = value[1 : n-1]
	// If there is nothing to escape, then return.
	if isRawLiteral || !strings.ContainsRune(value, '\\') {
		return value, nil
	}

	// Otherwise the string contains escape characters.
	// The following logic is adapted from `strconv/quote.go`
	var runeTmp [utf8.UTFMax]byte
	buf := make([]byte, 0, 3*n/2)
	for len(value) > 0 {
		c, encode, rest, err := unescapeChar(value, isBytes)
		if err != nil {
			return "", err
		}
		value = rest
		if c < utf8.RuneSelf || !encode {
			buf = append(buf, byte(c))
		} else {
			n := utf8.EncodeRune(runeTmp[:], c)
			buf = append(buf, runeTmp[:n]...)
		}
	}
	return string(buf), nil
}

// unescapeChar takes a string input and returns the following info:
//
//   value - the escaped unicode rune at the front of the string.
//   encode - the value should be unicode-encoded
//   tail - the remainder of the input string.
//   err - error value, if the character could not be unescaped.
//
// When encode is true the return value may still fit within a single byte,
// but unicode encoding is attempted which is more expensive than when the
// value is known to self-represent as a single byte.
//
// If isBytes is set, unescape as a bytes literal so octal and hex escapes
// represent byte values, not unicode code points.
func unescapeChar(s string, isBytes bool) (value rune, encode bool, tail string, err error) {
	// 1. Character is not an escape sequence.
	switch c := s[0]; {
	case c >= utf8.RuneSelf:
		r, size := utf8.DecodeRuneInString(s)
		return r, true, s[size:], nil
	case c != '\\':
		return rune(s[0]), false, s[1:], nil
	}

	// 2. Last character is the start of an escape sequence.
	if len(s) <= 1 {
		err = fmt.Errorf("unable to unescape string, found '\\' as last character")
		return
	}

	c := s[1]
	s = s[2:]
	// 3. Common escape sequences shared with Google SQL
	switch c {
	case 'a':
		value = '\a'
	case 'b':
		value = '\b'
	case 'f':
		value = '\f'
	case 'n':
		value = '\n'
	case 'r':
		value = '\r'
	case 't':
		value = '\t'
	case 'v':
		value = '\v'
	case '\\':
		value = '\\'
	case '\'':
		value = '\''
	case '"':
		value = '"'
	case '`':
		value = '`'
	case '?':
		value = '?'

	// 4. Unicode escape sequences, reproduced from `strconv/quote.go`
	case 'x', 'X', 'u', 'U':
		n := 0
		encode = true
		switch c {
		case 'x', 'X':
			n = 2
			encode = !isBytes
		case 'u':
			n = 4
			if isBytes {
				err = fmt.Errorf("unable to unescape string")
				return
			}
		case 'U':
			n = 8
			if isBytes {
				err = fmt.Errorf("unable to unescape string")
				return
			}
		}
		var v rune
		if len(s) < n {
			err = fmt.Errorf("unable to unescape string")
			return
		}
		for j := 0; j < n; j++ {
			x, ok := unhex(s[j])
			if !ok {
				err = fmt.Errorf("unable to unescape string")
				return
			}
			v = v<<4 | x
		}
		s = s[n:]
		if !isBytes && v > utf8.MaxRune {
			err = fmt.Errorf("unable to unescape string")
			return
		}
		value = v

	// 5. Octal escape sequences, must be three digits \[0-3][0-7][0-7]
	case '0', '1', '2', '3':
		if len(s) < 2 {
			err = fmt.Errorf("unable to unescape octal sequence in string")
			return
		}
		v := rune(c - '0')
		for j := 0; j < 2; j++ {
			x := s[j]
			if x < '0' || x > '7' {
				err = fmt.Errorf("unable to unescape octal sequence in string")
				return
			}
			v = v*8 + rune(x-'0')
		}
		if !isBytes && v > utf8.MaxRune {
			err = fmt.Errorf("unable to unescape string")
			return
		}
		value = v
		s = s[2:]
		encode = !isBytes

		// Unknown escape sequence.
	default:
		err = fmt.Errorf("unable to unescape string")
	}

	tail = s
	return
}

func unhex(b byte) (rune, bool) {
	c := rune(b)
	switch {
	case '0' <= c && c <= '9':
		return c - '0', true
	case 'a' <= c && c <= 'f':
		return c - 'a' + 10, true
	case 'A' <= c && c <= 'F':
		return c - 'A' + 10, true
	}
	return 0, false
}

var (
	newlineNormalizer = strings.NewReplacer("\r\n", "\n", "\r", "\n")
)
rebase: bump k8s.io/kubernetes from 1.26.2 to 1.27.2 Bumps [k8s.io/kubernetes](https://github.com/kubernetes/kubernetes) from 1.26.2 to 1.27.2. - [Release notes](https://github.com/kubernetes/kubernetes/releases) - [Commits](https://github.com/kubernetes/kubernetes/compare/v1.26.2...v1.27.2) --- updated-dependencies: - dependency-name: k8s.io/kubernetes dependency-type: direct:production update-type: version-update:semver-minor ... Signed-off-by: dependabot[bot] <support@github.com> 2023-05-29 21:03:29 +00:00			`// Copyright 2018 Google LLC`
			`//`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`

			`package parser`

			`import (`
			`"fmt"`
			`"strings"`
			`"unicode/utf8"`
			`)`

			`// Unescape takes a quoted string, unquotes, and unescapes it.`
			`//`
			`// This function performs escaping compatible with GoogleSQL.`
			`func unescape(value string, isBytes bool) (string, error) {`
			`// All strings normalize newlines to the \n representation.`
			`value = newlineNormalizer.Replace(value)`
			`n := len(value)`

			`// Nothing to unescape / decode.`
			`if n < 2 {`
			`return value, fmt.Errorf("unable to unescape string")`
			`}`

			`// Raw string preceded by the 'r\|R' prefix.`
			`isRawLiteral := false`
			`if value[0] == 'r' \|\| value[0] == 'R' {`
			`value = value[1:]`
			`n = len(value)`
			`isRawLiteral = true`
			`}`

			`// Quoted string of some form, must have same first and last char.`
			`if value[0] != value[n-1] \|\| (value[0] != '"' && value[0] != '\'') {`
			`return value, fmt.Errorf("unable to unescape string")`
			`}`

			`// Normalize the multi-line CEL string representation to a standard`
			`// Go quoted string.`
			`if n >= 6 {`
			`if strings.HasPrefix(value, "'''") {`
			`if !strings.HasSuffix(value, "'''") {`
			`return value, fmt.Errorf("unable to unescape string")`
			`}`
			`value = "\"" + value[3:n-3] + "\""`
			} else if strings.HasPrefix(value, `"""`) {
			if !strings.HasSuffix(value, `"""`) {
			`return value, fmt.Errorf("unable to unescape string")`
			`}`
			`value = "\"" + value[3:n-3] + "\""`
			`}`
			`n = len(value)`
			`}`
			`value = value[1 : n-1]`
			`// If there is nothing to escape, then return.`
			`if isRawLiteral \|\| !strings.ContainsRune(value, '\\') {`
			`return value, nil`
			`}`

			`// Otherwise the string contains escape characters.`
			// The following logic is adapted from `strconv/quote.go`
			`var runeTmp [utf8.UTFMax]byte`
			`buf := make([]byte, 0, 3*n/2)`
			`for len(value) > 0 {`
			`c, encode, rest, err := unescapeChar(value, isBytes)`
			`if err != nil {`
			`return "", err`
			`}`
			`value = rest`
			`if c < utf8.RuneSelf \|\| !encode {`
			`buf = append(buf, byte(c))`
			`} else {`
			`n := utf8.EncodeRune(runeTmp[:], c)`
			`buf = append(buf, runeTmp[:n]...)`
			`}`
			`}`
			`return string(buf), nil`
			`}`

			`// unescapeChar takes a string input and returns the following info:`
			`//`
			`// value - the escaped unicode rune at the front of the string.`
			`// encode - the value should be unicode-encoded`
			`// tail - the remainder of the input string.`
			`// err - error value, if the character could not be unescaped.`
			`//`
			`// When encode is true the return value may still fit within a single byte,`
			`// but unicode encoding is attempted which is more expensive than when the`
			`// value is known to self-represent as a single byte.`
			`//`
			`// If isBytes is set, unescape as a bytes literal so octal and hex escapes`
			`// represent byte values, not unicode code points.`
			`func unescapeChar(s string, isBytes bool) (value rune, encode bool, tail string, err error) {`
			`// 1. Character is not an escape sequence.`
			`switch c := s[0]; {`
			`case c >= utf8.RuneSelf:`
			`r, size := utf8.DecodeRuneInString(s)`
			`return r, true, s[size:], nil`
			`case c != '\\':`
			`return rune(s[0]), false, s[1:], nil`
			`}`

			`// 2. Last character is the start of an escape sequence.`
			`if len(s) <= 1 {`
			`err = fmt.Errorf("unable to unescape string, found '\\' as last character")`
			`return`
			`}`

			`c := s[1]`
			`s = s[2:]`
			`// 3. Common escape sequences shared with Google SQL`
			`switch c {`
			`case 'a':`
			`value = '\a'`
			`case 'b':`
			`value = '\b'`
			`case 'f':`
			`value = '\f'`
			`case 'n':`
			`value = '\n'`
			`case 'r':`
			`value = '\r'`
			`case 't':`
			`value = '\t'`
			`case 'v':`
			`value = '\v'`
			`case '\\':`
			`value = '\\'`
			`case '\'':`
			`value = '\''`
			`case '"':`
			`value = '"'`
			case '`':
			value = '`'
			`case '?':`
			`value = '?'`

			// 4. Unicode escape sequences, reproduced from `strconv/quote.go`
			`case 'x', 'X', 'u', 'U':`
			`n := 0`
			`encode = true`
			`switch c {`
			`case 'x', 'X':`
			`n = 2`
			`encode = !isBytes`
			`case 'u':`
			`n = 4`
			`if isBytes {`
			`err = fmt.Errorf("unable to unescape string")`
			`return`
			`}`
			`case 'U':`
			`n = 8`
			`if isBytes {`
			`err = fmt.Errorf("unable to unescape string")`
			`return`
			`}`
			`}`
			`var v rune`
			`if len(s) < n {`
			`err = fmt.Errorf("unable to unescape string")`
			`return`
			`}`
			`for j := 0; j < n; j++ {`
			`x, ok := unhex(s[j])`
			`if !ok {`
			`err = fmt.Errorf("unable to unescape string")`
			`return`
			`}`
			`v = v<<4 \| x`
			`}`
			`s = s[n:]`
			`if !isBytes && v > utf8.MaxRune {`
			`err = fmt.Errorf("unable to unescape string")`
			`return`
			`}`
			`value = v`

			`// 5. Octal escape sequences, must be three digits \[0-3][0-7][0-7]`
			`case '0', '1', '2', '3':`
			`if len(s) < 2 {`
			`err = fmt.Errorf("unable to unescape octal sequence in string")`
			`return`
			`}`
			`v := rune(c - '0')`
			`for j := 0; j < 2; j++ {`
			`x := s[j]`
			`if x < '0' \|\| x > '7' {`
			`err = fmt.Errorf("unable to unescape octal sequence in string")`
			`return`
			`}`
			`v = v*8 + rune(x-'0')`
			`}`
			`if !isBytes && v > utf8.MaxRune {`
			`err = fmt.Errorf("unable to unescape string")`
			`return`
			`}`
			`value = v`
			`s = s[2:]`
			`encode = !isBytes`

			`// Unknown escape sequence.`
			`default:`
			`err = fmt.Errorf("unable to unescape string")`
			`}`

			`tail = s`
			`return`
			`}`

			`func unhex(b byte) (rune, bool) {`
			`c := rune(b)`
			`switch {`
			`case '0' <= c && c <= '9':`
			`return c - '0', true`
			`case 'a' <= c && c <= 'f':`
			`return c - 'a' + 10, true`
			`case 'A' <= c && c <= 'F':`
			`return c - 'A' + 10, true`
			`}`
			`return 0, false`
			`}`

			`var (`
			`newlineNormalizer = strings.NewReplacer("\r\n", "\n", "\r", "\n")`
			`)`