ext/strings.go - external/github.com/google/cel-go - Git at Google

 // Copyright 2020 Google LLC
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //      http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 // Package ext contains CEL extension libraries where each library defines a related set of
 // constants, functions, macros, or other configuration settings which may not be covered by
 // the core CEL spec.
 package ext

 import (
 	"fmt"
 	"math"
 	"reflect"
 	"strings"
 	"unicode"
 	"unicode/utf8"

 	"golang.org/x/text/language"

 	"github.com/google/cel-go/cel"
 	"github.com/google/cel-go/checker"
 	"github.com/google/cel-go/common"
 	"github.com/google/cel-go/common/types"
 	"github.com/google/cel-go/common/types/ref"
 	"github.com/google/cel-go/common/types/traits"
 	"github.com/google/cel-go/interpreter"
 )

 const (
 	defaultLocale    = "en-US"
 	defaultPrecision = 6
 )

 // Strings returns a cel.EnvOption to configure extended functions for string manipulation.
 // As a general note, all indices are zero-based.
 //
 // # CharAt
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns the character at the given position. If the position is negative, or greater than
 // the length of the string, the function will produce an error:
 //
 //	<string>.charAt(<int>) -> <string>
 //
 // Examples:
 //
 //	'hello'.charAt(4)  // return 'o'
 //	'hello'.charAt(5)  // return ''
 //	'hello'.charAt(-1) // error
 //
 // # Format
 //
 // Introduced at version: 1 (cost at version 5)
 //
 // Returns a new string with substitutions being performed, printf-style.
 // The valid formatting clauses are:
 //
 // `%s` - substitutes a string. This can also be used on bools, lists, maps, bytes,
 // Duration and Timestamp, in addition to all numerical types (int, uint, and double).
 // Note that the dot/period decimal separator will always be used when printing a list
 // or map that contains a double, and that null can be passed (which results in the
 // string "null") in addition to types.
 // `%d` - substitutes an integer.
 // `%f` - substitutes a double with fixed-point precision. The default precision is 6, but
 // this can be adjusted. The strings `Infinity`, `-Infinity`, and `NaN` are also valid input
 // for this clause.
 // `%e` - substitutes a double in scientific notation. The default precision is 6, but this
 // can be adjusted.
 // `%b` - substitutes an integer with its equivalent binary string. Can also be used on bools.
 // `%x` - substitutes an integer with its equivalent in hexadecimal, or if given a string or
 // bytes, will output each character's equivalent in hexadecimal.
 // `%X` - same as above, but with A-F capitalized.
 // `%o` - substitutes an integer with its equivalent in octal.
 //
 //	<string>.format(<list>) -> <string>
 //
 // Examples:
 //
 //	"this is a string: %s\nand an integer: %d".format(["str", 42]) // returns "this is a string: str\nand an integer: 42"
 //	"a double substituted with %%s: %s".format([64.2]) // returns "a double substituted with %s: 64.2"
 //	"string type: %s".format([type(string)]) // returns "string type: string"
 //	"timestamp: %s".format([timestamp("2023-02-03T23:31:20+00:00")]) // returns "timestamp: 2023-02-03T23:31:20Z"
 //	"duration: %s".format([duration("1h45m47s")]) // returns "duration: 6347s"
 //	"%f".format([3.14]) // returns "3.140000"
 //	"scientific notation: %e".format([2.71828]) // returns "scientific notation: 2.718280\u202f\u00d7\u202f10\u2070\u2070"
 //	"5 in binary: %b".format([5]), // returns "5 in binary; 101"
 //	"26 in hex: %x".format([26]), // returns "26 in hex: 1a"
 //	"26 in hex (uppercase): %X".format([26]) // returns "26 in hex (uppercase): 1A"
 //	"30 in octal: %o".format([30]) // returns "30 in octal: 36"
 //	"a map inside a list: %s".format([[1, 2, 3, {"a": "x", "b": "y", "c": "z"}]]) // returns "a map inside a list: [1, 2, 3, {"a":"x", "b":"y", "c":"d"}]"
 //	"true bool: %s - false bool: %s\nbinary bool: %b".format([true, false, true]) // returns "true bool: true - false bool: false\nbinary bool: 1"
 //
 // Passing an incorrect type (a string to `%b`) is considered an error, as well as attempting
 // to use more formatting clauses than there are arguments (`%d %d %d` while passing two ints, for instance).
 // If compile-time checking is enabled, and the formatting string is a constant, and the argument list is a literal,
 // then letting any arguments go unused/unformatted is also considered an error.
 //
 // # IndexOf
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns the integer index of the first occurrence of the search string. If the search string is
 // not found the function returns -1.
 //
 // The function also accepts an optional position from which to begin the substring search. If the
 // substring is the empty string, the index where the search starts is returned (zero or custom).
 //
 //	<string>.indexOf(<string>) -> <int>
 //	<string>.indexOf(<string>, <int>) -> <int>
 //
 // Examples:
 //
 //	'hello mellow'.indexOf('')         // returns 0
 //	'hello mellow'.indexOf('ello')     // returns 1
 //	'hello mellow'.indexOf('jello')    // returns -1
 //	'hello mellow'.indexOf('', 2)      // returns 2
 //	'hello mellow'.indexOf('ello', 2)  // returns 7
 //	'hello mellow'.indexOf('ello', 20) // returns -1
 //	'hello mellow'.indexOf('ello', -1) // error
 //
 // # Join
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns a new string where the elements of string list are concatenated.
 //
 // The function also accepts an optional separator which is placed between elements in the resulting string.
 //
 // <list<string>>.join() -> <string>
 // <list<string>>.join(<string>) -> <string>
 //
 // Examples:
 //
 //	['hello', 'mellow'].join() // returns 'hellomellow'
 //	['hello', 'mellow'].join(' ') // returns 'hello mellow'
 //	[].join() // returns ''
 //	[].join('/') // returns ''
 //
 // # LastIndexOf
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns the integer index at the start of the last occurrence of the search string. If the
 // search string is not found the function returns -1.
 //
 // The function also accepts an optional position which represents the last index to be
 // considered as the beginning of the substring match. If the substring is the empty string,
 // the index where the search starts is returned (string length or custom).
 //
 //	<string>.lastIndexOf(<string>) -> <int>
 //	<string>.lastIndexOf(<string>, <int>) -> <int>
 //
 // Examples:
 //
 //	'hello mellow'.lastIndexOf('')         // returns 12
 //	'hello mellow'.lastIndexOf('ello')     // returns 7
 //	'hello mellow'.lastIndexOf('jello')    // returns -1
 //	'hello mellow'.lastIndexOf('ello', 6)  // returns 1
 //	'hello mellow'.lastIndexOf('ello', 20) // returns -1
 //	'hello mellow'.lastIndexOf('ello', -1) // error
 //
 // # LowerAscii
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns a new string where all ASCII characters are lower-cased.
 //
 // This function does not perform Unicode case-mapping for characters outside the ASCII range.
 //
 //	<string>.lowerAscii() -> <string>
 //
 // Examples:
 //
 //	'TacoCat'.lowerAscii()      // returns 'tacocat'
 //	'TacoCÆt Xii'.lowerAscii()  // returns 'tacocÆt xii'
 //
 // # Strings.Quote
 //
 // Introduced in version: 1 (cost support in version 5)
 //
 // Takes the given string and makes it safe to print (without any formatting due to escape sequences).
 // If any invalid UTF-8 characters are encountered, they are replaced with \uFFFD.
 //
 // strings.quote(<string>)
 //
 // Examples:
 //
 // strings.quote('single-quote with "double quote"') // returns '"single-quote with \"double quote\""'
 // strings.quote("two escape sequences \a\n") // returns '"two escape sequences \\a\\n"'
 //
 // # Replace
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns a new string based on the target, which replaces the occurrences of a search string
 // with a replacement string if present. The function accepts an optional limit on the number of
 // substring replacements to be made.
 //
 // When the replacement limit is 0, the result is the original string. When the limit is a negative
 // number, the function behaves the same as replace all.
 //
 //	<string>.replace(<string>, <string>) -> <string>
 //	<string>.replace(<string>, <string>, <int>) -> <string>
 //
 // Examples:
 //
 //	'hello hello'.replace('he', 'we')     // returns 'wello wello'
 //	'hello hello'.replace('he', 'we', -1) // returns 'wello wello'
 //	'hello hello'.replace('he', 'we', 1)  // returns 'wello hello'
 //	'hello hello'.replace('he', 'we', 0)  // returns 'hello hello'
 //	'hello hello'.replace('', '_')  // returns '_h_e_l_l_o_ _h_e_l_l_o_'
 //	'hello hello'.replace('h', '')  // returns 'ello ello'
 //
 // # Split
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns a list of strings split from the input by the given separator. The function accepts
 // an optional argument specifying a limit on the number of substrings produced by the split.
 //
 // When the split limit is 0, the result is an empty list. When the limit is 1, the result is the
 // target string to split. When the limit is a negative number, the function behaves the same as
 // split all.
 //
 //	<string>.split(<string>) -> <list<string>>
 //	<string>.split(<string>, <int>) -> <list<string>>
 //
 // Examples:
 //
 //	'hello hello hello'.split(' ')     // returns ['hello', 'hello', 'hello']
 //	'hello hello hello'.split(' ', 0)  // returns []
 //	'hello hello hello'.split(' ', 1)  // returns ['hello hello hello']
 //	'hello hello hello'.split(' ', 2)  // returns ['hello', 'hello hello']
 //	'hello hello hello'.split(' ', -1) // returns ['hello', 'hello', 'hello']
 //
 // # Substring
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns the substring given a numeric range corresponding to character positions. Optionally
 // may omit the trailing range for a substring from a given character position until the end of
 // a string.
 //
 // Character offsets are 0-based with an inclusive start range and exclusive end range. It is an
 // error to specify an end range that is lower than the start range, or for either the start or end
 // index to be negative or exceed the string length.
 //
 //	<string>.substring(<int>) -> <string>
 //	<string>.substring(<int>, <int>) -> <string>
 //
 // Examples:
 //
 //	'tacocat'.substring(4)    // returns 'cat'
 //	'tacocat'.substring(0, 4) // returns 'taco'
 //	'tacocat'.substring(-1)   // error
 //	'tacocat'.substring(2, 1) // error
 //
 // # Trim
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns a new string which removes the leading and trailing whitespace in the target string.
 // The trim function uses the Unicode definition of whitespace which does not include the
 // zero-width spaces. See: https://en.wikipedia.org/wiki/Whitespace_character#Unicode
 //
 //	<string>.trim() -> <string>
 //
 // Examples:
 //
 //	'  \ttrim\n    '.trim() // returns 'trim'
 //
 // # UpperAscii
 //
 // Introduced at version: 0 (cost support in version 5)
 //
 // Returns a new string where all ASCII characters are upper-cased.
 //
 // This function does not perform Unicode case-mapping for characters outside the ASCII range.
 //
 //	<string>.upperAscii() -> <string>
 //
 // Examples:
 //
 //	'TacoCat'.upperAscii()      // returns 'TACOCAT'
 //	'TacoCÆt Xii'.upperAscii()  // returns 'TACOCÆT XII'
 //
 // # Reverse
 //
 // Introduced at version: 3 (cost support in version 5)
 //
 // Returns a new string whose characters are the same as the target string, only formatted in
 // reverse order.
 // This function relies on converting strings to rune arrays in order to reverse
 //
 //	<string>.reverse() -> <string>
 //
 // Examples:
 //
 //	'gums'.reverse() // returns 'smug'
 //	'John Smith'.reverse() // returns 'htimS nhoJ'
 //
 // Introduced at version: 4 (cost support in version 5)
 //
 // Formatting updated to adhere to https://github.com/google/cel-spec/blob/master/doc/extensions/strings.md.
 //
 // <string>.format(<list>) -> <string>
 func Strings(options ...StringsOption) cel.EnvOption {
 	s := &stringLib{
 		version: math.MaxUint32,
 	}
 	for _, o := range options {
 		s = o(s)
 	}
 	return cel.Lib(s)
 }

 type stringLib struct {
 	locale       string
 	version      uint32
 	maxPrecision int
 }

 // LibraryName implements the SingletonLibrary interface method.
 func (*stringLib) LibraryName() string {
 	return "cel.lib.ext.strings"
 }

 // StringsOption is a functional interface for configuring the strings library.
 type StringsOption func(*stringLib) *stringLib

 // StringsLocale configures the library with the given locale. The locale tag will
 // be checked for validity at the time that EnvOptions are configured. If this option
 // is not passed, string.format will behave as if en_US was passed as the locale.
 //
 // If StringsVersion is greater than or equal to 4, this option is ignored.
 func StringsLocale(locale string) StringsOption {
 	return func(sl *stringLib) *stringLib {
 		sl.locale = locale
 		return sl
 	}
 }

 // StringsVersion configures the version of the string library.
 //
 // The version limits which functions are available. Only functions introduced
 // below or equal to the given version included in the library. If this option
 // is not set, all functions are available.
 //
 // See the library documentation to determine which version a function was introduced.
 // If the documentation does not state which version a function was introduced, it can
 // be assumed to be introduced at version 0, when the library was first created.
 func StringsVersion(version uint32) StringsOption {
 	return func(lib *stringLib) *stringLib {
 		lib.version = version
 		return lib
 	}
 }

 // StringsValidateFormatCalls validates type-checked ASTs to ensure that string.format() calls have
 // valid formatting clauses and valid argument types for each clause.
 //
 // Deprecated
 func StringsValidateFormatCalls(value bool) StringsOption {
 	return func(s *stringLib) *stringLib {
 		return s
 	}
 }

 // StringsMaxPrecision configures the maximum precision for floating-point format clauses.
 //
 // If not set, the default is 100 for version >= 5, and no limit for earlier versions.
 func StringsMaxPrecision(limit int) StringsOption {
 	return func(lib *stringLib) *stringLib {
 		lib.maxPrecision = limit
 		return lib
 	}
 }

 // CompileOptions implements the Library interface method.
 func (lib *stringLib) CompileOptions() []cel.EnvOption {
 	formatLocale := "en_US"
 	if lib.version < 4 && lib.locale != "" {
 		// ensure locale is properly-formed if set
 		_, err := language.Parse(lib.locale)
 		if err != nil {
 			return []cel.EnvOption{
 				func(e *cel.Env) (*cel.Env, error) {
 					return nil, fmt.Errorf("failed to parse locale: %w", err)
 				},
 			}
 		}
 		formatLocale = lib.locale
 	}

 	opts := []cel.EnvOption{
 		cel.Function("charAt",
 			cel.MemberOverload("string_char_at_int", []*cel.Type{cel.StringType, cel.IntType}, cel.StringType,
 				cel.BinaryBinding(func(str, ind ref.Val) ref.Val {
 					s := str.(types.String)
 					i := ind.(types.Int)
 					return stringOrError(charAt(string(s), int64(i)))
 				}))),
 		cel.Function("indexOf",
 			cel.MemberOverload("string_index_of_string", []*cel.Type{cel.StringType, cel.StringType}, cel.IntType,
 				cel.BinaryBinding(func(str, substr ref.Val) ref.Val {
 					s := str.(types.String)
 					sub := substr.(types.String)
 					return intOrError(indexOf(string(s), string(sub)))
 				})),
 			cel.MemberOverload("string_index_of_string_int", []*cel.Type{cel.StringType, cel.StringType, cel.IntType}, cel.IntType,
 				cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 					s := args[0].(types.String)
 					sub := args[1].(types.String)
 					offset := args[2].(types.Int)
 					return intOrError(indexOfOffset(string(s), string(sub), int64(offset)))
 				}))),
 		cel.Function("lastIndexOf",
 			cel.MemberOverload("string_last_index_of_string", []*cel.Type{cel.StringType, cel.StringType}, cel.IntType,
 				cel.BinaryBinding(func(str, substr ref.Val) ref.Val {
 					s := str.(types.String)
 					sub := substr.(types.String)
 					return intOrError(lastIndexOf(string(s), string(sub)))
 				})),
 			cel.MemberOverload("string_last_index_of_string_int", []*cel.Type{cel.StringType, cel.StringType, cel.IntType}, cel.IntType,
 				cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 					s := args[0].(types.String)
 					sub := args[1].(types.String)
 					offset := args[2].(types.Int)
 					return intOrError(lastIndexOfOffset(string(s), string(sub), int64(offset)))
 				}))),
 		cel.Function("lowerAscii",
 			cel.MemberOverload("string_lower_ascii", []*cel.Type{cel.StringType}, cel.StringType,
 				cel.UnaryBinding(func(str ref.Val) ref.Val {
 					s := str.(types.String)
 					return stringOrError(lowerASCII(string(s)))
 				}))),
 		cel.Function("replace",
 			cel.MemberOverload(
 				"string_replace_string_string", []*cel.Type{cel.StringType, cel.StringType, cel.StringType}, cel.StringType,
 				cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 					str := args[0].(types.String)
 					old := args[1].(types.String)
 					new := args[2].(types.String)
 					return stringOrError(replace(string(str), string(old), string(new)))
 				})),
 			cel.MemberOverload(
 				"string_replace_string_string_int", []*cel.Type{cel.StringType, cel.StringType, cel.StringType, cel.IntType}, cel.StringType,
 				cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 					str := args[0].(types.String)
 					old := args[1].(types.String)
 					new := args[2].(types.String)
 					n := args[3].(types.Int)
 					return stringOrError(replaceN(string(str), string(old), string(new), int64(n)))
 				}))),
 		cel.Function("split",
 			cel.MemberOverload("string_split_string", []*cel.Type{cel.StringType, cel.StringType}, cel.ListType(cel.StringType),
 				cel.BinaryBinding(func(str, separator ref.Val) ref.Val {
 					s := str.(types.String)
 					sep := separator.(types.String)
 					return listStringOrError(split(string(s), string(sep)))
 				})),
 			cel.MemberOverload("string_split_string_int", []*cel.Type{cel.StringType, cel.StringType, cel.IntType}, cel.ListType(cel.StringType),
 				cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 					s := args[0].(types.String)
 					sep := args[1].(types.String)
 					n := args[2].(types.Int)
 					return listStringOrError(splitN(string(s), string(sep), int64(n)))
 				}))),
 		cel.Function("substring",
 			cel.MemberOverload("string_substring_int", []*cel.Type{cel.StringType, cel.IntType}, cel.StringType,
 				cel.BinaryBinding(func(str, offset ref.Val) ref.Val {
 					s := str.(types.String)
 					off := offset.(types.Int)
 					return stringOrError(substr(string(s), int64(off)))
 				})),
 			cel.MemberOverload("string_substring_int_int", []*cel.Type{cel.StringType, cel.IntType, cel.IntType}, cel.StringType,
 				cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 					s := args[0].(types.String)
 					start := args[1].(types.Int)
 					end := args[2].(types.Int)
 					return stringOrError(substrRange(string(s), int64(start), int64(end)))
 				}))),
 		cel.Function("trim",
 			cel.MemberOverload("string_trim", []*cel.Type{cel.StringType}, cel.StringType,
 				cel.UnaryBinding(func(str ref.Val) ref.Val {
 					s := str.(types.String)
 					return stringOrError(trimSpace(string(s)))
 				}))),
 		cel.Function("upperAscii",
 			cel.MemberOverload("string_upper_ascii", []*cel.Type{cel.StringType}, cel.StringType,
 				cel.UnaryBinding(func(str ref.Val) ref.Val {
 					s := str.(types.String)
 					return stringOrError(upperASCII(string(s)))
 				}))),
 	}
 	// maxPrecision is unbounded (0) for versions < 5 to maintain backward
 	// compatibility. For version >= 5, the default is 100 if not explicitly
 	// configured via StringsMaxPrecision().
 	maxPrecision := lib.maxPrecision
 	if maxPrecision == 0 && lib.version >= 5 {
 		maxPrecision = 100
 	}
 	if lib.version >= 1 {
 		if lib.version >= 4 {
 			opts = append(opts, cel.Function("format",
 				cel.MemberOverload("string_format", []*cel.Type{cel.StringType, cel.ListType(cel.DynType)}, cel.StringType,
 					cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 						s := string(args[0].(types.String))
 						formatArgs := args[1].(traits.Lister)
 						return stringOrError(parseFormatStringV2(s, &stringFormatterV2{}, &stringArgList{formatArgs}, maxPrecision))
 					}))))
 		} else {
 			opts = append(opts, cel.Function("format",
 				cel.MemberOverload("string_format", []*cel.Type{cel.StringType, cel.ListType(cel.DynType)}, cel.StringType,
 					cel.FunctionBinding(func(args ...ref.Val) ref.Val {
 						s := string(args[0].(types.String))
 						formatArgs := args[1].(traits.Lister)
 						return stringOrError(parseFormatString(s, &stringFormatter{}, &stringArgList{formatArgs}, formatLocale, maxPrecision))
 					}))))
 		}
 		opts = append(opts,
 			cel.Function("strings.quote", cel.Overload("strings_quote", []*cel.Type{cel.StringType}, cel.StringType,
 				cel.UnaryBinding(func(str ref.Val) ref.Val {
 					s := str.(types.String)
 					return stringOrError(quote(string(s)))
 				}))))
 	}
 	if lib.version >= 2 {
 		opts = append(opts,
 			cel.Function("join",
 				cel.MemberOverload("list_join", []*cel.Type{cel.ListType(cel.StringType)}, cel.StringType,
 					cel.UnaryBinding(func(list ref.Val) ref.Val {
 						l := list.(traits.Lister)
 						return stringOrError(joinValSeparator(l, ""))
 					})),
 				cel.MemberOverload("list_join_string", []*cel.Type{cel.ListType(cel.StringType), cel.StringType}, cel.StringType,
 					cel.BinaryBinding(func(list, delim ref.Val) ref.Val {
 						l := list.(traits.Lister)
 						d := delim.(types.String)
 						return stringOrError(joinValSeparator(l, string(d)))
 					}))),
 		)
 	} else {
 		opts = append(opts,
 			cel.Function("join",
 				cel.MemberOverload("list_join", []*cel.Type{cel.ListType(cel.StringType)}, cel.StringType,
 					cel.UnaryBinding(func(list ref.Val) ref.Val {
 						l, err := list.ConvertToNative(stringListType)
 						if err != nil {
 							return types.WrapErr(err)
 						}
 						return stringOrError(join(l.([]string)))
 					})),
 				cel.MemberOverload("list_join_string", []*cel.Type{cel.ListType(cel.StringType), cel.StringType}, cel.StringType,
 					cel.BinaryBinding(func(list, delim ref.Val) ref.Val {
 						l, err := list.ConvertToNative(stringListType)
 						if err != nil {
 							return types.WrapErr(err)
 						}
 						d := delim.(types.String)
 						return stringOrError(joinSeparator(l.([]string), string(d)))
 					}))),
 		)
 	}
 	if lib.version >= 3 {
 		opts = append(opts,
 			cel.Function("reverse",
 				cel.MemberOverload("string_reverse", []*cel.Type{cel.StringType}, cel.StringType,
 					cel.UnaryBinding(func(str ref.Val) ref.Val {
 						s := str.(types.String)
 						return stringOrError(reverse(string(s)))
 					}))),
 		)
 	}
 	if lib.version >= 1 {
 		if lib.version >= 4 {
 			opts = append(opts, cel.ASTValidators(stringFormatValidatorV2{maxPrecision: maxPrecision}))
 		} else {
 			opts = append(opts, cel.ASTValidators(stringFormatValidator{maxPrecision: maxPrecision}))
 		}
 	}

 	if lib.version >= 5 {
 		// Cost estimators for string extension functions.
 		estimators := []checker.CostOption{
 			// Format is captured in the core cost estimator logic and needs to be extracted out.
 			checker.OverloadCostEstimate("string_char_at_int", estimateStringCharAtCost),
 			checker.OverloadCostEstimate("string_index_of_string", estimateStringSearchCost),
 			checker.OverloadCostEstimate("string_index_of_string_int", estimateStringSearchCost),
 			checker.OverloadCostEstimate("string_last_index_of_string", estimateStringSearchCost),
 			checker.OverloadCostEstimate("string_last_index_of_string_int", estimateStringSearchCost),
 			checker.OverloadCostEstimate("string_lower_ascii", estimateStringFixedTransformCost),
 			checker.OverloadCostEstimate("string_upper_ascii", estimateStringFixedTransformCost),
 			checker.OverloadCostEstimate("string_replace_string_string", estimateStringReplaceCost),
 			checker.OverloadCostEstimate("string_replace_string_string_int", estimateStringReplaceCost),
 			checker.OverloadCostEstimate("string_split_string", estimateStringSplitCost),
 			checker.OverloadCostEstimate("string_split_string_int", estimateStringSplitCost),
 			checker.OverloadCostEstimate("string_substring_int", estimateSubstringCost),
 			checker.OverloadCostEstimate("string_substring_int_int", estimateSubstringCost),
 			checker.OverloadCostEstimate("string_trim", estimateStringVariableTransformCost),
 			checker.OverloadCostEstimate("string_reverse", estimateStringFixedTransformCost),
 			checker.OverloadCostEstimate("list_join", estimateStringJoinCost),
 			checker.OverloadCostEstimate("list_join_string", estimateStringJoinCost),
 		}
 		opts = append(opts, cel.CostEstimatorOptions(estimators...))
 	}
 	return opts
 }

 // ProgramOptions implements the Library interface method.
 func (lib *stringLib) ProgramOptions() []cel.ProgramOption {
 	if lib.version >= 5 {
 		return []cel.ProgramOption{
 			cel.CostTrackerOptions(
 				interpreter.OverloadCostTracker("string_char_at_int", trackStringCharAtCost),
 				interpreter.OverloadCostTracker("string_index_of_string", trackStringSearchCost),
 				interpreter.OverloadCostTracker("string_index_of_string_int", trackStringSearchCost),
 				interpreter.OverloadCostTracker("string_last_index_of_string", trackStringSearchCost),
 				interpreter.OverloadCostTracker("string_last_index_of_string_int", trackStringSearchCost),
 				interpreter.OverloadCostTracker("string_lower_ascii", trackStringTransformCost),
 				interpreter.OverloadCostTracker("string_upper_ascii", trackStringTransformCost),
 				interpreter.OverloadCostTracker("string_replace_string_string", trackStringReplaceCost),
 				interpreter.OverloadCostTracker("string_replace_string_string_int", trackStringReplaceCost),
 				interpreter.OverloadCostTracker("string_split_string", trackStringSplitCost),
 				interpreter.OverloadCostTracker("string_split_string_int", trackStringSplitCost),
 				interpreter.OverloadCostTracker("string_substring_int", trackStringTransformCost),
 				interpreter.OverloadCostTracker("string_substring_int_int", trackStringTransformCost),
 				interpreter.OverloadCostTracker("string_trim", trackStringTransformCost),
 				interpreter.OverloadCostTracker("string_reverse", trackStringTransformCost),
 				interpreter.OverloadCostTracker("list_join", trackStringJoinCost),
 				interpreter.OverloadCostTracker("list_join_string", trackStringJoinCost),
 			),
 		}
 	}
 	return []cel.ProgramOption{}
 }

 func charAt(str string, ind int64) (string, error) {
 	i := int(ind)
 	runes := []rune(str)
 	if i < 0 || i > len(runes) {
 		return "", fmt.Errorf("index out of range: %d", ind)
 	}
 	if i == len(runes) {
 		return "", nil
 	}
 	return string(runes[i]), nil
 }

 func indexOf(str, substr string) (int64, error) {
 	return indexOfOffset(str, substr, int64(0))
 }

 func indexOfOffset(str, substr string, offset int64) (int64, error) {
 	if substr == "" {
 		return offset, nil
 	}
 	off := int(offset)
 	runes := []rune(str)
 	subrunes := []rune(substr)
 	if off < 0 {
 		return -1, fmt.Errorf("index out of range: %d", off)
 	}
 	// If the offset exceeds the length, return -1 rather than error.
 	if off >= len(runes) {
 		return -1, nil
 	}
 	for i := off; i < len(runes)-(len(subrunes)-1); i++ {
 		found := true
 		for j := 0; j < len(subrunes); j++ {
 			if runes[i+j] != subrunes[j] {
 				found = false
 				break
 			}
 		}
 		if found {
 			return int64(i), nil
 		}
 	}
 	return -1, nil
 }

 func lastIndexOf(str, substr string) (int64, error) {
 	runes := []rune(str)
 	if substr == "" {
 		return int64(len(runes)), nil
 	}

 	if len(str) < len(substr) {
 		return -1, nil
 	}
 	return lastIndexOfOffset(str, substr, int64(len(runes)-1))
 }

 func lastIndexOfOffset(str, substr string, offset int64) (int64, error) {
 	if substr == "" {
 		return offset, nil
 	}
 	off := int(offset)
 	runes := []rune(str)
 	subrunes := []rune(substr)
 	if off < 0 {
 		return -1, fmt.Errorf("index out of range: %d", off)
 	}
 	// If the offset is far greater than the length return -1
 	if off >= len(runes) {
 		return -1, nil
 	}
 	if off > len(runes)-len(subrunes) {
 		off = len(runes) - len(subrunes)
 	}
 	for i := off; i >= 0; i-- {
 		found := true
 		for j := 0; j < len(subrunes); j++ {
 			if runes[i+j] != subrunes[j] {
 				found = false
 				break
 			}
 		}
 		if found {
 			return int64(i), nil
 		}
 	}
 	return -1, nil
 }

 func lowerASCII(str string) (string, error) {
 	runes := []rune(str)
 	for i, r := range runes {
 		if r <= unicode.MaxASCII {
 			r = unicode.ToLower(r)
 			runes[i] = r
 		}
 	}
 	return string(runes), nil
 }

 func replace(str, old, new string) (string, error) {
 	return strings.ReplaceAll(str, old, new), nil
 }

 func replaceN(str, old, new string, n int64) (string, error) {
 	return strings.Replace(str, old, new, int(n)), nil
 }

 func split(str, sep string) ([]string, error) {
 	return strings.Split(str, sep), nil
 }

 func splitN(str, sep string, n int64) ([]string, error) {
 	return strings.SplitN(str, sep, int(n)), nil
 }

 func substr(str string, start int64) (string, error) {
 	runes := []rune(str)
 	if int(start) < 0 || int(start) > len(runes) {
 		return "", fmt.Errorf("index out of range: %d", start)
 	}
 	return string(runes[start:]), nil
 }

 func substrRange(str string, start, end int64) (string, error) {
 	runes := []rune(str)
 	l := len(runes)
 	if start > end {
 		return "", fmt.Errorf("invalid substring range. start: %d, end: %d", start, end)
 	}
 	if int(start) < 0 || int(start) > l {
 		return "", fmt.Errorf("index out of range: %d", start)
 	}
 	if int(end) < 0 || int(end) > l {
 		return "", fmt.Errorf("index out of range: %d", end)
 	}
 	return string(runes[int(start):int(end)]), nil
 }

 func trimSpace(str string) (string, error) {
 	return strings.TrimSpace(str), nil
 }

 func upperASCII(str string) (string, error) {
 	runes := []rune(str)
 	for i, r := range runes {
 		if r <= unicode.MaxASCII {
 			r = unicode.ToUpper(r)
 			runes[i] = r
 		}
 	}
 	return string(runes), nil
 }

 func reverse(str string) (string, error) {
 	chars := []rune(str)
 	for i, j := 0, len(chars)-1; i < j; i, j = i+1, j-1 {
 		chars[i], chars[j] = chars[j], chars[i]
 	}
 	return string(chars), nil
 }

 func joinSeparator(strs []string, separator string) (string, error) {
 	return strings.Join(strs, separator), nil
 }

 func join(strs []string) (string, error) {
 	return strings.Join(strs, ""), nil
 }

 func joinValSeparator(strs traits.Lister, separator string) (string, error) {
 	sz := strs.Size().(types.Int)
 	var sb strings.Builder
 	for i := types.Int(0); i < sz; i++ {
 		if i != 0 {
 			sb.WriteString(separator)
 		}
 		elem := strs.Get(i)
 		str, ok := elem.(types.String)
 		if !ok {
 			return "", fmt.Errorf("join: invalid input: %v", elem)
 		}
 		sb.WriteString(string(str))
 	}
 	return sb.String(), nil
 }

 // quote implements a string quoting function. The string will be wrapped in
 // double quotes, and all valid CEL escape sequences will be escaped to show up
 // literally if printed. If the input contains any invalid UTF-8, the invalid runes
 // will be replaced with utf8.RuneError.
 func quote(s string) (string, error) {
 	var quotedStrBuilder strings.Builder
 	for _, c := range sanitize(s) {
 		switch c {
 		case '\a':
 			quotedStrBuilder.WriteString("\\a")
 		case '\b':
 			quotedStrBuilder.WriteString("\\b")
 		case '\f':
 			quotedStrBuilder.WriteString("\\f")
 		case '\n':
 			quotedStrBuilder.WriteString("\\n")
 		case '\r':
 			quotedStrBuilder.WriteString("\\r")
 		case '\t':
 			quotedStrBuilder.WriteString("\\t")
 		case '\v':
 			quotedStrBuilder.WriteString("\\v")
 		case '\\':
 			quotedStrBuilder.WriteString("\\\\")
 		case '"':
 			quotedStrBuilder.WriteString("\\\"")
 		default:
 			quotedStrBuilder.WriteRune(c)
 		}
 	}
 	escapedStr := quotedStrBuilder.String()
 	return "\"" + escapedStr + "\"", nil
 }

 // sanitize replaces all invalid runes in the given string with utf8.RuneError.
 func sanitize(s string) string {
 	var sanitizedStringBuilder strings.Builder
 	for _, r := range s {
 		if !utf8.ValidRune(r) {
 			sanitizedStringBuilder.WriteRune(utf8.RuneError)
 		} else {
 			sanitizedStringBuilder.WriteRune(r)
 		}
 	}
 	return sanitizedStringBuilder.String()
 }

 var (
 	stringListType = reflect.TypeFor[[]string]()
 )

 // Cost estimation functions for string extensions.
 //
 // These functions provide compile-time cost estimates proportional to the size of
 // the input string(s), ensuring that the CEL cost system accurately reflects the
 // computational work performed by string operations.

 // estimateStringFixedTransformCost estimates cost for O(n) string operations such as
 // lowerAscii, upperAsciil, reverse and quote.
 func estimateStringFixedTransformCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil {
 		return nil
 	}
 	cost, size := estimateStringScan(estimateSize(estimator, *target))
 	return callEstimate(cost.Add(callCostEstimate).Add(size.AsCost()), size)
 }

 // estimateStringVariableTransformCost estimates cost for O(n) string operations that result
 // in a variable sized string which may be empty to the exact input string.
 func estimateStringVariableTransformCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil {
 		return nil
 	}
 	cost, size := estimateStringScan(estimateSize(estimator, *target))
 	transformSize := rangedSizeEstimate(0, size.Max)
 	return callEstimate(cost.Add(callCostEstimate).Add(transformSize.AsCost()), &transformSize)
 }

 // estimateStringCharAtCost includes a cost of 1 for the allocation, plus the string traversal cost.
 func estimateStringCharAtCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil || len(args) != 1 {
 		return nil
 	}
 	cost, _ := estimateStringScan(estimateSize(estimator, *target))
 	resultSize := rangedSizeEstimate(0, 1)
 	return callEstimate(cost.Add(callCostEstimate).Add(callCostEstimate), &resultSize)
 }

 // estimateSubstringCost estimates the cost for an O(n) traversal and allocation.
 func estimateSubstringCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil || len(args) < 1 || len(args) > 2 {
 		return nil
 	}
 	targetSize := estimateSize(estimator, *target)
 	cost, _ := estimateStringScan(targetSize)

 	start := nodeAsUintValue(args[0], 0)
 	end := targetSize.Max
 	if len(args) == 2 {
 		end = nodeAsUintValue(args[1], end)
 	}
 	resultSize := fixedSizeEstimate(end - start)
 	return callEstimate(cost.Add(callCostEstimate).Add(resultSize.AsCost()), &resultSize)
 }

 // estimateStringSearchCost estimates cost for O(n*m) string search operations
 // such as indexOf and lastIndexOf.
 func estimateStringSearchCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil || len(args) < 1 {
 		return nil
 	}
 	targetSize := estimateSize(estimator, *target)
 	needleSize := estimateSize(estimator, args[0])
 	searchSize := targetSize.Multiply(needleSize)
 	searchCost, _ := estimateStringScan(searchSize)
 	// Search cost is proportional to target size * substring size.
 	return callEstimate(searchCost.Add(callCostEstimate), nil)
 }

 // estimateStringReplaceCost estimates cost for string replace operations.
 // The cost accounts for search (O(n*m)) and potential output size growth.
 func estimateStringReplaceCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil || len(args) < 2 {
 		return nil
 	}
 	// Compute the search for the replacement string, by 'm' times
 	targetSize := estimateSize(estimator, *target)
 	needleSize := atLeastOne(estimateSize(estimator, args[0]))
 	searchCost := atLeastOne(targetSize).Multiply(needleSize).MultiplyByCostFactor(stringCostFactor)

 	replacementSize := estimateSize(estimator, args[1]).Add(fixedSizeEstimate(1))
 	allReplacedSize := safeMul(safeAdd(targetSize.Max, 1), replacementSize.Max)
 	resultMinSize := targetSize.Min
 	if resultMinSize > replacementSize.Min {
 		resultMinSize = replacementSize.Min
 	}
 	resultSize := rangedSizeEstimate(resultMinSize, allReplacedSize)
 	return callEstimate(
 		searchCost.Add(resultSize.AsCost()).Add(callCostEstimate), &resultSize,
 	)
 }

 // estimateStringSplitCost estimates cost for string split operations.
 // Split creates a list of substrings, so cost includes both traversal and
 // list allocation proportional to the input size.
 func estimateStringSplitCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil || len(args) < 1 {
 		return nil
 	}
 	targetSize := estimateSize(estimator, *target)
 	// Traversal cost proportional to input size.
 	traversalCost := targetSize.Add(fixedSizeEstimate(1)).MultiplyByCostFactor(stringCostFactor)
 	// Worst case: split("") produces N elements for a string of size N.
 	resultSize := rangedSizeEstimate(0, targetSize.Max)
 	// Include list creation base cost plus allocation for each element.
 	allocationCost := resultSize.MultiplyByCostFactor(1).Add(checker.FixedCostEstimate(common.ListCreateBaseCost))
 	cost := traversalCost.Add(allocationCost).Add(callCostEstimate)
 	return callEstimate(cost, &resultSize)
 }

 // estimateStringJoinCost estimates cost for string join operations.
 // Join iterates over all list elements and concatenates them, so cost is
 // proportional to the total size of all elements plus separator overhead.
 func estimateStringJoinCost(estimator checker.CostEstimator, target *checker.AstNode, args []checker.AstNode) *checker.CallEstimate {
 	if target == nil {
 		return nil
 	}
 	targetSize := estimateSize(estimator, *target)
 	sepSize := fixedSizeEstimate(0)
 	if len(args) >= 1 {
 		sepSize = estimateSize(estimator, args[0])
 	}
 	// Traversal cost proportional to the number of list elements.
 	traversalCost := targetSize.Add(fixedSizeEstimate(1)).MultiplyByCostFactor(stringCostFactor)
 	// Result size: sum of element sizes + (n-1) * separator size.
 	// Worst case estimate: use list size * max element size + list size * separator size.
 	maxResultSize := safeAdd(safeMul(targetSize.Max, (safeAdd(1, sepSize.Max))), sepSize.Max)
 	resultSize := rangedSizeEstimate(0, maxResultSize)
 	cost := traversalCost.Add(resultSize.MultiplyByCostFactor(1)).Add(callCostEstimate)
 	return callEstimate(cost, &resultSize)
 }

 // Runtime cost tracking functions for string extensions.
 //
 // These functions compute the actual cost of string operations after evaluation,
 // using the real sizes of the inputs and outputs.

 // trackStringCharAtCost tracks runtime cost for O(n) string operations.
 func trackStringCharAtCost(args []ref.Val, result ref.Val) *uint64 {
 	size := float64(actualSize(args[0])) * stringCostFactor
 	cost := safeAdd(callCost, uint64(math.Ceil(size)), 1)
 	return &cost
 }

 // trackStringTransformCost tracks runtime cost for O(n) string operations.
 func trackStringTransformCost(args []ref.Val, result ref.Val) *uint64 {
 	transformCost := math.Ceil(float64(actualSize(args[0])) * stringCostFactor)
 	resultSize := actualSize(result)
 	cost := safeAdd(callCost, uint64(transformCost), resultSize)
 	return &cost
 }

 // trackStringSearchCost tracks runtime cost for O(n*m) string search operations.
 func trackStringSearchCost(args []ref.Val, _ ref.Val) *uint64 {
 	searchCost := float64(actualSize(args[0])*actualSize(args[1])) * stringCostFactor
 	cost := safeAdd(uint64(math.Ceil(searchCost)), callCost)
 	return &cost
 }

 // trackStringReplaceCost tracks runtime cost for string replace operations,
 // accounting for search cost and the size of the result.
 func trackStringReplaceCost(args []ref.Val, result ref.Val) *uint64 {
 	targetSize := actualSize(args[0])
 	if targetSize == 0 {
 		targetSize = 1
 	}
 	needleSize := actualSize(args[1])
 	if needleSize == 0 {
 		needleSize = 1
 	}
 	searchCost := uint64(math.Ceil(float64(targetSize*needleSize) * stringCostFactor))
 	cost := safeAdd(callCost, searchCost, actualSize(result))
 	return &cost
 }

 // trackStringSplitCost tracks runtime cost for string split operations,
 // accounting for traversal and list allocation.
 func trackStringSplitCost(args []ref.Val, result ref.Val) *uint64 {
 	traversalCost := float64(safeAdd(actualSize(args[0]), 1)) * stringCostFactor
 	resultSize := actualSize(result)
 	cost := safeAdd(callCost, uint64(math.Ceil(traversalCost)), resultSize, common.ListCreateBaseCost)
 	return &cost
 }

 // trackStringJoinCost tracks runtime cost for string join operations,
 // accounting for traversal and the size of the result.
 func trackStringJoinCost(args []ref.Val, result ref.Val) *uint64 {
 	traversalCost := float64(safeAdd(actualSize(args[0]), 1)) * stringCostFactor
 	cost := safeAdd(callCost, uint64(math.Ceil(traversalCost)), actualSize(result))
 	return &cost
 }