| // Package kvfile provides utilities to parse line-delimited key/value files |
| // such as used for label-files and env-files. |
| // |
| // # File format |
| // |
| // key/value files use the following syntax: |
| // |
| // - File must be valid UTF-8. |
| // - BOM headers are removed. |
| // - Leading whitespace is removed for each line. |
| // - Lines starting with "#" are ignored. |
| // - Empty lines are ignored. |
| // - Key/Value pairs are provided as "KEY[=<VALUE>]". |
| // - Maximum line-length is limited to [bufio.MaxScanTokenSize]. |
| // |
| // # Interpolation, substitution, and escaping |
| // |
| // Both keys and values are used as-is; no interpolation, substitution or |
| // escaping is supported, and quotes are considered part of the key or value. |
| // Whitespace in values (including leading and trailing) is preserved. Given |
| // that the file format is line-delimited, neither key, nor value, can contain |
| // newlines. |
| // |
| // # Key/Value pairs |
| // |
| // Key/Value pairs take the following format: |
| // |
| // KEY[=<VALUE>] |
| // |
| // KEY is required and may not contain whitespaces or NUL characters. Any |
| // other character (except for the "=" delimiter) are accepted, but it is |
| // recommended to use a subset of the POSIX portable character set, as |
| // outlined in [Environment Variables]. |
| // |
| // VALUE is optional, but may be empty. If no value is provided (i.e., no |
| // equal sign ("=") is present), the KEY is omitted in the result, but some |
| // functions accept a lookup-function to provide a default value for the |
| // given key. |
| // |
| // [Environment Variables]: https://pubs.opengroup.org/onlinepubs/7908799/xbd/envvar.html |
| package kvfile |
| |
| import ( |
| "bufio" |
| "bytes" |
| "fmt" |
| "io" |
| "os" |
| "strings" |
| "unicode" |
| "unicode/utf8" |
| ) |
| |
| // Parse parses a line-delimited key/value pairs separated by equal sign. |
| // It accepts a lookupFn to lookup default values for keys that do not define |
| // a value. An error is produced if parsing failed, the content contains invalid |
| // UTF-8 characters, or a key contains whitespaces. |
| func Parse(filename string, lookupFn func(key string) (value string, found bool)) ([]string, error) { |
| fh, err := os.Open(filename) |
| if err != nil { |
| return []string{}, err |
| } |
| out, err := parseKeyValueFile(fh, lookupFn) |
| _ = fh.Close() |
| if err != nil { |
| return []string{}, fmt.Errorf("invalid env file (%s): %v", filename, err) |
| } |
| return out, nil |
| } |
| |
| // ParseFromReader parses a line-delimited key/value pairs separated by equal sign. |
| // It accepts a lookupFn to lookup default values for keys that do not define |
| // a value. An error is produced if parsing failed, the content contains invalid |
| // UTF-8 characters, or a key contains whitespaces. |
| func ParseFromReader(r io.Reader, lookupFn func(key string) (value string, found bool)) ([]string, error) { |
| return parseKeyValueFile(r, lookupFn) |
| } |
| |
| const whiteSpaces = " \t" |
| |
| func parseKeyValueFile(r io.Reader, lookupFn func(string) (string, bool)) ([]string, error) { |
| lines := []string{} |
| scanner := bufio.NewScanner(r) |
| utf8bom := []byte{0xEF, 0xBB, 0xBF} |
| for currentLine := 1; scanner.Scan(); currentLine++ { |
| scannedBytes := scanner.Bytes() |
| if !utf8.Valid(scannedBytes) { |
| return []string{}, fmt.Errorf("invalid utf8 bytes at line %d: %v", currentLine, scannedBytes) |
| } |
| // We trim UTF8 BOM |
| if currentLine == 1 { |
| scannedBytes = bytes.TrimPrefix(scannedBytes, utf8bom) |
| } |
| // trim the line from all leading whitespace first. trailing whitespace |
| // is part of the value, and is kept unmodified. |
| line := strings.TrimLeftFunc(string(scannedBytes), unicode.IsSpace) |
| |
| if len(line) == 0 || line[0] == '#' { |
| // skip empty lines and comments (lines starting with '#') |
| continue |
| } |
| |
| key, _, hasValue := strings.Cut(line, "=") |
| if len(key) == 0 { |
| return []string{}, fmt.Errorf("no variable name on line '%s'", line) |
| } |
| |
| // leading whitespace was already removed from the line, but |
| // variables are not allowed to contain whitespace or have |
| // trailing whitespace. |
| if strings.ContainsAny(key, whiteSpaces) { |
| return []string{}, fmt.Errorf("variable '%s' contains whitespaces", key) |
| } |
| |
| if hasValue { |
| // key/value pair is valid and has a value; add the line as-is. |
| lines = append(lines, line) |
| continue |
| } |
| |
| if lookupFn != nil { |
| // No value given; try to look up the value. The value may be |
| // empty but if no value is found, the key is omitted. |
| if value, found := lookupFn(line); found { |
| lines = append(lines, key+"="+value) |
| } |
| } |
| } |
| return lines, scanner.Err() |
| } |