123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156 |
- package shellquote
- import (
- "bytes"
- "errors"
- "strings"
- "unicode/utf8"
- )
- var (
- UnterminatedSingleQuoteError = errors.New("Unterminated single-quoted string")
- UnterminatedDoubleQuoteError = errors.New("Unterminated double-quoted string")
- UnterminatedEscapeError = errors.New("Unterminated backslash-escape")
- )
- var (
- splitChars = " \n\t"
- singleChar = '\''
- doubleChar = '"'
- escapeChar = '\\'
- doubleEscapeChars = "$`\"\n\\"
- )
- // Split splits a string according to /bin/sh's word-splitting rules. It
- // supports backslash-escapes, single-quotes, and double-quotes. Notably it does
- // not support the $'' style of quoting. It also doesn't attempt to perform any
- // other sort of expansion, including brace expansion, shell expansion, or
- // pathname expansion.
- //
- // If the given input has an unterminated quoted string or ends in a
- // backslash-escape, one of UnterminatedSingleQuoteError,
- // UnterminatedDoubleQuoteError, or UnterminatedEscapeError is returned.
- func Split(input string) (words []string, err error) {
- var buf bytes.Buffer
- words = make([]string, 0)
- for len(input) > 0 {
- // skip any splitChars at the start
- c, l := utf8.DecodeRuneInString(input)
- if strings.ContainsRune(splitChars, c) {
- input = input[l:]
- continue
- } else if c == escapeChar {
- // Look ahead for escaped newline so we can skip over it
- next := input[l:]
- if len(next) == 0 {
- err = UnterminatedEscapeError
- return
- }
- c2, l2 := utf8.DecodeRuneInString(next)
- if c2 == '\n' {
- input = next[l2:]
- continue
- }
- }
- var word string
- word, input, err = splitWord(input, &buf)
- if err != nil {
- return
- }
- words = append(words, word)
- }
- return
- }
- func splitWord(input string, buf *bytes.Buffer) (word string, remainder string, err error) {
- buf.Reset()
- raw:
- {
- cur := input
- for len(cur) > 0 {
- c, l := utf8.DecodeRuneInString(cur)
- cur = cur[l:]
- if c == singleChar {
- buf.WriteString(input[0 : len(input)-len(cur)-l])
- input = cur
- goto single
- } else if c == doubleChar {
- buf.WriteString(input[0 : len(input)-len(cur)-l])
- input = cur
- goto double
- } else if c == escapeChar {
- buf.WriteString(input[0 : len(input)-len(cur)-l])
- input = cur
- goto escape
- } else if strings.ContainsRune(splitChars, c) {
- buf.WriteString(input[0 : len(input)-len(cur)-l])
- return buf.String(), cur, nil
- }
- }
- if len(input) > 0 {
- buf.WriteString(input)
- input = ""
- }
- goto done
- }
- escape:
- {
- if len(input) == 0 {
- return "", "", UnterminatedEscapeError
- }
- c, l := utf8.DecodeRuneInString(input)
- if c == '\n' {
- // a backslash-escaped newline is elided from the output entirely
- } else {
- buf.WriteString(input[:l])
- }
- input = input[l:]
- }
- goto raw
- single:
- {
- i := strings.IndexRune(input, singleChar)
- if i == -1 {
- return "", "", UnterminatedSingleQuoteError
- }
- buf.WriteString(input[0:i])
- input = input[i+1:]
- goto raw
- }
- double:
- {
- cur := input
- for len(cur) > 0 {
- c, l := utf8.DecodeRuneInString(cur)
- cur = cur[l:]
- if c == doubleChar {
- buf.WriteString(input[0 : len(input)-len(cur)-l])
- input = cur
- goto raw
- } else if c == escapeChar {
- // bash only supports certain escapes in double-quoted strings
- c2, l2 := utf8.DecodeRuneInString(cur)
- cur = cur[l2:]
- if strings.ContainsRune(doubleEscapeChars, c2) {
- buf.WriteString(input[0 : len(input)-len(cur)-l-l2])
- if c2 == '\n' {
- // newline is special, skip the backslash entirely
- } else {
- buf.WriteRune(c2)
- }
- input = cur
- }
- }
- }
- return "", "", UnterminatedDoubleQuoteError
- }
- done:
- return buf.String(), input, nil
- }
|