waveterm/wavesrv/pkg/shparse/extend.go

414 lines
9.9 KiB
Go
Raw Normal View History

2023-10-17 06:31:13 +02:00
// Copyright 2023, Command Line Inc.
// SPDX-License-Identifier: Apache-2.0
2022-11-17 07:17:38 +01:00
package shparse
import (
"bytes"
"unicode"
"unicode/utf8"
zsh support (#227) adds zsh support to waveterm. big change, lots going on here. lots of other improvements and bug fixes added while debugging and building out the feature. Commits: * refactor shexec parser.go into new package shellenv. separate out bash specific parsing from generic functions * checkpoint * work on refactoring shexec. created two new packages shellapi (for bash/zsh specific stuff), and shellutil (shared between shellapi and shexec) * more refactoring * create shellapi interface to abstract bash specific functionality * more refactoring, move bash shell state parsing to shellapi * move makeRcFile to shellapi. remove all of the 'client' options CLI options from waveshell * get shellType passed through to server/single paths for waveshell * add a local shelltype detector * mock out a zshapi * move shelltype through more of the code * get a command to run via zsh * zsh can now switch directories. poc, needs cleanup * working on ShellState encoding differences between zsh/bash. Working on parsing zsh decls. move utilfn package into waveshell (shouldn't have been in wavesrv) * switch to use []byte for vardecl serialization + diffs * progress on zsh environment. still have issues reconciling init environment with trap environment * fix typeset argument parsing * parse promptvars, more zsh specific ignores * fix bug with promptvar not getting set (wrong check in FeState func) * add sdk (issue #188) to list of rtnstate commands * more zsh compatibility -- working with a larger ohmyzsh environment. ignore more variables, handle exit trap better. unique path/fpath. add a processtype variable to base. * must return a value * zsh alias parsing/restoring. diff changes (and rtnstate changes). introduces linediff v1. * force zmodload of zsh/parameter * starting work on zsh functions * need a v1 of mapdiff as well (to handle null chars) * pack/unpack of ints was wrong (one used int and one use uint). turned out we only ever encoded '0' so it worked. 
that also means it is safe to change unpack to unpackUInt * reworking for binary encoding of aliases and functions (because zsh allows any character, including nulls, in names and values) * fixes, working on functions, issue with line endings * zsh functions. lots of ugliness here around dealing with line discipline and cooked stty. new runcommand function to grab output from a non-tty fd. note that we still need to run the actual command in a stty to get the proper output. * write uuid tempdir, cleanup with tmprcfilename code * hack in some simple zsh function declaration finding code for rtnstate. create function diff for rtnstate that supports zsh * make sure key order is constant so shell hashes are consistent * fix problems with state diffs to support new zsh formats. add diff/apply code to shellapi (moved from shellenv), that is now specific to zsh or bash * add log packet and new shellstate packets * switch to shellstate map that's also keyed by shelltype * add shelltype to remoteinstance * remove shell argument from waveshell * added new shelltype statemap to remote.go (msh), deal with fallout * move shellstate out of init packet, and move to an explicit reinit call. try to initialize all of the active shell states * change dont always store init state (only store on demand). initialize shell states on demand (if not already initialized). allow reset to change shells * add shellpref field to remote table. use to drive the default shell choice for new tabs * show shelltag on cmdinput, pass through ri and remote (defaultshellstate) * bump mshell version to v0.4 * better version validation for shellstate. 
also relax compatibility requirements for diffing states (shelltype + major version need to match) * better error handling, check shellstate compatibility during run (on waveshell server) * add extra separator for bash shellstate processing to deal with spurious output from rc files * special migration for v30 -- flag invalid bash shell states and show special button in UI to fix * format * remove zsh-decls (unused) * remove test code * remove debug print * fix typo
2024-01-17 01:11:04 +01:00
"github.com/wavetermdev/waveterm/waveshell/pkg/utilfn"
2022-11-17 07:17:38 +01:00
)
// Lookup tables indexed by byte value; both are filled in by init.
//
// noEscChars[b] is true when extendLit may write the ASCII byte b without a
// preceding backslash. specialEsc[b] holds the two-character backslash escape
// for b when one is defined, and "" otherwise.
var (
	noEscChars []bool
	specialEsc []string
)

// init populates the noEscChars and specialEsc tables.
func init() {
	noEscChars = make([]bool, 256)
	markRange := func(lo, hi byte) {
		for b := int(lo); b <= int(hi); b++ {
			noEscChars[b] = true
		}
	}
	markRange('0', '9')
	markRange('a', 'z')
	markRange('A', 'Z')
	for _, b := range []byte("-./:=_") {
		noEscChars[b] = true
	}

	specialEsc = make([]string, 256)
	escapes := []struct {
		code byte
		esc  string
	}{
		{0x07, "\\a"},
		{0x08, "\\b"},
		{0x09, "\\t"},
		{0x0a, "\\n"},
		{0x0b, "\\v"},
		{0x0c, "\\f"},
		{0x0d, "\\r"},
		{0x1b, "\\E"},
	}
	for _, e := range escapes {
		specialEsc[e.code] = e.esc
	}
}
// getUtf8Literal encodes ch as UTF-8 and returns one "\x" escape followed by
// two digits taken from utilfn.HexDigits for every encoded byte.
func getUtf8Literal(ch rune) string {
	var encoded [utf8.UTFMax]byte
	n := utf8.EncodeRune(encoded[:], ch)

	var out bytes.Buffer
	for _, b := range encoded[:n] {
		out.WriteString("\\x")
		out.WriteByte(utilfn.HexDigits[b>>4])   // high nibble
		out.WriteByte(utilfn.HexDigits[b&0x0f]) // low nibble
	}
	return out.String()
}
func (w *WordType) writeString(s string) {
2022-11-17 07:17:38 +01:00
for _, ch := range s {
w.writeRune(ch)
}
}
func (w *WordType) writeRune(ch rune) {
2022-11-17 08:52:10 +01:00
wmeta := wordMetaMap[w.Type]
if w.Complete && wmeta.SuffixLen == 1 {
w.Raw = append(w.Raw[0:len(w.Raw)-1], ch, w.Raw[len(w.Raw)-1])
2022-11-17 07:17:38 +01:00
return
}
2022-11-17 08:52:10 +01:00
if w.Complete && wmeta.SuffixLen == 2 {
w.Raw = append(w.Raw[0:len(w.Raw)-2], ch, w.Raw[len(w.Raw)-2], w.Raw[len(w.Raw)-1])
2022-11-17 07:17:38 +01:00
return
}
2022-11-17 08:52:10 +01:00
// not complete or SuffixLen == 0 (2+ is not supported)
w.Raw = append(w.Raw, ch)
return
2022-11-17 07:17:38 +01:00
}
// extendContext bundles the state shared by the extendContext methods in this
// file (appendWord, ensureCurWord, extend). It is created by makeExtendContext.
type extendContext struct {
// Input and InputPos are not read or written by any code visible in this part
// of the file. NOTE(review): presumably the words being processed and an index
// into them -- confirm against callers.
Input []*WordType
InputPos int
// QC is the quote context handed to MakeEmptyWord when ensureCurWord has to
// create a new word.
QC QuoteContext
// Rtn collects the words produced so far; appendWord and ensureCurWord append to it.
Rtn []*WordType
// CurWord is the word most recently added to Rtn, or nil if none has been added.
CurWord *WordType
2022-11-17 07:17:38 +01:00
// Intention is the word type ensureCurWord requires CurWord to have; it is
// also the type of any word ensureCurWord creates.
Intention string
}
func makeExtendContext(qc QuoteContext, word *WordType) *extendContext {
rtn := &extendContext{QC: qc}
if word == nil {
rtn.Intention = WordTypeLit
return rtn
} else {
rtn.Intention = word.Type
rtn.Rtn = []*WordType{word}
rtn.CurWord = word
return rtn
2022-11-17 07:17:38 +01:00
}
}
func (ec *extendContext) appendWord(w *WordType) {
2022-11-17 07:17:38 +01:00
ec.Rtn = append(ec.Rtn, w)
ec.CurWord = w
}
2022-11-17 08:52:10 +01:00
func (ec *extendContext) ensureCurWord() {
if ec.CurWord == nil || ec.CurWord.Type != ec.Intention {
2022-11-22 04:06:59 +01:00
ec.CurWord = MakeEmptyWord(ec.Intention, ec.QC, 0, true)
2022-11-17 08:52:10 +01:00
ec.Rtn = append(ec.Rtn, ec.CurWord)
}
}
2022-11-22 04:06:59 +01:00
// grp, dq, ddq
func extendWithSubs(word *WordType, wordPos int, extStr string, complete bool) utilfn.StrWithPos {
wmeta := wordMetaMap[word.Type]
if word.Type == WordTypeGroup {
atEnd := (wordPos == len(word.Raw))
subWord := findCompletionWordAtPos(word.Subs, wordPos, true)
if subWord == nil {
strPos := Extend(MakeEmptyWord(WordTypeLit, word.QC, 0, true), 0, extStr, atEnd)
strPos = strPos.Prepend(string(word.Raw[0:wordPos]))
strPos = strPos.Append(string(word.Raw[wordPos:]))
return strPos
} else {
subComplete := complete && atEnd
strPos := Extend(subWord, wordPos-subWord.Offset, extStr, subComplete)
strPos = strPos.Prepend(string(word.Raw[0:subWord.Offset]))
strPos = strPos.Append(string(word.Raw[subWord.Offset+len(subWord.Raw):]))
return strPos
}
} else if word.Type == WordTypeDQ || word.Type == WordTypeDDQ {
if wordPos < word.contentStartPos() {
wordPos = word.contentStartPos()
}
atEnd := (wordPos >= len(word.Raw)-wmeta.SuffixLen)
subWord := findCompletionWordAtPos(word.Subs, wordPos-wmeta.PrefixLen, true)
quoteBalance := !atEnd
if subWord == nil {
realOffset := wordPos
strPos, wordOpen := extendInternal(MakeEmptyWord(WordTypeLit, word.QC.push(WordTypeDQ), 0, true), 0, extStr, false, quoteBalance)
strPos = strPos.Prepend(string(word.Raw[0:realOffset]))
var requiredSuffix string
if wordOpen {
requiredSuffix = wmeta.getSuffix()
}
if atEnd {
if complete {
return utilfn.StrWithPos{Str: strPos.Str + requiredSuffix + " ", Pos: strPos.Pos + len(requiredSuffix) + 1}
} else {
if word.Complete && requiredSuffix != "" {
return strPos.Append(requiredSuffix)
}
return strPos
}
}
strPos = strPos.Append(string(word.Raw[wordPos:]))
return strPos
} else {
realOffset := subWord.Offset + wmeta.PrefixLen
strPos, wordOpen := extendInternal(subWord, wordPos-realOffset, extStr, false, quoteBalance)
strPos = strPos.Prepend(string(word.Raw[0:realOffset]))
var requiredSuffix string
if wordOpen {
requiredSuffix = wmeta.getSuffix()
}
if atEnd {
if complete {
return utilfn.StrWithPos{Str: strPos.Str + requiredSuffix + " ", Pos: strPos.Pos + len(requiredSuffix) + 1}
} else {
if word.Complete && requiredSuffix != "" {
return strPos.Append(requiredSuffix)
}
return strPos
}
}
strPos = strPos.Append(string(word.Raw[realOffset+len(subWord.Raw):]))
return strPos
}
} else {
return utilfn.StrWithPos{Str: string(word.Raw), Pos: wordPos}
}
2022-11-22 04:06:59 +01:00
}
// lit, svar, varb, sq, dsq
func extendLeafCh(buf *bytes.Buffer, wordOpen *bool, wtype string, qc QuoteContext, ch rune) {
switch wtype {
2022-11-17 08:52:10 +01:00
case WordTypeSimpleVar, WordTypeVarBrace:
2022-11-22 04:06:59 +01:00
extendVar(buf, ch)
2022-11-17 07:17:38 +01:00
2022-11-22 04:06:59 +01:00
case WordTypeLit:
if qc.cur() == WordTypeDQ {
extendDQLit(buf, wordOpen, ch)
} else {
extendLit(buf, ch)
}
2022-11-17 07:17:38 +01:00
case WordTypeSQ:
2022-11-22 04:06:59 +01:00
extendSQ(buf, wordOpen, ch)
2022-11-17 07:17:38 +01:00
case WordTypeDSQ:
2022-11-22 04:06:59 +01:00
extendDSQ(buf, wordOpen, ch)
2022-11-17 07:17:38 +01:00
default:
2022-11-17 08:52:10 +01:00
return
2022-11-17 07:17:38 +01:00
}
}
// getWordOpenStr returns the text that (re)opens a word of type wtype.
// For a literal this is a double quote when the current quote context is dq
// and the empty string otherwise; for all other types it is the prefix
// recorded in wordMetaMap.
func getWordOpenStr(wtype string, qc QuoteContext) string {
	if wtype != WordTypeLit {
		wmeta := wordMetaMap[wtype]
		return wmeta.getPrefix()
	}
	if qc.cur() == WordTypeDQ {
		return "\""
	}
	return ""
}
2022-11-22 04:06:59 +01:00
// lit, svar, varb sq, dsq
func extendLeaf(buf *bytes.Buffer, wordOpen *bool, word *WordType, wordPos int, extStr string) {
for _, ch := range extStr {
extendLeafCh(buf, wordOpen, word.Type, word.QC, ch)
2022-11-17 07:17:38 +01:00
}
2022-11-22 04:06:59 +01:00
}
// lit, grp, svar, dq, ddq, varb, sq, dsq
// returns (strwithpos, dq-closed)
func extendInternal(word *WordType, wordPos int, extStr string, complete bool, requiresQuoteBalance bool) (utilfn.StrWithPos, bool) {
2022-11-22 04:06:59 +01:00
if extStr == "" {
return utilfn.StrWithPos{Str: string(word.Raw), Pos: wordPos}, true
}
if word.canHaveSubs() {
return extendWithSubs(word, wordPos, extStr, complete), true
2022-11-22 04:06:59 +01:00
}
var buf bytes.Buffer
isEOW := wordPos >= word.contentEndPos()
if isEOW {
wordPos = word.contentEndPos()
}
if wordPos < word.contentStartPos() {
2022-11-22 04:06:59 +01:00
wordPos = word.contentStartPos()
}
if wordPos > 0 {
buf.WriteString(string(word.Raw[0:word.contentStartPos()])) // write the prefix
2022-11-22 04:06:59 +01:00
}
if wordPos > word.contentStartPos() {
buf.WriteString(string(word.Raw[word.contentStartPos():wordPos]))
2022-11-22 04:06:59 +01:00
}
wordOpen := true
extendLeaf(&buf, &wordOpen, word, wordPos, extStr)
2022-11-22 04:06:59 +01:00
if isEOW {
// end-of-word, write the suffix (and optional ' '). return the end of the string
wmeta := wordMetaMap[word.Type]
rtnPos := utf8.RuneCount(buf.Bytes())
2022-11-22 04:06:59 +01:00
buf.WriteString(wmeta.getSuffix())
if !wordOpen && requiresQuoteBalance {
buf.WriteString(getWordOpenStr(word.Type, word.QC))
wordOpen = true
}
2022-11-22 04:06:59 +01:00
if complete {
buf.WriteRune(' ')
return utilfn.StrWithPos{Str: buf.String(), Pos: utf8.RuneCount(buf.Bytes())}, wordOpen
2022-11-22 04:06:59 +01:00
} else {
return utilfn.StrWithPos{Str: buf.String(), Pos: rtnPos}, wordOpen
2022-11-22 04:06:59 +01:00
}
}
// completion in the middle of a word (no ' ')
rtnPos := utf8.RuneCount(buf.Bytes())
if !wordOpen {
// always required since there is a suffix
buf.WriteString(getWordOpenStr(word.Type, word.QC))
wordOpen = true
}
2022-11-22 04:06:59 +01:00
buf.WriteString(string(word.Raw[wordPos:])) // write the suffix
return utilfn.StrWithPos{Str: buf.String(), Pos: rtnPos}, wordOpen
}
// lit, grp, svar, dq, ddq, varb, sq, dsq
func Extend(word *WordType, wordPos int, extStr string, complete bool) utilfn.StrWithPos {
rtn, _ := extendInternal(word, wordPos, extStr, complete, false)
return rtn
2022-11-22 04:06:59 +01:00
}
func (ec *extendContext) extend(ch rune) {
if ch == 0 {
return
}
return
2022-11-17 07:17:38 +01:00
}
2022-11-17 08:52:10 +01:00
// isVarNameChar reports whether ch is an underscore, an ASCII letter, or an
// ASCII digit.
func isVarNameChar(ch rune) bool {
	switch {
	case ch == '_':
		return true
	case 'a' <= ch && ch <= 'z', 'A' <= ch && ch <= 'Z', '0' <= ch && ch <= '9':
		return true
	default:
		return false
	}
}
2022-11-22 04:06:59 +01:00
func extendVar(buf *bytes.Buffer, ch rune) {
2022-11-17 08:52:10 +01:00
if ch == 0 {
return
}
if !isVarNameChar(ch) {
return
}
2022-11-22 04:06:59 +01:00
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
}
2022-11-22 04:06:59 +01:00
// getSpecialEscape returns the specialEsc table entry for ch, or "" when ch is
// above the ASCII range.
func getSpecialEscape(ch rune) string {
	if ch <= unicode.MaxASCII {
		return specialEsc[byte(ch)]
	}
	return ""
}
func writeSpecial(buf *bytes.Buffer, ch rune, wrap bool) {
if wrap {
buf.WriteRune('$')
buf.WriteRune('\'')
}
2022-11-22 04:06:59 +01:00
sesc := getSpecialEscape(ch)
if sesc != "" {
buf.WriteString(sesc)
} else {
utf8Lit := getUtf8Literal(ch)
buf.WriteString(utf8Lit)
}
if wrap {
buf.WriteRune('\'')
}
2022-11-22 04:06:59 +01:00
}
func extendLit(buf *bytes.Buffer, ch rune) {
2022-11-17 08:52:10 +01:00
if ch == 0 {
return
}
if ch > unicode.MaxASCII || !unicode.IsPrint(ch) {
writeSpecial(buf, ch, true)
2022-11-17 08:52:10 +01:00
return
}
var bch = byte(ch)
if noEscChars[bch] {
2022-11-22 04:06:59 +01:00
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
return
}
2022-11-22 04:06:59 +01:00
buf.WriteRune('\\')
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
return
}
2022-11-22 04:06:59 +01:00
func extendDSQ(buf *bytes.Buffer, wordOpen *bool, ch rune) {
2022-11-17 08:52:10 +01:00
if ch == 0 {
return
}
if !*wordOpen {
2022-11-22 04:06:59 +01:00
buf.WriteRune('$')
buf.WriteRune('\'')
*wordOpen = true
}
if ch > unicode.MaxASCII || !unicode.IsPrint(ch) {
writeSpecial(buf, ch, false)
return
}
2022-11-22 04:06:59 +01:00
if ch == '\'' {
buf.WriteRune('\\')
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
return
}
2022-11-22 04:06:59 +01:00
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
return
}
2022-11-22 04:06:59 +01:00
func extendSQ(buf *bytes.Buffer, wordOpen *bool, ch rune) {
2022-11-17 07:17:38 +01:00
if ch == 0 {
return
}
if ch == '\'' {
2022-11-22 04:06:59 +01:00
if *wordOpen {
buf.WriteRune('\'')
*wordOpen = false
}
buf.WriteRune('\\')
buf.WriteRune('\'')
2022-11-17 08:52:10 +01:00
return
2022-11-17 07:17:38 +01:00
}
if ch > unicode.MaxASCII || !unicode.IsPrint(ch) {
2022-11-22 04:06:59 +01:00
if *wordOpen {
buf.WriteRune('\'')
*wordOpen = false
2022-11-17 07:17:38 +01:00
}
writeSpecial(buf, ch, true)
2022-11-17 08:52:10 +01:00
return
}
2022-11-22 04:06:59 +01:00
if !*wordOpen {
buf.WriteRune('\'')
*wordOpen = true
}
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
return
}
2022-11-22 04:06:59 +01:00
func extendDQLit(buf *bytes.Buffer, wordOpen *bool, ch rune) {
2022-11-17 08:52:10 +01:00
if ch == 0 {
return
}
if ch > unicode.MaxASCII || !unicode.IsPrint(ch) {
2022-11-22 04:06:59 +01:00
if *wordOpen {
buf.WriteRune('"')
*wordOpen = false
2022-11-17 08:52:10 +01:00
}
writeSpecial(buf, ch, true)
2022-11-22 04:06:59 +01:00
return
}
if !*wordOpen {
buf.WriteRune('"')
*wordOpen = true
}
if ch == '"' || ch == '\\' || ch == '$' || ch == '`' {
buf.WriteRune('\\')
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
return
2022-11-17 07:17:38 +01:00
}
2022-11-22 04:06:59 +01:00
buf.WriteRune(ch)
2022-11-17 08:52:10 +01:00
return
2022-11-17 07:17:38 +01:00
}