argh/parser.go

270 lines
4.8 KiB
Go
Raw Normal View History

2022-05-15 18:22:56 +00:00
//go:generate stringer -type NValue
package argh
import (
"io"
"strings"
"github.com/pkg/errors"
)
2022-05-15 18:22:56 +00:00
// Value-count settings used in ParserConfig.Commands and ParserConfig.Flags.
const (
	// ZeroValue means no values are read: scanValueFlag returns an empty
	// value list without scanning any further tokens.
	ZeroValue NValue = iota
	// OneValue means exactly one identifier is read; scanValueFlag returns
	// an error when the next token is not an identifier.
	OneValue
	// OneOrMoreValue means identifiers are read until the next token is not
	// an identifier.
	OneOrMoreValue
)
var (
errSyntax = errors.New("syntax error")
2022-05-14 00:58:55 +00:00
DefaultParserConfig = &ParserConfig{
2022-05-15 18:22:56 +00:00
Commands: map[string]NValue{},
Flags: map[string]NValue{},
2022-05-14 00:58:55 +00:00
ScannerConfig: DefaultScannerConfig,
}
)
2022-05-15 18:22:56 +00:00
// NValue describes how many values a command or flag accepts. It is the
// value type of the ParserConfig.Commands and ParserConfig.Flags maps.
type NValue int
2022-05-14 00:58:55 +00:00
func ParseArgs(args []string, pCfg *ParserConfig) (*Argh, error) {
reEncoded := strings.Join(args, string(nul))
return NewParser(
strings.NewReader(reEncoded),
2022-05-14 00:58:55 +00:00
pCfg,
).Parse()
}
type Parser struct {
2022-05-15 18:22:56 +00:00
s *Scanner
2022-05-14 00:58:55 +00:00
2022-05-15 18:22:56 +00:00
buf []ScanEntry
commands map[string]NValue
valueFlags map[string]NValue
2022-05-14 00:58:55 +00:00
nodes []Node
stopSeen bool
}
2022-05-15 18:22:56 +00:00
type ScanEntry struct {
tok Token
lit string
2022-05-14 00:58:55 +00:00
pos int
}
2022-05-14 00:58:55 +00:00
type ParserConfig struct {
2022-05-15 18:22:56 +00:00
Commands map[string]NValue
Flags map[string]NValue
2022-05-14 00:58:55 +00:00
ScannerConfig *ScannerConfig
}
2022-05-14 00:58:55 +00:00
// parseDirective is returned by parseArg to steer the loop in Parse.
type parseDirective struct {
	// Break tells Parse to stop consuming input.
	Break bool
}
func NewParser(r io.Reader, pCfg *ParserConfig) *Parser {
if pCfg == nil {
pCfg = DefaultParserConfig
}
2022-05-14 00:58:55 +00:00
parser := &Parser{
2022-05-15 18:22:56 +00:00
buf: []ScanEntry{},
2022-05-14 00:58:55 +00:00
s: NewScanner(r, pCfg.ScannerConfig),
2022-05-15 18:22:56 +00:00
commands: pCfg.Commands,
valueFlags: pCfg.Flags,
2022-05-14 00:58:55 +00:00
}
tracef("NewParser parser=%+#v", parser)
tracef("NewParser pCfg=%+#v", pCfg)
return parser
}
func (p *Parser) Parse() (*Argh, error) {
p.nodes = []Node{}
for {
2022-05-14 00:58:55 +00:00
pd, err := p.parseArg()
if err != nil {
return nil, err
}
2022-05-14 00:58:55 +00:00
if pd != nil && pd.Break {
break
}
2022-05-14 00:58:55 +00:00
}
return &Argh{ParseTree: &ParseTree{Nodes: p.nodes}}, nil
}
func (p *Parser) parseArg() (*parseDirective, error) {
tok, lit, pos := p.scan()
if tok == ILLEGAL {
return nil, errors.Wrapf(errSyntax, "illegal value %q at pos=%v", lit, pos)
}
if tok == EOL {
return &parseDirective{Break: true}, nil
}
2022-05-15 18:22:56 +00:00
p.unscan(tok, lit, pos)
2022-05-14 00:58:55 +00:00
node, err := p.nodify()
tracef("parseArg node=%+#v err=%+#v", node, err)
if err != nil {
return nil, errors.Wrapf(err, "value %q at pos=%v", lit, pos)
}
if node != nil {
p.nodes = append(p.nodes, node)
}
return nil, nil
}
func (p *Parser) nodify() (Node, error) {
tok, lit, pos := p.scan()
tracef("nodify tok=%s lit=%q pos=%v", tok, lit, pos)
switch tok {
case IDENT:
if len(p.nodes) == 0 {
return Program{Name: lit}, nil
2022-05-14 00:58:55 +00:00
}
2022-05-15 18:22:56 +00:00
if n, ok := p.commands[lit]; ok {
return p.scanValueCommand(lit, pos, n)
}
return Ident{Literal: lit}, nil
2022-05-14 00:58:55 +00:00
case ARG_DELIMITER:
return ArgDelimiter{}, nil
2022-05-14 00:58:55 +00:00
case COMPOUND_SHORT_FLAG:
flagNodes := []Node{}
for _, r := range lit[1:] {
2022-05-14 00:58:55 +00:00
flagNodes = append(
flagNodes,
Flag{
Name: string(r),
},
)
}
2022-05-15 18:22:56 +00:00
return CompoundShortFlag{Nodes: flagNodes}, nil
2022-05-14 00:58:55 +00:00
case SHORT_FLAG:
flagName := string(lit[1:])
2022-05-15 18:22:56 +00:00
if n, ok := p.valueFlags[flagName]; ok {
return p.scanValueFlag(flagName, pos, n)
2022-05-14 00:58:55 +00:00
}
return Flag{Name: flagName}, nil
2022-05-14 00:58:55 +00:00
case LONG_FLAG:
flagName := string(lit[2:])
2022-05-15 18:22:56 +00:00
if n, ok := p.valueFlags[flagName]; ok {
return p.scanValueFlag(flagName, pos, n)
2022-05-14 00:58:55 +00:00
}
return Flag{Name: flagName}, nil
2022-05-14 00:58:55 +00:00
default:
}
return Ident{Literal: lit}, nil
}
2022-05-15 18:22:56 +00:00
func (p *Parser) scanValueFlag(flagName string, pos int, n NValue) (Node, error) {
tracef("scanValueFlag flagName=%q pos=%v n=%v", flagName, pos, n)
values, err := func() ([]string, error) {
if n == ZeroValue {
return []string{}, nil
}
ret := []string{}
for {
lit, err := p.scanIdent()
if err != nil {
if n == OneValue {
return nil, err
}
if n == OneOrMoreValue {
break
}
}
ret = append(ret, lit)
if n == OneValue && len(ret) == 1 {
break
}
}
return ret, nil
}()
2022-05-14 00:58:55 +00:00
if err != nil {
return nil, err
}
2022-05-15 18:22:56 +00:00
return Flag{Name: flagName, Values: values}, nil
}
func (p *Parser) scanValueCommand(lit string, pos int, n NValue) (Node, error) {
return Command{Name: lit}, nil
2022-05-14 00:58:55 +00:00
}
func (p *Parser) scanIdent() (string, error) {
tok, lit, pos := p.scan()
2022-05-15 18:22:56 +00:00
unscanBuf := []ScanEntry{}
2022-05-14 00:58:55 +00:00
if tok == ASSIGN || tok == ARG_DELIMITER {
2022-05-15 18:22:56 +00:00
unscanBuf = append([]ScanEntry{{tok: tok, lit: lit, pos: pos}}, unscanBuf...)
2022-05-14 00:58:55 +00:00
tok, lit, pos = p.scan()
}
if tok == IDENT {
return lit, nil
}
2022-05-15 18:22:56 +00:00
unscanBuf = append([]ScanEntry{{tok: tok, lit: lit, pos: pos}}, unscanBuf...)
for _, entry := range unscanBuf {
p.unscan(entry.tok, entry.lit, entry.pos)
2022-05-14 00:58:55 +00:00
}
return "", errors.Wrapf(errSyntax, "expected ident at pos=%v but got %s (%q)", pos, tok, lit)
}
func (p *Parser) scan() (Token, string, int) {
2022-05-15 18:22:56 +00:00
if len(p.buf) != 0 {
entry, buf := p.buf[len(p.buf)-1], p.buf[:len(p.buf)-1]
p.buf = buf
tracef("scan returning buffer entry=%s %+#v", entry.tok, entry)
return entry.tok, entry.lit, entry.pos
}
2022-05-14 00:58:55 +00:00
tok, lit, pos := p.s.Scan()
2022-05-15 18:22:56 +00:00
tracef("scan returning next=%s %+#v", tok, ScanEntry{tok: tok, lit: lit, pos: pos})
2022-05-14 00:58:55 +00:00
return tok, lit, pos
}
2022-05-15 18:22:56 +00:00
func (p *Parser) unscan(tok Token, lit string, pos int) {
entry := ScanEntry{tok: tok, lit: lit, pos: pos}
tracef("unscan entry=%s %+#v", tok, entry)
2022-05-14 00:58:55 +00:00
2022-05-15 18:22:56 +00:00
p.buf = append(p.buf, entry)
2022-05-14 00:58:55 +00:00
}