diff options
| author | Charlie Stanton <charlie@shtanton.xyz> | 2024-04-07 15:27:36 +0100 | 
|---|---|---|
| committer | Charlie Stanton <charlie@shtanton.xyz> | 2024-04-07 15:27:36 +0100 | 
| commit | 658900fcae610caace83a112ac0ee865108ebc92 (patch) | |
| tree | 4d7b6bebe0d192abf62970ca4324ef1ff274e3c8 /subex | |
| parent | 81925b6ad5212512d27365b8224b76095191431f (diff) | |
| download | stred-go-658900fcae610caace83a112ac0ee865108ebc92.tar | |
Change output subex internals to allow structures
Also add substitute register syntactic sugar
Diffstat (limited to 'subex')
| -rw-r--r-- | subex/main_test.go | 12 | ||||
| -rw-r--r-- | subex/parse.go | 82 | ||||
| -rw-r--r-- | subex/subexast.go | 117 | ||||
| -rw-r--r-- | subex/subexstate.go | 67 | 
4 files changed, 177 insertions, 101 deletions
| diff --git a/subex/main_test.go b/subex/main_test.go index 8e98798..fb6f152 100644 --- a/subex/main_test.go +++ b/subex/main_test.go @@ -405,6 +405,18 @@ func TestSubexMain(t *testing.T) {  				},  			},  		}, +		{ +			subex: ".{-0}`\"hello\"`", +			input: []walk.Value { +				walk.NumberValue(1), +				walk.NumberValue(2), +			}, +			expected: []walk.Value { +				walk.NumberValue(1), +				walk.NumberValue(2), +				walk.StringValue("hello"), +			}, +		},  	}  	for i, test := range tests { diff --git a/subex/parse.go b/subex/parse.go index d7fe243..619c1c3 100644 --- a/subex/parse.go +++ b/subex/parse.go @@ -1,6 +1,7 @@  package subex  import ( +	"fmt"  	"main/walk"  	"strconv"  	"strings" @@ -115,6 +116,7 @@ func parseScalarLiteral(l RuneReader) (walk.Scalar, bool) {  				panic("Invalid literal")  			}  		default: +			fmt.Printf("%c\n", r)  			panic("Invalid literal")  	}  } @@ -181,7 +183,8 @@ func parseRepeatRange(l RuneReader) (output []ConvexRange) {  	return output  } -func parseValueReplacement(l RuneReader) (output []OutputValueAST) { +func parseValueReplacement(l RuneReader) (output SubexAST) { +	output = SubexASTEmpty{}  	// TODO escaping  	// TODO add arrays, maps and strings  	loop: for { @@ -197,37 +200,67 @@ func parseValueReplacement(l RuneReader) (output []OutputValueAST) {  			if slot == eof {  				panic("Missing slot character")  			} -			output = append(output, OutputValueLoadAST {slot: slot}) +			output = SubexASTConcat { +				First: output, +				Second: SubexASTOutputValueLoad { +					slot: slot, +				}, +			} +		// TODO: destructures +		case '"': +			output = SubexASTConcat { +				First: output, +				Second: SubexASTDestructure { +					Destructure: NoneStructure, +					Structure: StringStructure, +					Content: parseRuneReplacement(l, '"'), +				}, +			}  		default:  			l.Rewind()  			scalar, ok := parseScalarLiteral(l)  			if !ok {  				panic("Invalid scalar literal")  			} -			output = append(output, OutputValueLiteralAST {scalar}) +			output = SubexASTConcat { +				First: output, +				Second: SubexASTOutputValueLiteral { +					literal: scalar, +				}, +			}  		}  	}  	return output  } -func parseRuneReplacement(l RuneReader) (output []OutputRuneAST) { +func parseRuneReplacement(l RuneReader, end rune) (output SubexAST) { +	output = SubexASTEmpty{}  	// TODO escaping -	// TODO add arrays, maps and strings  	loop: for {  		r := l.Next()  		switch r {  		case eof:  			panic("Missing closing `") -		case '`': +		case end:  			break loop  		case '$':  			slot := l.Next()  			if slot == eof {  				panic("Missing slot character")  			} -			output = append(output, OutputRuneLoadAST {slot: slot}) +			output = SubexASTConcat { +				First: output, +				Second: SubexASTOutputRuneLoad { +					slot: slot, +				}, +			}  		default: -			output = append(output, OutputRuneLiteralAST {r}) +			output = SubexASTConcat { +				First: output, +				Second: SubexASTOutputRuneLiteral { +					literal: r, +				}, +			}  		}  	}  	return output @@ -394,6 +427,7 @@ func parseDestructure(l RuneReader, destructure Structure, inType Type) (lhs Sub  }  func parseSubex(l RuneReader, minPower int, inType Type) (lhs SubexAST, outType Type) { +	start:  	r := l.Next()  	switch r {  		case eof: @@ -467,16 +501,14 @@ func parseSubex(l RuneReader, minPower int, inType Type) (lhs SubexAST, outType  			lhs = SubexASTCopyNumber{}  		case '`':  			outType = inType -			lhs = SubexASTOutputValues {parseValueReplacement(l)} -		// TODO -		// case '_': -		// 	lhs = SubexASTCopyStringAtom{} -		// case '#': -		// 	lhs = SubexASTCopyString{} -		// case ',': -		// 	lhs = SubexASTCopyValue{} -		// case '"': -		// 	lhs = SubexASTCopyScalar {walk.NewAtomStringTerminal()} +			lhs = parseValueReplacement(l) +		case ' ': +			if inType == RuneType { +				outType = RuneType +				lhs = SubexASTCopyRune {' '} +			} else { +				goto start +			}  		default:  			outType = inType  			if inType == RuneType { @@ -533,10 +565,16 @@ func parseSubex(l RuneReader, minPower int, inType Type) (lhs SubexAST, outType  						InnerOutType: outType,  					}  				} else { -					resolveTypes(inType, ValueType) -					lhs = SubexASTStoreValues { -						Match: lhs, -						Slot: slot, +					if inType == ValueType { +						lhs = SubexASTStoreValues { +							Match: lhs, +							Slot: slot, +						} +					} else { +						lhs = SubexASTStoreRunes { +							Match: lhs, +							Slot: slot, +						}  					}  				}  				outType = AnyType diff --git a/subex/subexast.go b/subex/subexast.go index 2685925..d08ddac 100644 --- a/subex/subexast.go +++ b/subex/subexast.go @@ -46,6 +46,25 @@ func (ast SubexASTStoreValues) String() string {  	return fmt.Sprintf("$%c(%v)", ast.Slot, ast.Match)  } +type SubexASTStoreRunes struct { +	Match SubexAST +	Slot rune +} +func (ast SubexASTStoreRunes) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState { +	id := slotMap.getRuneId(ast.Slot) +	newNext := ast.Match.compileWith(&SubexStoreRunesEndState { +		slot: id, +		next: next, +	}, slotMap, inType, RuneType) + +	return &SubexCaptureRunesBeginState { +		next: newNext, +	} +} +func (ast SubexASTStoreRunes) String() string { +	return fmt.Sprintf("(%v)$%c", ast.Match, ast.Slot) +} +  // Try to run the first subex, if it fails then backtrack and use the second  type SubexASTOr struct {  	First, Second SubexAST @@ -148,7 +167,7 @@ type SubexASTCopyScalar struct {  }  func (ast SubexASTCopyScalar) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != ValueType || outType != ValueType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTCopyScalar")  	}  	return &SubexCopyState{  		filter: selectScalarFilter {ast.Scalar}, @@ -162,7 +181,7 @@ func (ast SubexASTCopyScalar) String() string {  type SubexASTCopyAnyRune struct {}  func (ast SubexASTCopyAnyRune) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != RuneType || outType != RuneType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTCopyAnyRune")  	}  	return &SubexCopyRuneState {  		next: next, @@ -170,7 +189,7 @@ func (ast SubexASTCopyAnyRune) compileWith(next SubexState, slotMap *SlotMap, in  	}  }  func (ast SubexASTCopyAnyRune) String() string { -	return "." +	return ".RUNE"  }  type SubexASTCopyRune struct { @@ -178,19 +197,22 @@ type SubexASTCopyRune struct {  }  func (ast SubexASTCopyRune) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != RuneType || outType != RuneType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTCopyRune")  	}  	return &SubexCopyRuneState {  		next: next,  		filter: selectRuneFilter {ast.rune},  	}  } +func (ast SubexASTCopyRune) String() string { +	return string(ast.rune) +}  // Read in a single atom that must be a boolean and output it unchanged  type SubexASTCopyBool struct {}  func (ast SubexASTCopyBool) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != ValueType || outType != ValueType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTCopyBool")  	}  	return &SubexCopyState {  		next: next, @@ -205,7 +227,7 @@ func (ast SubexASTCopyBool) String() string {  type SubexASTCopyNumber struct {}  func (ast SubexASTCopyNumber) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != ValueType || outType != ValueType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTCopyNumber")  	}  	return &SubexCopyState {  		next: next, @@ -220,7 +242,6 @@ func (ast SubexASTCopyNumber) String() string {  type SubexASTCopyAnyValue struct {}  func (ast SubexASTCopyAnyValue) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != ValueType || outType != ValueType { -		fmt.Printf("%v, %v", inType, outType)  		panic("Invalid types for SubexASTCopyAnyValue")  	}  	return &SubexCopyState { @@ -277,64 +298,56 @@ func (ast SubexASTOutput) String() string {  }  */ -type OutputValueAST interface { -	compile(slotMap *SlotMap) OutputValue +type SubexASTOutputValueLiteral struct { +	literal walk.Scalar  } - -type OutputValueLoadAST struct { -	slot rune -} -func (ast OutputValueLoadAST) compile(slotMap *SlotMap) OutputValue { -	return OutputValueLoad { -		slotMap.getId(ast.slot), +func (ast SubexASTOutputValueLiteral) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState { +	if outType != ValueType { +		panic("Invalid outType for SubexASTOutputValueLiteral")  	} -} - -type OutputValueLiteralAST struct { -	scalar walk.Scalar -} -func (ast OutputValueLiteralAST) compile(slotMap *SlotMap) OutputValue { -	return OutputValueLiteral { -		ast.scalar, +	return &SubexOutputValueLiteralState { +		literal: ast.literal, +		next: next,  	}  } -type SubexASTOutputValues struct { -	Replacement []OutputValueAST +type SubexASTOutputValueLoad struct { +	slot rune  } -func (ast SubexASTOutputValues) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState { +func (ast SubexASTOutputValueLoad) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if outType != ValueType { -		panic("Invalid outType") -	} -	var content []OutputValue -	for _, el := range ast.Replacement { -		content = append(content, el.compile(slotMap)) +		panic("Invalid outType for SubexASTOutputValueLoad")  	} -	return &SubexOutputValuesState { -		content: content, +	return &SubexOutputValueLoadState { +		slot: slotMap.getId(ast.slot),  		next: next,  	}  } -type OutputRuneAST interface { -	compile(slotMap *SlotMap) OutputRune -} - -type OutputRuneLoadAST struct { -	slot rune +type SubexASTOutputRuneLiteral struct { +	literal rune  } -func (ast OutputRuneLoadAST) compile(slotMap *SlotMap) OutputRune { -	return OutputRuneLoad {slotMap.getRuneId(ast.slot)} +func (ast SubexASTOutputRuneLiteral) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState { +	if outType != RuneType { +		panic("Invalid outType for SubexASTOutputRuneLiteral") +	} +	return &SubexOutputRuneLiteralState { +		literal: ast.literal, +		next: next, +	}  } -type OutputRuneLiteralAST struct { -	r rune -} -func (ast OutputRuneLiteralAST) compile (slotMap *SlotMap) OutputRune { -	return OutputRuneLiteral {ast.r} +type SubexASTOutputRuneLoad struct { +	slot rune  } - -type SubexASTOutputRunes struct { +func (ast SubexASTOutputRuneLoad) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState { +	if outType != RuneType { +		panic("Invalid outType for SubexASTOutputRuneLoad") +	} +	return &SubexOutputRuneLoadState { +		slot: slotMap.getRuneId(ast.slot), +		next: next, +	}  }  // Run each input Atom through a map to produce an output Atom @@ -359,7 +372,7 @@ type SubexASTSum struct {  }  func (ast SubexASTSum) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != ValueType || outType != ValueType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTSum")  	}  	return &SubexCaptureBeginState {  		next: ast.Content.compileWith(&SubexArithmeticEndState { @@ -378,7 +391,7 @@ type SubexASTProduct struct {  }  func (ast SubexASTProduct) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != ValueType || outType != ValueType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTProduct")  	}  	return &SubexCaptureBeginState {  		next: ast.Content.compileWith(&SubexArithmeticEndState { @@ -398,7 +411,7 @@ type SubexASTNegate struct {  }  func (ast SubexASTNegate) compileWith(next SubexState, slotMap *SlotMap, inType Type, outType Type) SubexState {  	if inType != ValueType || outType != ValueType { -		panic("Invalid types for SubexASTNot") +		panic("Invalid types for SubexASTNegate")  	}  	return &SubexCaptureBeginState {  		next: ast.Content.compileWith(&SubexArithmeticEndState { diff --git a/subex/subexstate.go b/subex/subexstate.go index 4f5dc19..1e1e94e 100644 --- a/subex/subexstate.go +++ b/subex/subexstate.go @@ -133,6 +133,19 @@ func (state SubexStoreEndState) epsilon(aux auxiliaryState) []SubexBranch {  	}}  } +type SubexStoreRunesEndState struct { +	slot int +	next SubexState +} +func (state SubexStoreRunesEndState) epsilon(aux auxiliaryState) []SubexBranch { +	toStore, aux := aux.popOutputRunes() +	aux.store = aux.store.withRunes(state.slot, toStore) +	return []SubexBranch {{ +		state: state.next, +		aux: aux, +	}} +} +  /*  // A part of an output literal, either an Atom or a slot from which to load  type OutputContent interface { @@ -211,48 +224,48 @@ func (state SubexOutputState) accepting(aux auxiliaryState) []OutputStack {  }  */ -type OutputValue interface { -	build(store Store) []walk.Value -} - -type OutputValueLoad struct { -	slot int +type SubexOutputValueLiteralState struct { +	literal walk.Scalar +	next SubexState  } -func (ov OutputValueLoad) build(store Store) []walk.Value { -	return store.values[ov.slot] +func (state SubexOutputValueLiteralState) epsilon(aux auxiliaryState) []SubexBranch { +	return []SubexBranch {{ +		state: state.next, +		aux: aux.topAppend([]walk.Value {state.literal}), +	}}  } -type OutputValueLiteral struct { -	scalar walk.Scalar +type SubexOutputValueLoadState struct { +	slot int +	next SubexState  } -func (ov OutputValueLiteral) build(store Store) []walk.Value { -	return []walk.Value{ov.scalar} +func (state SubexOutputValueLoadState) epsilon(aux auxiliaryState) []SubexBranch { +	return []SubexBranch {{ +		state: state.next, +		aux: aux.topAppend(aux.store.values[state.slot]), +	}}  } -type SubexOutputValuesState struct { -	content []OutputValue +type SubexOutputRuneLiteralState struct { +	literal rune  	next SubexState  } -func (state SubexOutputValuesState) epsilon(aux auxiliaryState) []SubexBranch { -	var content []walk.Value -	for _, el := range state.content { -		content = append(content, el.build(aux.store)...) -	} +func (state SubexOutputRuneLiteralState) epsilon(aux auxiliaryState) []SubexBranch {  	return []SubexBranch {{  		state: state.next, -		aux: aux.topAppend(content), +		aux: aux.topAppendRune([]rune {state.literal}),  	}}  } -type OutputRune interface { -} - -type OutputRuneLoad struct { +type SubexOutputRuneLoadState struct {  	slot int +	next SubexState  } - -type OutputRuneLiteral struct { -	r rune +func (state SubexOutputRuneLoadState) epsilon(aux auxiliaryState) []SubexBranch { +	return []SubexBranch {{ +		state: state.next, +		aux: aux.topAppendRune(aux.store.runes[state.slot]), +	}}  }  // A final state, transitions to nothing but is accepting | 
