treerack/sequence.go

440 lines
8.7 KiB
Go
Raw Normal View History

2017-07-15 21:49:08 +02:00
package treerack
2017-06-25 17:51:08 +02:00
2017-11-26 01:49:22 +01:00
import "strconv"
2017-06-25 17:51:08 +02:00
type sequenceDefinition struct {
2017-11-02 22:19:03 +01:00
name string
id int
commit CommitType
2017-11-26 01:49:22 +01:00
originalItems []SequenceItem
2017-11-02 22:19:03 +01:00
items []SequenceItem
itemDefs []definition
ranges [][]int
generalizations []int
sbuilder *sequenceBuilder
sparser *sequenceParser
allChars bool
validated bool
initialized bool
2017-06-25 17:51:08 +02:00
}
type sequenceParser struct {
2017-11-02 22:19:03 +01:00
name string
id int
commit CommitType
items []parser
ranges [][]int
generalizations []int
allChars bool
2017-06-25 17:51:08 +02:00
}
2017-07-29 16:25:17 +02:00
type sequenceBuilder struct {
2017-11-02 22:19:03 +01:00
name string
id int
commit CommitType
items []builder
ranges [][]int
allChars bool
2017-06-25 17:51:08 +02:00
}
2017-06-25 23:38:32 +02:00
func newSequence(name string, ct CommitType, items []SequenceItem) *sequenceDefinition {
2017-11-26 01:49:22 +01:00
original := make([]SequenceItem, len(items))
for i := range items {
original[i] = items[i]
}
2017-06-25 17:51:08 +02:00
return &sequenceDefinition{
2017-11-26 01:49:22 +01:00
name: name,
commit: ct,
items: items,
originalItems: original,
2017-06-25 17:51:08 +02:00
}
}
2017-10-28 22:54:15 +02:00
func (d *sequenceDefinition) nodeName() string { return d.name }
2017-11-05 03:28:36 +01:00
func (d *sequenceDefinition) setName(n string) { d.name = n }
2017-10-28 22:54:15 +02:00
func (d *sequenceDefinition) nodeID() int { return d.id }
func (d *sequenceDefinition) setID(id int) { d.id = id }
func (d *sequenceDefinition) commitType() CommitType { return d.commit }
func (d *sequenceDefinition) setCommitType(ct CommitType) { d.commit = ct }
2017-06-25 17:51:08 +02:00
2017-11-26 01:49:22 +01:00
func normalizeItemRange(item SequenceItem) SequenceItem {
if item.Min == 0 && item.Max == 0 {
item.Min, item.Max = 1, 1
return item
}
2017-11-04 22:49:42 +01:00
2017-11-26 01:49:22 +01:00
if item.Min <= 0 {
item.Min = 0
}
if item.Max <= 0 {
item.Max = -1
}
return item
}
2017-11-04 22:49:42 +01:00
2017-11-26 01:49:22 +01:00
func (d *sequenceDefinition) initRanges() {
for i, item := range d.items {
item = normalizeItemRange(item)
2017-11-04 22:49:42 +01:00
d.items[i] = item
d.ranges = append(d.ranges, []int{item.Min, item.Max})
}
}
// preinit prepares the definition before init; for sequences this only means
// computing the item ranges.
func (d *sequenceDefinition) preinit() {
	d.initRanges()
}
2017-11-01 02:43:46 +01:00
func (d *sequenceDefinition) validate(r *registry) error {
if d.validated {
return nil
}
d.validated = true
2017-08-06 20:43:52 +02:00
for i := range d.items {
2017-11-01 02:43:46 +01:00
ii, ok := r.definition(d.items[i].Name)
if !ok {
2017-08-06 20:43:52 +02:00
return parserNotFound(d.items[i].Name)
}
2017-11-01 02:43:46 +01:00
if err := ii.validate(r); err != nil {
return err
}
2017-08-06 20:43:52 +02:00
}
return nil
}
2017-11-02 22:46:07 +01:00
func (d *sequenceDefinition) createBuilder() {
2017-11-01 03:54:53 +01:00
d.sbuilder = &sequenceBuilder{
2017-11-02 22:19:03 +01:00
name: d.name,
id: d.id,
commit: d.commit,
2017-11-02 22:46:07 +01:00
ranges: d.ranges,
2017-07-29 18:40:22 +02:00
}
2017-11-01 03:54:53 +01:00
}
2017-07-29 18:40:22 +02:00
2017-11-01 03:54:53 +01:00
func (d *sequenceDefinition) initItems(r *registry) {
allChars := true
for _, item := range d.items {
def := r.definitions[item.Name]
2017-11-01 03:54:53 +01:00
d.itemDefs = append(d.itemDefs, def)
def.init(r)
2017-07-29 18:40:22 +02:00
d.sbuilder.items = append(d.sbuilder.items, def.builder())
2017-07-30 02:35:51 +02:00
if allChars {
if _, isChar := def.(*charParser); !isChar {
allChars = false
}
}
2017-07-27 01:48:16 +02:00
}
2017-07-30 02:35:51 +02:00
d.sbuilder.allChars = allChars
2017-07-30 05:10:46 +02:00
d.allChars = allChars
2017-11-01 03:54:53 +01:00
}
2017-07-29 18:40:22 +02:00
2017-11-01 03:54:53 +01:00
func (d *sequenceDefinition) init(r *registry) {
if d.initialized {
2017-11-01 02:43:46 +01:00
return
2017-07-27 01:48:16 +02:00
}
2017-11-01 03:54:53 +01:00
d.initialized = true
d.initRanges()
2017-11-02 22:46:07 +01:00
d.createBuilder()
2017-11-01 03:54:53 +01:00
d.initItems(r)
2017-07-27 01:48:16 +02:00
}
2017-11-02 22:19:03 +01:00
func (d *sequenceDefinition) addGeneralization(g int) {
if intsContain(d.generalizations, g) {
2017-11-01 02:43:46 +01:00
return
2017-07-27 01:48:16 +02:00
}
2017-11-02 22:19:03 +01:00
d.generalizations = append(d.generalizations, g)
2017-07-27 01:48:16 +02:00
}
2017-06-25 17:51:08 +02:00
2017-11-01 03:54:53 +01:00
func (d *sequenceDefinition) createParser() {
d.sparser = &sequenceParser{
2017-11-02 22:19:03 +01:00
name: d.name,
id: d.id,
commit: d.commit,
generalizations: d.generalizations,
allChars: d.allChars,
ranges: d.ranges,
2017-06-25 17:51:08 +02:00
}
2017-11-01 03:54:53 +01:00
}
2017-06-25 17:51:08 +02:00
2017-11-01 03:54:53 +01:00
func (d *sequenceDefinition) createItemParsers() {
for _, item := range d.itemDefs {
pi := item.parser()
d.sparser.items = append(d.sparser.items, pi)
2017-06-25 17:51:08 +02:00
}
}
2017-11-01 03:54:53 +01:00
func (d *sequenceDefinition) parser() parser {
if d.sparser != nil {
return d.sparser
2017-07-29 18:40:22 +02:00
}
2017-11-01 03:54:53 +01:00
d.createParser()
d.createItemParsers()
return d.sparser
2017-06-25 17:51:08 +02:00
}
2017-11-01 03:54:53 +01:00
// builder returns the builder stored by createBuilder.
func (d *sequenceDefinition) builder() builder {
	return d.sbuilder
}
2017-11-02 22:19:03 +01:00
2017-11-26 01:49:22 +01:00
// isCharSequence tells whether each of the original items occurs exactly once
// and refers to a *charParser that reports isSingleChar. It is true for a
// sequence without items.
func (d *sequenceDefinition) isCharSequence(r *registry) bool {
	for _, original := range d.originalItems {
		if n := normalizeItemRange(original); n.Min != 1 || n.Max != 1 {
			return false
		}

		// when the name is not found, the type assertion below fails on
		// the nil definition, and the result is false
		def, _ := r.definition(original.Name)
		if cp, isChar := def.(*charParser); !isChar || !cp.isSingleChar() {
			return false
		}
	}

	return true
}
// format returns the textual form of the sequence, based on the original
// items.
//
// A char sequence (see isCharSequence) is returned as its escaped characters
// between double quotes. Otherwise the items are joined with a space, where
// each item is:
//
//   - the name of the referenced definition, when its commit type has the
//     userDefined flag set, or else the formatted definition, in parentheses
//     if it is a choice with multiple options or a non-char sequence with
//     multiple items
//   - followed by the quantifier, when the item is not expected exactly once:
//     ?, *, +, {n}, {n,}, {,m} or {n,m}
//
// It expects that every item name can be found in the registry.
func (d *sequenceDefinition) format(r *registry, f formatFlags) string {
	if d.isCharSequence(r) {
		var text []rune
		for _, original := range d.originalItems {
			def, _ := r.definition(original.Name)
			cp, _ := def.(*charParser)
			text = append(text, cp.chars[0])
		}

		text = escape(charClassEscape, []rune(charClassBanned), text)

		quoted := append([]rune{'"'}, text...)
		quoted = append(quoted, '"')
		return string(quoted)
	}

	var out []rune
	for i := range d.originalItems {
		// the separator depends on the output so far, not on the index
		if len(out) > 0 {
			out = append(out, ' ')
		}

		item := normalizeItemRange(d.originalItems[i])
		def, _ := r.definition(item.Name)
		isSymbol := def.commitType()&userDefined != 0

		grouped := false
		switch t := def.(type) {
		case *choiceDefinition:
			grouped = len(t.options) > 1
		case *sequenceDefinition:
			grouped = len(t.originalItems) > 1 && !t.isCharSequence(r)
		}

		switch {
		case isSymbol:
			out = append(out, []rune(def.nodeName())...)
		case grouped:
			out = append(out, '(')
			out = append(out, []rune(def.format(r, f))...)
			out = append(out, ')')
		default:
			out = append(out, []rune(def.format(r, f))...)
		}

		switch {
		case item.Min == 1 && item.Max == 1:
			// exactly once, no quantifier
		case item.Min == 0 && item.Max == 1:
			out = append(out, '?')
		case item.Min == 0 && item.Max < 0:
			out = append(out, '*')
		case item.Min == 1 && item.Max < 0:
			out = append(out, '+')
		case item.Min == item.Max:
			out = append(out, '{')
			out = append(out, []rune(strconv.Itoa(item.Min))...)
			out = append(out, '}')
		default:
			out = append(out, '{')
			if item.Min > 0 {
				out = append(out, []rune(strconv.Itoa(item.Min))...)
			}

			out = append(out, ',')
			if item.Max >= 0 {
				out = append(out, []rune(strconv.Itoa(item.Max))...)
			}

			out = append(out, '}')
		}
	}

	return string(out)
}
2017-11-02 22:19:03 +01:00
// nodeName returns the name of the parser.
func (p *sequenceParser) nodeName() string {
	return p.name
}

// nodeID returns the id of the parser.
func (p *sequenceParser) nodeID() int {
	return p.id
}
2017-06-25 17:51:08 +02:00
2017-10-31 21:09:30 +01:00
func (p *sequenceParser) parse(c *context) {
2017-08-06 03:42:35 +02:00
if !p.allChars {
2017-11-06 11:41:00 +01:00
if c.results.pending(c.offset, p.id) {
2017-08-06 03:42:35 +02:00
c.fail(c.offset)
return
}
2017-06-25 17:51:08 +02:00
2017-11-06 11:41:00 +01:00
c.results.markPending(c.offset, p.id)
2017-08-06 03:42:35 +02:00
}
2017-06-25 17:51:08 +02:00
2017-07-17 04:23:29 +02:00
itemIndex := 0
2017-06-25 23:38:32 +02:00
var currentCount int
2017-07-17 04:23:29 +02:00
from := c.offset
to := c.offset
2017-07-30 02:35:51 +02:00
var parsed bool
2017-07-17 04:23:29 +02:00
for itemIndex < len(p.items) {
2017-10-31 21:09:30 +01:00
p.items[itemIndex].parse(c)
2017-11-02 20:49:49 +01:00
if !c.matchLast {
2017-07-17 04:23:29 +02:00
if currentCount < p.ranges[itemIndex][0] {
c.fail(from)
2017-08-06 03:42:35 +02:00
if !p.allChars {
2017-11-06 11:41:00 +01:00
c.results.unmarkPending(from, p.id)
2017-08-06 03:42:35 +02:00
}
2017-06-25 23:38:32 +02:00
return
}
2017-07-17 04:23:29 +02:00
itemIndex++
2017-06-25 23:38:32 +02:00
currentCount = 0
continue
2017-06-25 17:51:08 +02:00
}
2017-07-30 02:35:51 +02:00
parsed = c.offset > to
2017-07-17 04:23:29 +02:00
if parsed {
2017-06-25 23:38:32 +02:00
currentCount++
}
2017-07-17 04:23:29 +02:00
to = c.offset
2017-11-04 22:49:42 +01:00
if !parsed || p.ranges[itemIndex][1] > 0 && currentCount == p.ranges[itemIndex][1] {
2017-07-17 04:23:29 +02:00
itemIndex++
2017-06-25 23:38:32 +02:00
currentCount = 0
2017-06-25 17:51:08 +02:00
}
}
2017-11-02 22:19:03 +01:00
for _, g := range p.generalizations {
2017-11-06 11:41:00 +01:00
if c.results.pending(from, g) {
2017-11-02 22:19:03 +01:00
c.results.setMatch(from, g, to)
}
2017-06-25 17:51:08 +02:00
}
2017-11-02 20:49:49 +01:00
c.results.setMatch(from, p.id, to)
2017-07-17 04:23:29 +02:00
c.success(to)
2017-08-06 03:42:35 +02:00
if !p.allChars {
2017-11-06 11:41:00 +01:00
c.results.unmarkPending(from, p.id)
2017-08-06 03:42:35 +02:00
}
2017-06-25 17:51:08 +02:00
}
2017-07-29 16:25:17 +02:00
// nodeName returns the name of the builder.
func (b *sequenceBuilder) nodeName() string {
	return b.name
}

// nodeID returns the id of the builder.
func (b *sequenceBuilder) nodeID() int {
	return b.id
}
2017-07-29 18:40:22 +02:00
func (b *sequenceBuilder) build(c *context) ([]*Node, bool) {
to, ok := c.results.longestMatch(c.offset, b.id)
2017-07-29 18:40:22 +02:00
if !ok {
return nil, false
}
from := c.offset
2017-11-04 22:24:55 +01:00
parsed := to > from
2017-07-30 02:35:51 +02:00
if b.allChars {
c.offset = to
if b.commit&Alias != 0 {
return nil, true
}
return []*Node{{
Name: b.name,
From: from,
To: to,
tokens: c.tokens,
}}, true
2017-11-04 22:24:55 +01:00
} else if parsed {
c.results.dropMatchTo(c.offset, b.id, to)
} else {
2017-11-06 11:41:00 +01:00
if c.results.pending(c.offset, b.id) {
2017-11-04 22:24:55 +01:00
return nil, false
}
2017-11-06 11:41:00 +01:00
c.results.markPending(c.offset, b.id)
2017-07-29 20:04:22 +02:00
}
2017-07-29 18:40:22 +02:00
var (
itemIndex int
currentCount int
nodes []*Node
)
for itemIndex < len(b.items) {
itemFrom := c.offset
n, ok := b.items[itemIndex].build(c)
if !ok {
itemIndex++
currentCount = 0
continue
}
2017-11-04 22:24:55 +01:00
if c.offset > itemFrom {
2017-07-29 18:40:22 +02:00
nodes = append(nodes, n...)
currentCount++
2017-11-04 22:49:42 +01:00
if b.ranges[itemIndex][1] > 0 && currentCount == b.ranges[itemIndex][1] {
2017-11-04 22:24:55 +01:00
itemIndex++
currentCount = 0
}
continue
}
2017-11-04 22:24:55 +01:00
if currentCount < b.ranges[itemIndex][0] {
for i := 0; i < b.ranges[itemIndex][0]-currentCount; i++ {
nodes = append(nodes, n...)
}
2017-07-29 18:40:22 +02:00
}
2017-11-04 22:24:55 +01:00
itemIndex++
currentCount = 0
2017-07-29 18:40:22 +02:00
}
2017-11-04 22:24:55 +01:00
if !parsed {
2017-11-06 11:41:00 +01:00
c.results.unmarkPending(from, b.id)
2017-11-04 22:24:55 +01:00
}
2017-07-29 18:40:22 +02:00
if b.commit&Alias != 0 {
return nodes, true
2017-06-25 17:51:08 +02:00
}
2017-07-29 18:40:22 +02:00
return []*Node{{
Name: b.name,
From: from,
To: to,
Nodes: nodes,
tokens: c.tokens,
}}, true
2017-06-25 17:51:08 +02:00
}