Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Blame
Revision Log

source: code/trunk/vendor/github.com/dlclark/regexp2/match.go@ 67

Last change on this file since 67 was 67, checked in by Izuru Yakumo, 23 months ago

Use vendored modules

Signed-off-by: Izuru Yakumo <yakumo.izuru@…>

File size: 8.6 KB

Line
1	package regexp2
2
3	import (
4	"bytes"
5	"fmt"
6	)
7
8	// Match is a single regex result match that contains groups and repeated captures
9	// -Groups
10	// -Capture
11	type Match struct {
12	Group //embeded group 0
13
14	regex *Regexp
15	otherGroups []Group
16
17	// input to the match
18	textpos int
19	textstart int
20
21	capcount int
22	caps []int
23	sparseCaps map[int]int
24
25	// output from the match
26	matches [][]int
27	matchcount []int
28
29	// whether we've done any balancing with this match. If we
30	// have done balancing, we'll need to do extra work in Tidy().
31	balancing bool
32	}
33
34	// Group is an explicit or implit (group 0) matched group within the pattern
35	type Group struct {
36	Capture // the last capture of this group is embeded for ease of use
37
38	Name string // group name
39	Captures []Capture // captures of this group
40	}
41
42	// Capture is a single capture of text within the larger original string
43	type Capture struct {
44	// the original string
45	text []rune
46	// the position in the original string where the first character of
47	// captured substring was found.
48	Index int
49	// the length of the captured substring.
50	Length int
51	}
52
53	// String returns the captured text as a String
54	func (c *Capture) String() string {
55	return string(c.text[c.Index : c.Index+c.Length])
56	}
57
58	// Runes returns the captured text as a rune slice
59	func (c *Capture) Runes() []rune {
60	return c.text[c.Index : c.Index+c.Length]
61	}
62
63	func newMatch(regex Regexp, capcount int, text []rune, startpos int) Match {
64	m := Match{
65	regex: regex,
66	matchcount: make([]int, capcount),
67	matches: make([][]int, capcount),
68	textstart: startpos,
69	balancing: false,
70	}
71	m.Name = "0"
72	m.text = text
73	m.matches[0] = make([]int, 2)
74	return &m
75	}
76
77	func newMatchSparse(regex Regexp, caps map[int]int, capcount int, text []rune, startpos int) Match {
78	m := newMatch(regex, capcount, text, startpos)
79	m.sparseCaps = caps
80	return m
81	}
82
83	func (m *Match) reset(text []rune, textstart int) {
84	m.text = text
85	m.textstart = textstart
86	for i := 0; i < len(m.matchcount); i++ {
87	m.matchcount[i] = 0
88	}
89	m.balancing = false
90	}
91
92	func (m *Match) tidy(textpos int) {
93
94	interval := m.matches[0]
95	m.Index = interval[0]
96	m.Length = interval[1]
97	m.textpos = textpos
98	m.capcount = m.matchcount[0]
99	//copy our root capture to the list
100	m.Group.Captures = []Capture{m.Group.Capture}
101
102	if m.balancing {
103	// The idea here is that we want to compact all of our unbalanced captures. To do that we
104	// use j basically as a count of how many unbalanced captures we have at any given time
105	// (really j is an index, but j/2 is the count). First we skip past all of the real captures
106	// until we find a balance captures. Then we check each subsequent entry. If it's a balance
107	// capture (it's negative), we decrement j. If it's a real capture, we increment j and copy
108	// it down to the last free position.
109	for cap := 0; cap < len(m.matchcount); cap++ {
110	limit := m.matchcount[cap] * 2
111	matcharray := m.matches[cap]
112
113	var i, j int
114
115	for i = 0; i < limit; i++ {
116	if matcharray[i] < 0 {
117	break
118	}
119	}
120
121	for j = i; i < limit; i++ {
122	if matcharray[i] < 0 {
123	// skip negative values
124	j--
125	} else {
126	// but if we find something positive (an actual capture), copy it back to the last
127	// unbalanced position.
128	if i != j {
129	matcharray[j] = matcharray[i]
130	}
131	j++
132	}
133	}
134
135	m.matchcount[cap] = j / 2
136	}
137
138	m.balancing = false
139	}
140	}
141
142	// isMatched tells if a group was matched by capnum
143	func (m *Match) isMatched(cap int) bool {
144	return cap < len(m.matchcount) && m.matchcount[cap] > 0 && m.matches[cap][m.matchcount[cap]*2-1] != (-3+1)
145	}
146
147	// matchIndex returns the index of the last specified matched group by capnum
148	func (m *Match) matchIndex(cap int) int {
149	i := m.matches[cap][m.matchcount[cap]*2-2]
150	if i >= 0 {
151	return i
152	}
153
154	return m.matches[cap][-3-i]
155	}
156
157	// matchLength returns the length of the last specified matched group by capnum
158	func (m *Match) matchLength(cap int) int {
159	i := m.matches[cap][m.matchcount[cap]*2-1]
160	if i >= 0 {
161	return i
162	}
163
164	return m.matches[cap][-3-i]
165	}
166
167	// Nonpublic builder: add a capture to the group specified by "c"
168	func (m *Match) addMatch(c, start, l int) {
169
170	if m.matches[c] == nil {
171	m.matches[c] = make([]int, 2)
172	}
173
174	capcount := m.matchcount[c]
175
176	if capcount*2+2 > len(m.matches[c]) {
177	oldmatches := m.matches[c]
178	newmatches := make([]int, capcount*8)
179	copy(newmatches, oldmatches[:capcount*2])
180	m.matches[c] = newmatches
181	}
182
183	m.matches[c][capcount*2] = start
184	m.matches[c][capcount*2+1] = l
185	m.matchcount[c] = capcount + 1
186	//log.Printf("addMatch: c=%v, i=%v, l=%v ... matches: %v", c, start, l, m.matches)
187	}
188
189	// Nonpublic builder: Add a capture to balance the specified group. This is used by the
190	// balanced match construct. (?<foo-foo2>...)
191	//
192	// If there were no such thing as backtracking, this would be as simple as calling RemoveMatch(c).
193	// However, since we have backtracking, we need to keep track of everything.
194	func (m *Match) balanceMatch(c int) {
195	m.balancing = true
196
197	// we'll look at the last capture first
198	capcount := m.matchcount[c]
199	target := capcount*2 - 2
200
201	// first see if it is negative, and therefore is a reference to the next available
202	// capture group for balancing. If it is, we'll reset target to point to that capture.
203	if m.matches[c][target] < 0 {
204	target = -3 - m.matches[c][target]
205	}
206
207	// move back to the previous capture
208	target -= 2
209
210	// if the previous capture is a reference, just copy that reference to the end. Otherwise, point to it.
211	if target >= 0 && m.matches[c][target] < 0 {
212	m.addMatch(c, m.matches[c][target], m.matches[c][target+1])
213	} else {
214	m.addMatch(c, -3-target, -4-target /* == -3 - (target + 1) */)
215	}
216	}
217
218	// Nonpublic builder: removes a group match by capnum
219	func (m *Match) removeMatch(c int) {
220	m.matchcount[c]--
221	}
222
223	// GroupCount returns the number of groups this match has matched
224	func (m *Match) GroupCount() int {
225	return len(m.matchcount)
226	}
227
228	// GroupByName returns a group based on the name of the group, or nil if the group name does not exist
229	func (m Match) GroupByName(name string) Group {
230	num := m.regex.GroupNumberFromName(name)
231	if num < 0 {
232	return nil
233	}
234	return m.GroupByNumber(num)
235	}
236
237	// GroupByNumber returns a group based on the number of the group, or nil if the group number does not exist
238	func (m Match) GroupByNumber(num int) Group {
239	// check our sparse map
240	if m.sparseCaps != nil {
241	if newNum, ok := m.sparseCaps[num]; ok {
242	num = newNum
243	}
244	}
245	if num >= len(m.matchcount) \|\| num < 0 {
246	return nil
247	}
248
249	if num == 0 {
250	return &m.Group
251	}
252
253	m.populateOtherGroups()
254
255	return &m.otherGroups[num-1]
256	}
257
258	// Groups returns all the capture groups, starting with group 0 (the full match)
259	func (m *Match) Groups() []Group {
260	m.populateOtherGroups()
261	g := make([]Group, len(m.otherGroups)+1)
262	g[0] = m.Group
263	copy(g[1:], m.otherGroups)
264	return g
265	}
266
267	func (m *Match) populateOtherGroups() {
268	// Construct all the Group objects first time called
269	if m.otherGroups == nil {
270	m.otherGroups = make([]Group, len(m.matchcount)-1)
271	for i := 0; i < len(m.otherGroups); i++ {
272	m.otherGroups[i] = newGroup(m.regex.GroupNameFromNumber(i+1), m.text, m.matches[i+1], m.matchcount[i+1])
273	}
274	}
275	}
276
277	func (m Match) groupValueAppendToBuf(groupnum int, buf bytes.Buffer) {
278	c := m.matchcount[groupnum]
279	if c == 0 {
280	return
281	}
282
283	matches := m.matches[groupnum]
284
285	index := matches[(c-1)*2]
286	last := index + matches[(c*2)-1]
287
288	for ; index < last; index++ {
289	buf.WriteRune(m.text[index])
290	}
291	}
292
293	func newGroup(name string, text []rune, caps []int, capcount int) Group {
294	g := Group{}
295	g.text = text
296	if capcount > 0 {
297	g.Index = caps[(capcount-1)*2]
298	g.Length = caps[(capcount*2)-1]
299	}
300	g.Name = name
301	g.Captures = make([]Capture, capcount)
302	for i := 0; i < capcount; i++ {
303	g.Captures[i] = Capture{
304	text: text,
305	Index: caps[i*2],
306	Length: caps[i*2+1],
307	}
308	}
309	//log.Printf("newGroup! capcount %v, %+v", capcount, g)
310
311	return g
312	}
313
314	func (m *Match) dump() string {
315	buf := &bytes.Buffer{}
316	buf.WriteRune('\n')
317	if len(m.sparseCaps) > 0 {
318	for k, v := range m.sparseCaps {
319	fmt.Fprintf(buf, "Slot %v -> %v\n", k, v)
320	}
321	}
322
323	for i, g := range m.Groups() {
324	fmt.Fprintf(buf, "Group %v (%v), %v caps:\n", i, g.Name, len(g.Captures))
325
326	for _, c := range g.Captures {
327	fmt.Fprintf(buf, " (%v, %v) %v\n", c.Index, c.Length, c.String())
328	}
329	}
330	/*
331	for i := 0; i < len(m.matchcount); i++ {
332	fmt.Fprintf(buf, "\nGroup %v (%v):\n", i, m.regex.GroupNameFromNumber(i))
333
334	for j := 0; j < m.matchcount[i]; j++ {
335	text := ""
336
337	if m.matches[i][j*2] >= 0 {
338	start := m.matches[i][j*2]
339	text = m.text[start : start+m.matches[i][j*2+1]]
340	}
341
342	fmt.Fprintf(buf, " (%v, %v) %v\n", m.matches[i][j2], m.matches[i][j2+1], text)
343	}
344	}
345	*/
346	return buf.String()
347	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats: