summaryrefslogtreecommitdiffstats
path: root/utils.go
blob: e91ae44a10fb57b3cb28e72ae436febd98b749d9 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
package bibtex

import (
	"bytes"
	"strings"
	"unicode"
)

// reader wraps a strings.Reader over a LaTeX string and adds helper methods
// for walking it rune by rune: brace-group handling, one-rune lookahead and
// reading command names (see the methods defined on *reader in this file).
type reader struct {
	// Embedded so that ReadRune and UnreadRune are promoted onto reader.
	*strings.Reader
}

// newReader returns a reader positioned at the beginning of s.
func newReader(s string) *reader {
	src := strings.NewReader(s)
	return &reader{Reader: src}
}

// readRune consumes and returns the next rune of the underlying string.
//
// The size and error results of ReadRune are deliberately discarded: callers
// only look at the rune value. When ReadRune fails (for a strings.Reader that
// means end of input) the rune it hands back is returned unchanged.
func (r *reader) readRune() rune {
	ch, _, _ := r.ReadRune()
	return ch
}

// readBraces consumes a brace group and returns the text it read.
//
// Scanning starts at nesting depth 1, i.e. the opening '{' is expected to
// have been consumed already. Nested groups are tracked, and reading stops
// right after the '}' that brings the depth back to zero; that closing brace
// is part of the returned string. If eof is read first, the text collected so
// far is returned (the eof rune itself is not appended).
func (r *reader) readBraces() string {
	var out bytes.Buffer
	for depth := 1; depth > 0; {
		ch := r.readRune()
		switch ch {
		case '{':
			depth++
		case '}':
			depth--
		case eof:
			// Unterminated group: hand back what has been gathered.
			return out.String()
		}
		out.WriteRune(ch)
	}
	return out.String()
}

// skipBraces discards input up to and including the '}' that closes the
// current brace group. It starts at nesting depth 1, so the opening '{' is
// expected to have been consumed already. Nested groups are skipped as a
// whole. Reading eof ends the skip early.
func (r *reader) skipBraces() {
	for depth := 1; depth > 0; {
		switch r.readRune() {
		case '{':
			depth++
		case '}':
			depth--
		case eof:
			return
		}
	}
}

// peek returns the next rune without consuming it: the rune is read and then
// pushed back with UnreadRune.
func (r *reader) peek() rune {
	next := r.readRune()
	// The error from UnreadRune is ignored, as in the rest of this reader.
	_ = r.UnreadRune()
	return next
}

// length returns the length of the LaTeX string s.
//
// Every rune counts as one, braces included. The exception is a "special
// character": a brace group opened at nesting depth zero whose first rune is
// a backslash. Such a group is consumed as a whole and counts as one.
//
// Braces are counted to stay consistent with the original BibTeX
// implementation, even though that choice is questionable.
func length(s string) (res int) {
	rd := newReader(s)
	depth := 0
	for {
		ch := rd.readRune()
		if ch == eof {
			return res
		}
		switch ch {
		case '{':
			depth++
			// depth == 1 means this brace opened a top-level group; only
			// then can it introduce a special character.
			if depth == 1 && rd.peek() == '\\' {
				// Swallow the rest of the group so it is counted once below.
				rd.skipBraces()
				depth = 0
			}
		case '}':
			depth--
		}
		res++
	}
}

// searchBraces scans the remainder of the current brace group (starting at
// nesting depth 1) for the first rune that is a lower- or upper-case letter.
//
// The second result reports whether such a rune was found; when it is true,
// the first result is true for a lower-case rune and false for an upper-case
// one. If the group closes or eof is read before any cased rune shows up,
// both results are false.
func (r *reader) searchBraces() (bool, bool) {
	for depth := 1; depth > 0; {
		switch ch := r.readRune(); ch {
		case '{':
			depth++
		case '}':
			depth--
		default:
			switch {
			case unicode.IsLower(ch):
				return true, true
			case unicode.IsUpper(ch):
				return false, true
			case ch == eof:
				return false, false
			}
		}
	}
	return false, false
}

// readCommand reads the longest run of letters at the current position and
// returns it (possibly the empty string). The first non-letter rune is pushed
// back so the caller sees it next; reading eof simply ends the run.
func (r *reader) readCommand() string {
	var name bytes.Buffer
	for {
		ch := r.readRune()
		if ch == eof {
			break
		}
		if !unicode.IsLetter(ch) {
			// Not part of the name: leave it for the caller.
			r.UnreadRune()
			break
		}
		name.WriteRune(ch)
	}
	return name.String()
}

// isLower reports whether the first cased element of the LaTeX string s is
// lower case.
//
// Runes are examined in order:
//   - a lower-case rune yields true, an upper-case rune yields false;
//   - a brace group that starts with a backslash is treated as a command:
//     its name is looked up in lcommands (true) and ucommands (false), and
//     otherwise the rest of the group is searched for the first cased rune;
//     if none is found, scanning continues after the group;
//   - any other brace group is skipped entirely.
//
// If the input ends without a decision, the result is false.
func isLower(s string) bool {
	rd := newReader(s)
	for {
		ch := rd.readRune()
		if ch == eof {
			return false
		}

		if ch == '{' {
			if rd.readRune() != '\\' {
				// Plain group: put the rune back and ignore the whole group.
				rd.UnreadRune()
				rd.skipBraces()
				continue
			}
			name := rd.readCommand()
			if lcommands[name] {
				return true
			}
			if ucommands[name] {
				return false
			}
			if lower, found := rd.searchBraces(); found {
				return lower
			}
			continue
		}

		if unicode.IsLower(ch) {
			return true
		}
		if unicode.IsUpper(ch) {
			return false
		}
	}
}