74
|
1 //
|
|
2 // Copyright (c) 2011-2019 Canonical Ltd
|
|
3 // Copyright (c) 2006-2010 Kirill Simonov
|
|
4 //
|
|
5 // Permission is hereby granted, free of charge, to any person obtaining a copy of
|
|
6 // this software and associated documentation files (the "Software"), to deal in
|
|
7 // the Software without restriction, including without limitation the rights to
|
|
8 // use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
|
|
9 // of the Software, and to permit persons to whom the Software is furnished to do
|
|
10 // so, subject to the following conditions:
|
|
11 //
|
|
12 // The above copyright notice and this permission notice shall be included in all
|
|
13 // copies or substantial portions of the Software.
|
|
14 //
|
|
15 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
16 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
17 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
18 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
19 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
20 // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
21 // SOFTWARE.
|
|
22
|
|
23 package yaml
|
|
24
|
|
const (
	// Number of bytes in the raw input buffer.
	input_raw_buffer_size = 512

	// Number of bytes in the input buffer. It is three times the raw
	// buffer size so that the whole raw buffer can be decoded into it.
	input_buffer_size = 3 * input_raw_buffer_size

	// Number of bytes in the output buffer.
	output_buffer_size = 128

	// Number of bytes in the raw output buffer. It is twice the output
	// buffer size plus two so that the whole output buffer can be encoded
	// into it.
	output_raw_buffer_size = 2*output_buffer_size + 2

	// Sizes used for the remaining stacks, queues, and strings.
	initial_stack_size  = 16
	initial_queue_size  = 16
	initial_string_size = 16
)
|
|
45
|
|
// Report whether the byte at position i is an ASCII letter, an ASCII digit,
// an underscore, or a hyphen.
func is_alpha(b []byte, i int) bool {
	c := b[i]
	switch {
	case c >= '0' && c <= '9', c >= 'A' && c <= 'Z', c >= 'a' && c <= 'z':
		return true
	}
	return c == '_' || c == '-'
}
|
|
51
|
|
// Report whether the byte at position i is an ASCII decimal digit.
func is_digit(b []byte, i int) bool {
	c := b[i]
	return '0' <= c && c <= '9'
}
|
|
56
|
|
// Return the numeric value of the decimal digit at position i.
// The byte is not validated: the result is simply its offset from '0'.
func as_digit(b []byte, i int) int {
	c := int(b[i])
	return c - '0'
}
|
|
61
|
|
// Report whether the byte at position i is an ASCII hexadecimal digit
// (0-9, A-F, or a-f).
func is_hex(b []byte, i int) bool {
	c := b[i]
	switch {
	case c >= '0' && c <= '9':
		return true
	case c >= 'A' && c <= 'F':
		return true
	case c >= 'a' && c <= 'f':
		return true
	}
	return false
}
|
|
66
|
|
// Return the numeric value of the hexadecimal digit at position i.
// Letters A-F and a-f map to 10-15; any other byte is returned as its
// offset from '0' without validation.
func as_hex(b []byte, i int) int {
	c := int(b[i])
	switch {
	case c >= 'A' && c <= 'F':
		return c - 'A' + 10
	case c >= 'a' && c <= 'f':
		return c - 'a' + 10
	default:
		return c - '0'
	}
}
|
|
78
|
|
// Report whether the byte at position i is in the ASCII range (below 0x80).
func is_ascii(b []byte, i int) bool {
	return b[i] < 0x80
}
|
|
83
|
|
// Report whether the UTF-8 encoded character starting at position i can be
// printed unescaped.
//
// Accepted are the line feed, #x20-#x7E, #xA0-#xD7FF, and #xE000-#xFFFD
// except #xFEFF. Every other leading byte yields false. The second and third
// bytes of the sequence are only read when the leading byte requires them.
func is_printable(b []byte, i int) bool {
	c := b[i]
	switch {
	case c == 0x0A: // . == #x0A
		return true
	case c >= 0x20 && c <= 0x7E: // #x20 <= . <= #x7E
		return true
	case c == 0xC2: // lower end of #xA0 <= . <= #xD7FF
		return b[i+1] >= 0xA0
	case c > 0xC2 && c < 0xED:
		return true
	case c == 0xED: // upper end of #xA0 <= . <= #xD7FF
		return b[i+1] < 0xA0
	case c == 0xEE:
		return true
	case c == 0xEF: // #xE000 <= . <= #xFFFD
		if b[i+1] == 0xBB && b[i+2] == 0xBF {
			// . == #xFEFF
			return false
		}
		if b[i+1] == 0xBF && (b[i+2] == 0xBE || b[i+2] == 0xBF) {
			// . == #xFFFE or . == #xFFFF
			return false
		}
		return true
	}
	return false
}
|
|
96
|
|
// Report whether the byte at position i is the NUL byte.
func is_z(b []byte, i int) bool {
	c := b[i]
	return c == 0
}
|
|
101
|
|
// Check if the character at the specified position is a BOM, that is, if the
// three bytes starting at position i are the UTF-8 encoding of #xFEFF
// (0xEF 0xBB 0xBF).
//
// The check is made at position i rather than at the start of the buffer, so
// a BOM is only reported where it actually occurs. When fewer than three
// bytes remain from position i the result is false.
func is_bom(b []byte, i int) bool {
	// The length guard keeps the look-ahead at i+1 and i+2 inside the slice.
	return i+2 < len(b) && b[i] == 0xEF && b[i+1] == 0xBB && b[i+2] == 0xBF
}
|
|
106
|
|
// Report whether the byte at position i is the space character (0x20).
func is_space(b []byte, i int) bool {
	return b[i] == 0x20
}
|
|
111
|
|
// Report whether the byte at position i is the horizontal tab (0x09).
func is_tab(b []byte, i int) bool {
	return b[i] == 0x09
}
|
|
116
|
|
// Report whether the byte at position i is blank, meaning a space or a tab.
// This is the combination of is_space and is_tab, written out inline.
func is_blank(b []byte, i int) bool {
	switch b[i] {
	case ' ', '\t':
		return true
	}
	return false
}
|
|
122
|
|
// Report whether a line break starts at position i. Recognised breaks are
// CR, LF, and the UTF-8 encodings of NEL (#x85), LS (#x2028), and PS (#x2029).
// Bytes after position i are only read for the multi-byte breaks.
func is_break(b []byte, i int) bool {
	switch b[i] {
	case '\r', '\n': // CR (#xD), LF (#xA)
		return true
	case 0xC2: // NEL (#x85)
		return b[i+1] == 0x85
	case 0xE2: // LS (#x2028), PS (#x2029)
		return b[i+1] == 0x80 && (b[i+2] == 0xA8 || b[i+2] == 0xA9)
	}
	return false
}
|
|
131
|
|
// Report whether a CR immediately followed by an LF starts at position i.
// The byte at i+1 is only read when the byte at i is a CR.
func is_crlf(b []byte, i int) bool {
	if b[i] != '\r' {
		return false
	}
	return b[i+1] == '\n'
}
|
|
135
|
|
// Report whether a line break or a NUL byte starts at position i.
// This is the combination of is_break and is_z, written out inline.
func is_breakz(b []byte, i int) bool {
	switch b[i] {
	case '\r', '\n': // CR (#xD), LF (#xA)
		return true
	case 0xC2: // NEL (#x85)
		return b[i+1] == 0x85
	case 0xE2: // LS (#x2028), PS (#x2029)
		return b[i+1] == 0x80 && (b[i+2] == 0xA8 || b[i+2] == 0xA9)
	case 0: // NUL
		return true
	}
	return false
}
|
|
149
|
|
// Report whether a space, a line break, or a NUL byte starts at position i.
// This is the combination of is_space and is_breakz, written out inline.
func is_spacez(b []byte, i int) bool {
	switch b[i] {
	case ' ': // space
		return true
	case '\r', '\n': // CR (#xD), LF (#xA)
		return true
	case 0xC2: // NEL (#x85)
		return b[i+1] == 0x85
	case 0xE2: // LS (#x2028), PS (#x2029)
		return b[i+1] == 0x80 && (b[i+2] == 0xA8 || b[i+2] == 0xA9)
	case 0: // NUL
		return true
	}
	return false
}
|
|
164
|
|
// Report whether a space, a tab, a line break, or a NUL byte starts at
// position i. This is the combination of is_blank and is_breakz, written out
// inline.
func is_blankz(b []byte, i int) bool {
	switch b[i] {
	case ' ', '\t': // blank
		return true
	case '\r', '\n': // CR (#xD), LF (#xA)
		return true
	case 0xC2: // NEL (#x85)
		return b[i+1] == 0x85
	case 0xE2: // LS (#x2028), PS (#x2029)
		return b[i+1] == 0x80 && (b[i+2] == 0xA8 || b[i+2] == 0xA9)
	case 0: // NUL
		return true
	}
	return false
}
|
|
179
|
|
// Return the length in bytes of the UTF-8 sequence introduced by the leading
// byte b: 1 to 4 for a valid leading byte, 0 for any other byte.
func width(b byte) int {
	// Keep this as a chain of plain ifs: don't turn it into a switch
	// without first confirming that the function is still being inlined.
	if b < 0x80 { // 0xxxxxxx
		return 1
	}
	if b>>5 == 0x06 { // 110xxxxx
		return 2
	}
	if b>>4 == 0x0E { // 1110xxxx
		return 3
	}
	if b>>3 == 0x1E { // 11110xxx
		return 4
	}
	return 0
}
|