diff options
author | Rutger Broekhoff | 2023-12-29 21:31:53 +0100 |
---|---|---|
committer | Rutger Broekhoff | 2023-12-29 21:31:53 +0100 |
commit | 404aeae4545d2426c089a5f8d5e82dae56f5212b (patch) | |
tree | 2d84e00af272b39fc04f3795ae06bc48970e57b5 /vendor/github.com/json-iterator/go/iter_str.go | |
parent | 209d8b0187ed025dec9ac149ebcced3462877bff (diff) | |
download | gitolfs3-404aeae4545d2426c089a5f8d5e82dae56f5212b.tar.gz gitolfs3-404aeae4545d2426c089a5f8d5e82dae56f5212b.zip |
Make Nix builds work
Diffstat (limited to 'vendor/github.com/json-iterator/go/iter_str.go')
-rw-r--r-- | vendor/github.com/json-iterator/go/iter_str.go | 215 |
1 files changed, 215 insertions, 0 deletions
diff --git a/vendor/github.com/json-iterator/go/iter_str.go b/vendor/github.com/json-iterator/go/iter_str.go new file mode 100644 index 0000000..adc487e --- /dev/null +++ b/vendor/github.com/json-iterator/go/iter_str.go | |||
@@ -0,0 +1,215 @@ | |||
1 | package jsoniter | ||
2 | |||
3 | import ( | ||
4 | "fmt" | ||
5 | "unicode/utf16" | ||
6 | ) | ||
7 | |||
8 | // ReadString read string from iterator | ||
9 | func (iter *Iterator) ReadString() (ret string) { | ||
10 | c := iter.nextToken() | ||
11 | if c == '"' { | ||
12 | for i := iter.head; i < iter.tail; i++ { | ||
13 | c := iter.buf[i] | ||
14 | if c == '"' { | ||
15 | ret = string(iter.buf[iter.head:i]) | ||
16 | iter.head = i + 1 | ||
17 | return ret | ||
18 | } else if c == '\\' { | ||
19 | break | ||
20 | } else if c < ' ' { | ||
21 | iter.ReportError("ReadString", | ||
22 | fmt.Sprintf(`invalid control character found: %d`, c)) | ||
23 | return | ||
24 | } | ||
25 | } | ||
26 | return iter.readStringSlowPath() | ||
27 | } else if c == 'n' { | ||
28 | iter.skipThreeBytes('u', 'l', 'l') | ||
29 | return "" | ||
30 | } | ||
31 | iter.ReportError("ReadString", `expects " or n, but found `+string([]byte{c})) | ||
32 | return | ||
33 | } | ||
34 | |||
35 | func (iter *Iterator) readStringSlowPath() (ret string) { | ||
36 | var str []byte | ||
37 | var c byte | ||
38 | for iter.Error == nil { | ||
39 | c = iter.readByte() | ||
40 | if c == '"' { | ||
41 | return string(str) | ||
42 | } | ||
43 | if c == '\\' { | ||
44 | c = iter.readByte() | ||
45 | str = iter.readEscapedChar(c, str) | ||
46 | } else { | ||
47 | str = append(str, c) | ||
48 | } | ||
49 | } | ||
50 | iter.ReportError("readStringSlowPath", "unexpected end of input") | ||
51 | return | ||
52 | } | ||
53 | |||
54 | func (iter *Iterator) readEscapedChar(c byte, str []byte) []byte { | ||
55 | switch c { | ||
56 | case 'u': | ||
57 | r := iter.readU4() | ||
58 | if utf16.IsSurrogate(r) { | ||
59 | c = iter.readByte() | ||
60 | if iter.Error != nil { | ||
61 | return nil | ||
62 | } | ||
63 | if c != '\\' { | ||
64 | iter.unreadByte() | ||
65 | str = appendRune(str, r) | ||
66 | return str | ||
67 | } | ||
68 | c = iter.readByte() | ||
69 | if iter.Error != nil { | ||
70 | return nil | ||
71 | } | ||
72 | if c != 'u' { | ||
73 | str = appendRune(str, r) | ||
74 | return iter.readEscapedChar(c, str) | ||
75 | } | ||
76 | r2 := iter.readU4() | ||
77 | if iter.Error != nil { | ||
78 | return nil | ||
79 | } | ||
80 | combined := utf16.DecodeRune(r, r2) | ||
81 | if combined == '\uFFFD' { | ||
82 | str = appendRune(str, r) | ||
83 | str = appendRune(str, r2) | ||
84 | } else { | ||
85 | str = appendRune(str, combined) | ||
86 | } | ||
87 | } else { | ||
88 | str = appendRune(str, r) | ||
89 | } | ||
90 | case '"': | ||
91 | str = append(str, '"') | ||
92 | case '\\': | ||
93 | str = append(str, '\\') | ||
94 | case '/': | ||
95 | str = append(str, '/') | ||
96 | case 'b': | ||
97 | str = append(str, '\b') | ||
98 | case 'f': | ||
99 | str = append(str, '\f') | ||
100 | case 'n': | ||
101 | str = append(str, '\n') | ||
102 | case 'r': | ||
103 | str = append(str, '\r') | ||
104 | case 't': | ||
105 | str = append(str, '\t') | ||
106 | default: | ||
107 | iter.ReportError("readEscapedChar", | ||
108 | `invalid escape char after \`) | ||
109 | return nil | ||
110 | } | ||
111 | return str | ||
112 | } | ||
113 | |||
114 | // ReadStringAsSlice read string from iterator without copying into string form. | ||
115 | // The []byte can not be kept, as it will change after next iterator call. | ||
116 | func (iter *Iterator) ReadStringAsSlice() (ret []byte) { | ||
117 | c := iter.nextToken() | ||
118 | if c == '"' { | ||
119 | for i := iter.head; i < iter.tail; i++ { | ||
120 | // require ascii string and no escape | ||
121 | // for: field name, base64, number | ||
122 | if iter.buf[i] == '"' { | ||
123 | // fast path: reuse the underlying buffer | ||
124 | ret = iter.buf[iter.head:i] | ||
125 | iter.head = i + 1 | ||
126 | return ret | ||
127 | } | ||
128 | } | ||
129 | readLen := iter.tail - iter.head | ||
130 | copied := make([]byte, readLen, readLen*2) | ||
131 | copy(copied, iter.buf[iter.head:iter.tail]) | ||
132 | iter.head = iter.tail | ||
133 | for iter.Error == nil { | ||
134 | c := iter.readByte() | ||
135 | if c == '"' { | ||
136 | return copied | ||
137 | } | ||
138 | copied = append(copied, c) | ||
139 | } | ||
140 | return copied | ||
141 | } | ||
142 | iter.ReportError("ReadStringAsSlice", `expects " or n, but found `+string([]byte{c})) | ||
143 | return | ||
144 | } | ||
145 | |||
146 | func (iter *Iterator) readU4() (ret rune) { | ||
147 | for i := 0; i < 4; i++ { | ||
148 | c := iter.readByte() | ||
149 | if iter.Error != nil { | ||
150 | return | ||
151 | } | ||
152 | if c >= '0' && c <= '9' { | ||
153 | ret = ret*16 + rune(c-'0') | ||
154 | } else if c >= 'a' && c <= 'f' { | ||
155 | ret = ret*16 + rune(c-'a'+10) | ||
156 | } else if c >= 'A' && c <= 'F' { | ||
157 | ret = ret*16 + rune(c-'A'+10) | ||
158 | } else { | ||
159 | iter.ReportError("readU4", "expects 0~9 or a~f, but found "+string([]byte{c})) | ||
160 | return | ||
161 | } | ||
162 | } | ||
163 | return ret | ||
164 | } | ||
165 | |||
// UTF-8 encoding parameters used by appendRune.
const (
	// Leading-bit patterns of UTF-8 bytes.
	t1 = 0x00 // 0000 0000
	tx = 0x80 // 1000 0000
	t2 = 0xC0 // 1100 0000
	t3 = 0xE0 // 1110 0000
	t4 = 0xF0 // 1111 0000
	t5 = 0xF8 // 1111 1000

	// Payload-bit masks.
	maskx = 0x3F // 0011 1111
	mask2 = 0x1F // 0001 1111
	mask3 = 0x0F // 0000 1111
	mask4 = 0x07 // 0000 0111

	// Largest code point encodable in one, two and three bytes.
	rune1Max = 1<<7 - 1
	rune2Max = 1<<11 - 1
	rune3Max = 1<<16 - 1

	// Bounds of the UTF-16 surrogate range, which is not valid in UTF-8.
	surrogateMin = 0xD800
	surrogateMax = 0xDFFF

	maxRune   = '\U0010FFFF' // Maximum valid Unicode code point.
	runeError = '\uFFFD'     // the "error" Rune or "Unicode replacement character"
)

// appendRune appends the UTF-8 encoding of r to p and returns the extended
// slice. Runes that are negative, above maxRune, or inside the surrogate
// range are encoded as runeError (U+FFFD).
func appendRune(p []byte, r rune) []byte {
	// Viewed as unsigned, a negative rune becomes a huge value and is
	// caught by the "> maxRune" check below.
	u := uint32(r)
	if u <= rune1Max {
		return append(p, byte(r))
	}
	if u <= rune2Max {
		return append(p,
			t2|byte(r>>6),
			tx|byte(r)&maskx)
	}
	if u > maxRune || (surrogateMin <= u && u <= surrogateMax) {
		// Invalid code point: substitute the replacement character, which
		// is encoded in three bytes.
		r = runeError
		u = uint32(r)
	}
	if u <= rune3Max {
		return append(p,
			t3|byte(r>>12),
			tx|byte(r>>6)&maskx,
			tx|byte(r)&maskx)
	}
	return append(p,
		t4|byte(r>>18),
		tx|byte(r>>12)&maskx,
		tx|byte(r>>6)&maskx,
		tx|byte(r)&maskx)
}