diff options
author | Rutger Broekhoff | 2023-12-29 21:31:53 +0100 |
---|---|---|
committer | Rutger Broekhoff | 2023-12-29 21:31:53 +0100 |
commit | 404aeae4545d2426c089a5f8d5e82dae56f5212b (patch) | |
tree | 2d84e00af272b39fc04f3795ae06bc48970e57b5 /vendor/github.com/klauspost/compress/s2/lz4sconvert.go | |
parent | 209d8b0187ed025dec9ac149ebcced3462877bff (diff) | |
download | gitolfs3-404aeae4545d2426c089a5f8d5e82dae56f5212b.tar.gz gitolfs3-404aeae4545d2426c089a5f8d5e82dae56f5212b.zip |
Make Nix builds work
Diffstat (limited to 'vendor/github.com/klauspost/compress/s2/lz4sconvert.go')
-rw-r--r-- | vendor/github.com/klauspost/compress/s2/lz4sconvert.go | 467 |
1 files changed, 467 insertions, 0 deletions
diff --git a/vendor/github.com/klauspost/compress/s2/lz4sconvert.go b/vendor/github.com/klauspost/compress/s2/lz4sconvert.go new file mode 100644 index 0000000..000f397 --- /dev/null +++ b/vendor/github.com/klauspost/compress/s2/lz4sconvert.go | |||
@@ -0,0 +1,467 @@ | |||
1 | // Copyright (c) 2022 Klaus Post. All rights reserved. | ||
2 | // Use of this source code is governed by a BSD-style | ||
3 | // license that can be found in the LICENSE file. | ||
4 | |||
5 | package s2 | ||
6 | |||
7 | import ( | ||
8 | "encoding/binary" | ||
9 | "fmt" | ||
10 | ) | ||
11 | |||
// LZ4sConverter converts LZ4s blocks (Intel's modified LZ4 block format)
// into other block formats.
//
// Reference:
// https://cdrdv2-public.intel.com/743912/743912-qat-programmers-guide-v2.0.pdf
//
// LZ4s is a variant of the LZ4 block format and should be considered an
// intermediate compressed block format. It is selected when the application
// sets compType to CPA_DC_LZ4S in CpaDcSessionSetupData. The LZ4s block
// returned by the Intel® QAT hardware can be post-processed by external
// software to generate other compressed data formats.
//
// LZ4s uses the same high-level formatting as the LZ4 block format, with the
// following encoding change: for a minimum match of 4 bytes, a copy length
// value of 1-15 means a length of 4-18, with 18 bytes adding an extra byte.
//
// ONLY "Min match of 4 bytes" is supported.
type LZ4sConverter struct{}
25 | |||
26 | // ConvertBlock will convert an LZ4s block and append it as an S2 | ||
27 | // block without block length to dst. | ||
28 | // The uncompressed size is returned as well. | ||
29 | // dst must have capacity to contain the entire compressed block. | ||
30 | func (l *LZ4sConverter) ConvertBlock(dst, src []byte) ([]byte, int, error) { | ||
31 | if len(src) == 0 { | ||
32 | return dst, 0, nil | ||
33 | } | ||
34 | const debug = false | ||
35 | const inline = true | ||
36 | const lz4MinMatch = 3 | ||
37 | |||
38 | s, d := 0, len(dst) | ||
39 | dst = dst[:cap(dst)] | ||
40 | if !debug && hasAmd64Asm { | ||
41 | res, sz := cvtLZ4sBlockAsm(dst[d:], src) | ||
42 | if res < 0 { | ||
43 | const ( | ||
44 | errCorrupt = -1 | ||
45 | errDstTooSmall = -2 | ||
46 | ) | ||
47 | switch res { | ||
48 | case errCorrupt: | ||
49 | return nil, 0, ErrCorrupt | ||
50 | case errDstTooSmall: | ||
51 | return nil, 0, ErrDstTooSmall | ||
52 | default: | ||
53 | return nil, 0, fmt.Errorf("unexpected result: %d", res) | ||
54 | } | ||
55 | } | ||
56 | if d+sz > len(dst) { | ||
57 | return nil, 0, ErrDstTooSmall | ||
58 | } | ||
59 | return dst[:d+sz], res, nil | ||
60 | } | ||
61 | |||
62 | dLimit := len(dst) - 10 | ||
63 | var lastOffset uint16 | ||
64 | var uncompressed int | ||
65 | if debug { | ||
66 | fmt.Printf("convert block start: len(src): %d, len(dst):%d \n", len(src), len(dst)) | ||
67 | } | ||
68 | |||
69 | for { | ||
70 | if s >= len(src) { | ||
71 | return dst[:d], 0, ErrCorrupt | ||
72 | } | ||
73 | // Read literal info | ||
74 | token := src[s] | ||
75 | ll := int(token >> 4) | ||
76 | ml := int(lz4MinMatch + (token & 0xf)) | ||
77 | |||
78 | // If upper nibble is 15, literal length is extended | ||
79 | if token >= 0xf0 { | ||
80 | for { | ||
81 | s++ | ||
82 | if s >= len(src) { | ||
83 | if debug { | ||
84 | fmt.Printf("error reading ll: s (%d) >= len(src) (%d)\n", s, len(src)) | ||
85 | } | ||
86 | return dst[:d], 0, ErrCorrupt | ||
87 | } | ||
88 | val := src[s] | ||
89 | ll += int(val) | ||
90 | if val != 255 { | ||
91 | break | ||
92 | } | ||
93 | } | ||
94 | } | ||
95 | // Skip past token | ||
96 | if s+ll >= len(src) { | ||
97 | if debug { | ||
98 | fmt.Printf("error literals: s+ll (%d+%d) >= len(src) (%d)\n", s, ll, len(src)) | ||
99 | } | ||
100 | return nil, 0, ErrCorrupt | ||
101 | } | ||
102 | s++ | ||
103 | if ll > 0 { | ||
104 | if d+ll > dLimit { | ||
105 | return nil, 0, ErrDstTooSmall | ||
106 | } | ||
107 | if debug { | ||
108 | fmt.Printf("emit %d literals\n", ll) | ||
109 | } | ||
110 | d += emitLiteralGo(dst[d:], src[s:s+ll]) | ||
111 | s += ll | ||
112 | uncompressed += ll | ||
113 | } | ||
114 | |||
115 | // Check if we are done... | ||
116 | if ml == lz4MinMatch { | ||
117 | if s == len(src) { | ||
118 | break | ||
119 | } | ||
120 | // 0 bytes. | ||
121 | continue | ||
122 | } | ||
123 | // 2 byte offset | ||
124 | if s >= len(src)-2 { | ||
125 | if debug { | ||
126 | fmt.Printf("s (%d) >= len(src)-2 (%d)", s, len(src)-2) | ||
127 | } | ||
128 | return nil, 0, ErrCorrupt | ||
129 | } | ||
130 | offset := binary.LittleEndian.Uint16(src[s:]) | ||
131 | s += 2 | ||
132 | if offset == 0 { | ||
133 | if debug { | ||
134 | fmt.Printf("error: offset 0, ml: %d, len(src)-s: %d\n", ml, len(src)-s) | ||
135 | } | ||
136 | return nil, 0, ErrCorrupt | ||
137 | } | ||
138 | if int(offset) > uncompressed { | ||
139 | if debug { | ||
140 | fmt.Printf("error: offset (%d)> uncompressed (%d)\n", offset, uncompressed) | ||
141 | } | ||
142 | return nil, 0, ErrCorrupt | ||
143 | } | ||
144 | |||
145 | if ml == lz4MinMatch+15 { | ||
146 | for { | ||
147 | if s >= len(src) { | ||
148 | if debug { | ||
149 | fmt.Printf("error reading ml: s (%d) >= len(src) (%d)\n", s, len(src)) | ||
150 | } | ||
151 | return nil, 0, ErrCorrupt | ||
152 | } | ||
153 | val := src[s] | ||
154 | s++ | ||
155 | ml += int(val) | ||
156 | if val != 255 { | ||
157 | if s >= len(src) { | ||
158 | if debug { | ||
159 | fmt.Printf("error reading ml: s (%d) >= len(src) (%d)\n", s, len(src)) | ||
160 | } | ||
161 | return nil, 0, ErrCorrupt | ||
162 | } | ||
163 | break | ||
164 | } | ||
165 | } | ||
166 | } | ||
167 | if offset == lastOffset { | ||
168 | if debug { | ||
169 | fmt.Printf("emit repeat, length: %d, offset: %d\n", ml, offset) | ||
170 | } | ||
171 | if !inline { | ||
172 | d += emitRepeat16(dst[d:], offset, ml) | ||
173 | } else { | ||
174 | length := ml | ||
175 | dst := dst[d:] | ||
176 | for len(dst) > 5 { | ||
177 | // Repeat offset, make length cheaper | ||
178 | length -= 4 | ||
179 | if length <= 4 { | ||
180 | dst[0] = uint8(length)<<2 | tagCopy1 | ||
181 | dst[1] = 0 | ||
182 | d += 2 | ||
183 | break | ||
184 | } | ||
185 | if length < 8 && offset < 2048 { | ||
186 | // Encode WITH offset | ||
187 | dst[1] = uint8(offset) | ||
188 | dst[0] = uint8(offset>>8)<<5 | uint8(length)<<2 | tagCopy1 | ||
189 | d += 2 | ||
190 | break | ||
191 | } | ||
192 | if length < (1<<8)+4 { | ||
193 | length -= 4 | ||
194 | dst[2] = uint8(length) | ||
195 | dst[1] = 0 | ||
196 | dst[0] = 5<<2 | tagCopy1 | ||
197 | d += 3 | ||
198 | break | ||
199 | } | ||
200 | if length < (1<<16)+(1<<8) { | ||
201 | length -= 1 << 8 | ||
202 | dst[3] = uint8(length >> 8) | ||
203 | dst[2] = uint8(length >> 0) | ||
204 | dst[1] = 0 | ||
205 | dst[0] = 6<<2 | tagCopy1 | ||
206 | d += 4 | ||
207 | break | ||
208 | } | ||
209 | const maxRepeat = (1 << 24) - 1 | ||
210 | length -= 1 << 16 | ||
211 | left := 0 | ||
212 | if length > maxRepeat { | ||
213 | left = length - maxRepeat + 4 | ||
214 | length = maxRepeat - 4 | ||
215 | } | ||
216 | dst[4] = uint8(length >> 16) | ||
217 | dst[3] = uint8(length >> 8) | ||
218 | dst[2] = uint8(length >> 0) | ||
219 | dst[1] = 0 | ||
220 | dst[0] = 7<<2 | tagCopy1 | ||
221 | if left > 0 { | ||
222 | d += 5 + emitRepeat16(dst[5:], offset, left) | ||
223 | break | ||
224 | } | ||
225 | d += 5 | ||
226 | break | ||
227 | } | ||
228 | } | ||
229 | } else { | ||
230 | if debug { | ||
231 | fmt.Printf("emit copy, length: %d, offset: %d\n", ml, offset) | ||
232 | } | ||
233 | if !inline { | ||
234 | d += emitCopy16(dst[d:], offset, ml) | ||
235 | } else { | ||
236 | length := ml | ||
237 | dst := dst[d:] | ||
238 | for len(dst) > 5 { | ||
239 | // Offset no more than 2 bytes. | ||
240 | if length > 64 { | ||
241 | off := 3 | ||
242 | if offset < 2048 { | ||
243 | // emit 8 bytes as tagCopy1, rest as repeats. | ||
244 | dst[1] = uint8(offset) | ||
245 | dst[0] = uint8(offset>>8)<<5 | uint8(8-4)<<2 | tagCopy1 | ||
246 | length -= 8 | ||
247 | off = 2 | ||
248 | } else { | ||
249 | // Emit a length 60 copy, encoded as 3 bytes. | ||
250 | // Emit remaining as repeat value (minimum 4 bytes). | ||
251 | dst[2] = uint8(offset >> 8) | ||
252 | dst[1] = uint8(offset) | ||
253 | dst[0] = 59<<2 | tagCopy2 | ||
254 | length -= 60 | ||
255 | } | ||
256 | // Emit remaining as repeats, at least 4 bytes remain. | ||
257 | d += off + emitRepeat16(dst[off:], offset, length) | ||
258 | break | ||
259 | } | ||
260 | if length >= 12 || offset >= 2048 { | ||
261 | // Emit the remaining copy, encoded as 3 bytes. | ||
262 | dst[2] = uint8(offset >> 8) | ||
263 | dst[1] = uint8(offset) | ||
264 | dst[0] = uint8(length-1)<<2 | tagCopy2 | ||
265 | d += 3 | ||
266 | break | ||
267 | } | ||
268 | // Emit the remaining copy, encoded as 2 bytes. | ||
269 | dst[1] = uint8(offset) | ||
270 | dst[0] = uint8(offset>>8)<<5 | uint8(length-4)<<2 | tagCopy1 | ||
271 | d += 2 | ||
272 | break | ||
273 | } | ||
274 | } | ||
275 | lastOffset = offset | ||
276 | } | ||
277 | uncompressed += ml | ||
278 | if d > dLimit { | ||
279 | return nil, 0, ErrDstTooSmall | ||
280 | } | ||
281 | } | ||
282 | |||
283 | return dst[:d], uncompressed, nil | ||
284 | } | ||
285 | |||
286 | // ConvertBlockSnappy will convert an LZ4s block and append it | ||
287 | // as a Snappy block without block length to dst. | ||
288 | // The uncompressed size is returned as well. | ||
289 | // dst must have capacity to contain the entire compressed block. | ||
290 | func (l *LZ4sConverter) ConvertBlockSnappy(dst, src []byte) ([]byte, int, error) { | ||
291 | if len(src) == 0 { | ||
292 | return dst, 0, nil | ||
293 | } | ||
294 | const debug = false | ||
295 | const lz4MinMatch = 3 | ||
296 | |||
297 | s, d := 0, len(dst) | ||
298 | dst = dst[:cap(dst)] | ||
299 | // Use assembly when possible | ||
300 | if !debug && hasAmd64Asm { | ||
301 | res, sz := cvtLZ4sBlockSnappyAsm(dst[d:], src) | ||
302 | if res < 0 { | ||
303 | const ( | ||
304 | errCorrupt = -1 | ||
305 | errDstTooSmall = -2 | ||
306 | ) | ||
307 | switch res { | ||
308 | case errCorrupt: | ||
309 | return nil, 0, ErrCorrupt | ||
310 | case errDstTooSmall: | ||
311 | return nil, 0, ErrDstTooSmall | ||
312 | default: | ||
313 | return nil, 0, fmt.Errorf("unexpected result: %d", res) | ||
314 | } | ||
315 | } | ||
316 | if d+sz > len(dst) { | ||
317 | return nil, 0, ErrDstTooSmall | ||
318 | } | ||
319 | return dst[:d+sz], res, nil | ||
320 | } | ||
321 | |||
322 | dLimit := len(dst) - 10 | ||
323 | var uncompressed int | ||
324 | if debug { | ||
325 | fmt.Printf("convert block start: len(src): %d, len(dst):%d \n", len(src), len(dst)) | ||
326 | } | ||
327 | |||
328 | for { | ||
329 | if s >= len(src) { | ||
330 | return nil, 0, ErrCorrupt | ||
331 | } | ||
332 | // Read literal info | ||
333 | token := src[s] | ||
334 | ll := int(token >> 4) | ||
335 | ml := int(lz4MinMatch + (token & 0xf)) | ||
336 | |||
337 | // If upper nibble is 15, literal length is extended | ||
338 | if token >= 0xf0 { | ||
339 | for { | ||
340 | s++ | ||
341 | if s >= len(src) { | ||
342 | if debug { | ||
343 | fmt.Printf("error reading ll: s (%d) >= len(src) (%d)\n", s, len(src)) | ||
344 | } | ||
345 | return nil, 0, ErrCorrupt | ||
346 | } | ||
347 | val := src[s] | ||
348 | ll += int(val) | ||
349 | if val != 255 { | ||
350 | break | ||
351 | } | ||
352 | } | ||
353 | } | ||
354 | // Skip past token | ||
355 | if s+ll >= len(src) { | ||
356 | if debug { | ||
357 | fmt.Printf("error literals: s+ll (%d+%d) >= len(src) (%d)\n", s, ll, len(src)) | ||
358 | } | ||
359 | return nil, 0, ErrCorrupt | ||
360 | } | ||
361 | s++ | ||
362 | if ll > 0 { | ||
363 | if d+ll > dLimit { | ||
364 | return nil, 0, ErrDstTooSmall | ||
365 | } | ||
366 | if debug { | ||
367 | fmt.Printf("emit %d literals\n", ll) | ||
368 | } | ||
369 | d += emitLiteralGo(dst[d:], src[s:s+ll]) | ||
370 | s += ll | ||
371 | uncompressed += ll | ||
372 | } | ||
373 | |||
374 | // Check if we are done... | ||
375 | if ml == lz4MinMatch { | ||
376 | if s == len(src) { | ||
377 | break | ||
378 | } | ||
379 | // 0 bytes. | ||
380 | continue | ||
381 | } | ||
382 | // 2 byte offset | ||
383 | if s >= len(src)-2 { | ||
384 | if debug { | ||
385 | fmt.Printf("s (%d) >= len(src)-2 (%d)", s, len(src)-2) | ||
386 | } | ||
387 | return nil, 0, ErrCorrupt | ||
388 | } | ||
389 | offset := binary.LittleEndian.Uint16(src[s:]) | ||
390 | s += 2 | ||
391 | if offset == 0 { | ||
392 | if debug { | ||
393 | fmt.Printf("error: offset 0, ml: %d, len(src)-s: %d\n", ml, len(src)-s) | ||
394 | } | ||
395 | return nil, 0, ErrCorrupt | ||
396 | } | ||
397 | if int(offset) > uncompressed { | ||
398 | if debug { | ||
399 | fmt.Printf("error: offset (%d)> uncompressed (%d)\n", offset, uncompressed) | ||
400 | } | ||
401 | return nil, 0, ErrCorrupt | ||
402 | } | ||
403 | |||
404 | if ml == lz4MinMatch+15 { | ||
405 | for { | ||
406 | if s >= len(src) { | ||
407 | if debug { | ||
408 | fmt.Printf("error reading ml: s (%d) >= len(src) (%d)\n", s, len(src)) | ||
409 | } | ||
410 | return nil, 0, ErrCorrupt | ||
411 | } | ||
412 | val := src[s] | ||
413 | s++ | ||
414 | ml += int(val) | ||
415 | if val != 255 { | ||
416 | if s >= len(src) { | ||
417 | if debug { | ||
418 | fmt.Printf("error reading ml: s (%d) >= len(src) (%d)\n", s, len(src)) | ||
419 | } | ||
420 | return nil, 0, ErrCorrupt | ||
421 | } | ||
422 | break | ||
423 | } | ||
424 | } | ||
425 | } | ||
426 | if debug { | ||
427 | fmt.Printf("emit copy, length: %d, offset: %d\n", ml, offset) | ||
428 | } | ||
429 | length := ml | ||
430 | // d += emitCopyNoRepeat(dst[d:], int(offset), ml) | ||
431 | for length > 0 { | ||
432 | if d >= dLimit { | ||
433 | return nil, 0, ErrDstTooSmall | ||
434 | } | ||
435 | |||
436 | // Offset no more than 2 bytes. | ||
437 | if length > 64 { | ||
438 | // Emit a length 64 copy, encoded as 3 bytes. | ||
439 | dst[d+2] = uint8(offset >> 8) | ||
440 | dst[d+1] = uint8(offset) | ||
441 | dst[d+0] = 63<<2 | tagCopy2 | ||
442 | length -= 64 | ||
443 | d += 3 | ||
444 | continue | ||
445 | } | ||
446 | if length >= 12 || offset >= 2048 || length < 4 { | ||
447 | // Emit the remaining copy, encoded as 3 bytes. | ||
448 | dst[d+2] = uint8(offset >> 8) | ||
449 | dst[d+1] = uint8(offset) | ||
450 | dst[d+0] = uint8(length-1)<<2 | tagCopy2 | ||
451 | d += 3 | ||
452 | break | ||
453 | } | ||
454 | // Emit the remaining copy, encoded as 2 bytes. | ||
455 | dst[d+1] = uint8(offset) | ||
456 | dst[d+0] = uint8(offset>>8)<<5 | uint8(length-4)<<2 | tagCopy1 | ||
457 | d += 2 | ||
458 | break | ||
459 | } | ||
460 | uncompressed += ml | ||
461 | if d > dLimit { | ||
462 | return nil, 0, ErrDstTooSmall | ||
463 | } | ||
464 | } | ||
465 | |||
466 | return dst[:d], uncompressed, nil | ||
467 | } | ||