You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							197 lines
						
					
					
						
							5.3 KiB
						
					
					
				
			
		
		
	
	
							197 lines
						
					
					
						
							5.3 KiB
						
					
					
				| // Copyright 2015 PingCAP, Inc.
 | |
| //
 | |
| // Licensed under the Apache License, Version 2.0 (the "License");
 | |
| // you may not use this file except in compliance with the License.
 | |
| // You may obtain a copy of the License at
 | |
| //
 | |
| //     http://www.apache.org/licenses/LICENSE-2.0
 | |
| //
 | |
| // Unless required by applicable law or agreed to in writing, software
 | |
| // distributed under the License is distributed on an "AS IS" BASIS,
 | |
| // See the License for the specific language governing permissions and
 | |
| // limitations under the License.
 | |
| 
 | |
| package codec
 | |
| 
 | |
| import (
 | |
| 	"bytes"
 | |
| 	"encoding/binary"
 | |
| 	"runtime"
 | |
| 	"unsafe"
 | |
| 
 | |
| 	"github.com/juju/errors"
 | |
| )
 | |
| 
 | |
| const (
 | |
| 	encGroupSize = 8
 | |
| 	encMarker    = byte(0xFF)
 | |
| 	encPad       = byte(0x0)
 | |
| )
 | |
| 
 | |
| var (
 | |
| 	pads    = make([]byte, encGroupSize)
 | |
| 	encPads = []byte{encPad}
 | |
| )
 | |
| 
 | |
| // EncodeBytes guarantees the encoded value is in ascending order for comparison,
 | |
| // encoding with the following rule:
 | |
| //  [group1][marker1]...[groupN][markerN]
 | |
| //  group is 8 bytes slice which is padding with 0.
 | |
| //  marker is `0xFF - padding 0 count`
 | |
| // For example:
 | |
| //   [] -> [0, 0, 0, 0, 0, 0, 0, 0, 247]
 | |
| //   [1, 2, 3] -> [1, 2, 3, 0, 0, 0, 0, 0, 250]
 | |
| //   [1, 2, 3, 0] -> [1, 2, 3, 0, 0, 0, 0, 0, 251]
 | |
| //   [1, 2, 3, 4, 5, 6, 7, 8] -> [1, 2, 3, 4, 5, 6, 7, 8, 255, 0, 0, 0, 0, 0, 0, 0, 0, 247]
 | |
| // Refer: https://github.com/facebook/mysql-5.6/wiki/MyRocks-record-format#memcomparable-format
 | |
| func EncodeBytes(b []byte, data []byte) []byte {
 | |
| 	// Allocate more space to avoid unnecessary slice growing.
 | |
| 	// Assume that the byte slice size is about `(len(data) / encGroupSize + 1) * (encGroupSize + 1)` bytes,
 | |
| 	// that is `(len(data) / 8 + 1) * 9` in our implement.
 | |
| 	dLen := len(data)
 | |
| 	reallocSize := (dLen/encGroupSize + 1) * (encGroupSize + 1)
 | |
| 	result := reallocBytes(b, reallocSize)
 | |
| 	for idx := 0; idx <= dLen; idx += encGroupSize {
 | |
| 		remain := dLen - idx
 | |
| 		padCount := 0
 | |
| 		if remain >= encGroupSize {
 | |
| 			result = append(result, data[idx:idx+encGroupSize]...)
 | |
| 		} else {
 | |
| 			padCount = encGroupSize - remain
 | |
| 			result = append(result, data[idx:]...)
 | |
| 			result = append(result, pads[:padCount]...)
 | |
| 		}
 | |
| 
 | |
| 		marker := encMarker - byte(padCount)
 | |
| 		result = append(result, marker)
 | |
| 	}
 | |
| 
 | |
| 	return result
 | |
| }
 | |
| 
 | |
| func decodeBytes(b []byte, reverse bool) ([]byte, []byte, error) {
 | |
| 	data := make([]byte, 0, len(b))
 | |
| 	for {
 | |
| 		if len(b) < encGroupSize+1 {
 | |
| 			return nil, nil, errors.New("insufficient bytes to decode value")
 | |
| 		}
 | |
| 
 | |
| 		groupBytes := b[:encGroupSize+1]
 | |
| 		if reverse {
 | |
| 			reverseBytes(groupBytes)
 | |
| 		}
 | |
| 
 | |
| 		group := groupBytes[:encGroupSize]
 | |
| 		marker := groupBytes[encGroupSize]
 | |
| 
 | |
| 		// Check validity of marker.
 | |
| 		padCount := encMarker - marker
 | |
| 		realGroupSize := encGroupSize - padCount
 | |
| 		if padCount > encGroupSize {
 | |
| 			return nil, nil, errors.Errorf("invalid marker byte, group bytes %q", groupBytes)
 | |
| 		}
 | |
| 
 | |
| 		data = append(data, group[:realGroupSize]...)
 | |
| 		b = b[encGroupSize+1:]
 | |
| 
 | |
| 		if marker != encMarker {
 | |
| 			// Check validity of padding bytes.
 | |
| 			if bytes.Count(group[realGroupSize:], encPads) != int(padCount) {
 | |
| 				return nil, nil, errors.Errorf("invalid padding byte, group bytes %q", groupBytes)
 | |
| 			}
 | |
| 
 | |
| 			break
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	return b, data, nil
 | |
| }
 | |
| 
 | |
| // DecodeBytes decodes bytes which is encoded by EncodeBytes before,
 | |
| // returns the leftover bytes and decoded value if no error.
 | |
| func DecodeBytes(b []byte) ([]byte, []byte, error) {
 | |
| 	return decodeBytes(b, false)
 | |
| }
 | |
| 
 | |
| // EncodeBytesDesc first encodes bytes using EncodeBytes, then bitwise reverses
 | |
| // encoded value to guarantee the encoded value is in descending order for comparison.
 | |
| func EncodeBytesDesc(b []byte, data []byte) []byte {
 | |
| 	n := len(b)
 | |
| 	b = EncodeBytes(b, data)
 | |
| 	reverseBytes(b[n:])
 | |
| 	return b
 | |
| }
 | |
| 
 | |
| // DecodeBytesDesc decodes bytes which is encoded by EncodeBytesDesc before,
 | |
| // returns the leftover bytes and decoded value if no error.
 | |
| func DecodeBytesDesc(b []byte) ([]byte, []byte, error) {
 | |
| 	return decodeBytes(b, true)
 | |
| }
 | |
| 
 | |
| // EncodeCompactBytes joins bytes with its length into a byte slice. It is more
 | |
| // efficient in both space and time compare to EncodeBytes. Note that the encoded
 | |
| // result is not memcomparable.
 | |
| func EncodeCompactBytes(b []byte, data []byte) []byte {
 | |
| 	b = reallocBytes(b, binary.MaxVarintLen64+len(data))
 | |
| 	b = EncodeVarint(b, int64(len(data)))
 | |
| 	return append(b, data...)
 | |
| }
 | |
| 
 | |
| // DecodeCompactBytes decodes bytes which is encoded by EncodeCompactBytes before.
 | |
| func DecodeCompactBytes(b []byte) ([]byte, []byte, error) {
 | |
| 	b, n, err := DecodeVarint(b)
 | |
| 	if err != nil {
 | |
| 		return nil, nil, errors.Trace(err)
 | |
| 	}
 | |
| 	if int64(len(b)) < n {
 | |
| 		return nil, nil, errors.Errorf("insufficient bytes to decode value, expected length: %v", n)
 | |
| 	}
 | |
| 	return b[n:], b[:n], nil
 | |
| }
 | |
| 
 | |
| // See https://golang.org/src/crypto/cipher/xor.go
 | |
| const wordSize = int(unsafe.Sizeof(uintptr(0)))
 | |
| const supportsUnaligned = runtime.GOARCH == "386" || runtime.GOARCH == "amd64"
 | |
| 
 | |
| func fastReverseBytes(b []byte) {
 | |
| 	n := len(b)
 | |
| 	w := n / wordSize
 | |
| 	if w > 0 {
 | |
| 		bw := *(*[]uintptr)(unsafe.Pointer(&b))
 | |
| 		for i := 0; i < w; i++ {
 | |
| 			bw[i] = ^bw[i]
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	for i := w * wordSize; i < n; i++ {
 | |
| 		b[i] = ^b[i]
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func safeReverseBytes(b []byte) {
 | |
| 	for i := range b {
 | |
| 		b[i] = ^b[i]
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func reverseBytes(b []byte) {
 | |
| 	if supportsUnaligned {
 | |
| 		fastReverseBytes(b)
 | |
| 		return
 | |
| 	}
 | |
| 
 | |
| 	safeReverseBytes(b)
 | |
| }
 | |
| 
 | |
| // like realloc.
 | |
| func reallocBytes(b []byte, n int) []byte {
 | |
| 	newSize := len(b) + n
 | |
| 	if cap(b) < newSize {
 | |
| 		bs := make([]byte, len(b), newSize)
 | |
| 		copy(bs, b)
 | |
| 		return bs
 | |
| 	}
 | |
| 
 | |
| 	// slice b has capability to store n bytes
 | |
| 	return b
 | |
| }
 | |
| 
 |