2011-03-19 06:37:00 +08:00
|
|
|
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
|
|
// found in the LICENSE file. See the AUTHORS file for names of contributors.
|
|
|
|
//
|
|
|
|
// Endian-neutral encoding:
|
|
|
|
// * Fixed-length numbers are encoded with least-significant byte first
|
|
|
|
// * In addition we support variable length "varint" encoding
|
|
|
|
// * Strings are encoded prefixed by their length in varint format
|
|
|
|
|
|
|
|
#ifndef STORAGE_LEVELDB_UTIL_CODING_H_
|
|
|
|
#define STORAGE_LEVELDB_UTIL_CODING_H_
|
|
|
|
|
2019-05-07 01:58:38 +08:00
|
|
|
#include <cstdint>
|
|
|
|
#include <cstring>
|
2011-03-19 06:37:00 +08:00
|
|
|
#include <string>
|
2018-03-16 21:23:29 +08:00
|
|
|
|
2011-03-31 02:35:40 +08:00
|
|
|
#include "leveldb/slice.h"
|
2011-03-19 06:37:00 +08:00
|
|
|
#include "port/port.h"
|
|
|
|
|
|
|
|
namespace leveldb {
|
|
|
|
|
|
|
|
// Standard Put... routines append to a string
|
2018-03-13 00:14:44 +08:00
|
|
|
// Appends the fixed-length 32-bit encoding of "value" (least-significant byte
// first) to *dst.
void PutFixed32(std::string* dst, uint32_t value);
|
|
|
|
// Appends the fixed-length 64-bit encoding of "value" (least-significant byte
// first) to *dst.
void PutFixed64(std::string* dst, uint64_t value);
|
|
|
|
// Appends the variable-length ("varint") encoding of the 32-bit "value" to
// *dst.
void PutVarint32(std::string* dst, uint32_t value);
|
|
|
|
// Appends the variable-length ("varint") encoding of the 64-bit "value" to
// *dst.
void PutVarint64(std::string* dst, uint64_t value);
|
|
|
|
// Appends "value" to *dst, prefixed by its length in varint format.
void PutLengthPrefixedSlice(std::string* dst, const Slice& value);
|
2011-03-19 06:37:00 +08:00
|
|
|
|
|
|
|
// Standard Get... routines parse a value from the beginning of a Slice
|
|
|
|
// and advance the slice past the parsed value.
|
2018-03-13 00:14:44 +08:00
|
|
|
// Parses a varint32 from the beginning of *input into *value and advances
// *input past the parsed bytes.
// NOTE(review): the bool result presumably reports whether parsing
// succeeded -- confirm against the implementation.
bool GetVarint32(Slice* input, uint32_t* value);
|
|
|
|
// Parses a varint64 from the beginning of *input into *value and advances
// *input past the parsed bytes.
// NOTE(review): the bool result presumably reports whether parsing
// succeeded -- confirm against the implementation.
bool GetVarint64(Slice* input, uint64_t* value);
|
|
|
|
// Parses a varint-length-prefixed string from the beginning of *input into
// *result and advances *input past the parsed bytes.
// NOTE(review): the bool result presumably reports whether parsing
// succeeded, and *result presumably refers to bytes owned by *input's
// backing storage -- confirm against the implementation.
bool GetLengthPrefixedSlice(Slice* input, Slice* result);
|
2011-03-19 06:37:00 +08:00
|
|
|
|
|
|
|
// Pointer-based variants of GetVarint... These either store a value
|
|
|
|
// in *v and return a pointer just past the parsed value, or return
|
2018-04-11 07:18:06 +08:00
|
|
|
// nullptr on error. These routines only look at bytes in the range
|
2011-03-19 06:37:00 +08:00
|
|
|
// [p..limit-1]
|
2018-03-16 21:23:29 +08:00
|
|
|
// Parses a varint32 looking only at bytes in [p..limit-1]. On success stores
// the value in *v and returns a pointer just past the parsed bytes; returns
// nullptr on error.
const char* GetVarint32Ptr(const char* p, const char* limit, uint32_t* v);
|
|
|
|
// Parses a varint64 looking only at bytes in [p..limit-1]. On success stores
// the value in *v and returns a pointer just past the parsed bytes; returns
// nullptr on error.
const char* GetVarint64Ptr(const char* p, const char* limit, uint64_t* v);
|
2011-03-19 06:37:00 +08:00
|
|
|
|
|
|
|
// Returns the length of the varint32 or varint64 encoding of "v"
|
2018-03-13 00:14:44 +08:00
|
|
|
// Reports how long the varint encoding of "v" is.
// NOTE(review): the unit is presumably bytes, matching the char buffers used
// by EncodeVarint32/64 -- confirm against the implementation.
int VarintLength(uint64_t v);
|
2011-03-19 06:37:00 +08:00
|
|
|
|
|
|
|
// Lower-level versions of Put... that write directly into a character buffer
|
|
|
|
// and return a pointer just past the last byte written.
|
|
|
|
// REQUIRES: dst has enough space for the value being written
|
2018-03-13 00:14:44 +08:00
|
|
|
// Writes the varint encoding of the 32-bit "value" directly into the buffer
// at dst and returns a pointer just past the last byte written.
// REQUIRES: dst has enough space for the value being written
char* EncodeVarint32(char* dst, uint32_t value);
|
|
|
|
// Writes the varint encoding of the 64-bit "value" directly into the buffer
// at dst and returns a pointer just past the last byte written.
// REQUIRES: dst has enough space for the value being written
char* EncodeVarint64(char* dst, uint64_t value);
|
2011-03-19 06:37:00 +08:00
|
|
|
|
2019-05-07 01:58:38 +08:00
|
|
|
// TODO(costan): Remove port::kLittleEndian and the fast paths based on
|
|
|
|
// std::memcpy when clang learns to optimize the generic code, as
|
|
|
|
// described in https://bugs.llvm.org/show_bug.cgi?id=41761
|
|
|
|
//
|
|
|
|
// The platform-independent code in DecodeFixed{32,64}() gets optimized to mov
|
|
|
|
// on x86 and ldr on ARM64, by both clang and gcc. However, only gcc optimizes
|
|
|
|
// the platform-independent code in EncodeFixed{32,64}() to mov / str.
|
|
|
|
|
|
|
|
// Lower-level versions of Put... that write directly into a character buffer
|
|
|
|
// REQUIRES: dst has enough space for the value being written
|
|
|
|
|
|
|
|
inline void EncodeFixed32(char* dst, uint32_t value) {
|
|
|
|
uint8_t* const buffer = reinterpret_cast<uint8_t*>(dst);
|
|
|
|
|
|
|
|
if (port::kLittleEndian) {
|
|
|
|
// Fast path for little-endian CPUs. All major compilers optimize this to a
|
|
|
|
// single mov (x86_64) / str (ARM) instruction.
|
|
|
|
std::memcpy(buffer, &value, sizeof(uint32_t));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Platform-independent code.
|
|
|
|
// Currently, only gcc optimizes this to a single mov / str instruction.
|
|
|
|
buffer[0] = static_cast<uint8_t>(value);
|
|
|
|
buffer[1] = static_cast<uint8_t>(value >> 8);
|
|
|
|
buffer[2] = static_cast<uint8_t>(value >> 16);
|
|
|
|
buffer[3] = static_cast<uint8_t>(value >> 24);
|
|
|
|
}
|
|
|
|
|
|
|
|
inline void EncodeFixed64(char* dst, uint64_t value) {
|
|
|
|
uint8_t* const buffer = reinterpret_cast<uint8_t*>(dst);
|
|
|
|
|
|
|
|
if (port::kLittleEndian) {
|
|
|
|
// Fast path for little-endian CPUs. All major compilers optimize this to a
|
|
|
|
// single mov (x86_64) / str (ARM) instruction.
|
|
|
|
std::memcpy(buffer, &value, sizeof(uint64_t));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Platform-independent code.
|
|
|
|
// Currently, only gcc optimizes this to a single mov / str instruction.
|
|
|
|
buffer[0] = static_cast<uint8_t>(value);
|
|
|
|
buffer[1] = static_cast<uint8_t>(value >> 8);
|
|
|
|
buffer[2] = static_cast<uint8_t>(value >> 16);
|
|
|
|
buffer[3] = static_cast<uint8_t>(value >> 24);
|
|
|
|
buffer[4] = static_cast<uint8_t>(value >> 32);
|
|
|
|
buffer[5] = static_cast<uint8_t>(value >> 40);
|
|
|
|
buffer[6] = static_cast<uint8_t>(value >> 48);
|
|
|
|
buffer[7] = static_cast<uint8_t>(value >> 56);
|
|
|
|
}
|
|
|
|
|
2011-03-19 06:37:00 +08:00
|
|
|
// Lower-level versions of Get... that read directly from a character buffer
|
|
|
|
// without any bounds checking.
|
|
|
|
|
|
|
|
inline uint32_t DecodeFixed32(const char* ptr) {
|
2019-05-07 01:58:38 +08:00
|
|
|
const uint8_t* const buffer = reinterpret_cast<const uint8_t*>(ptr);
|
|
|
|
|
2011-03-19 06:37:00 +08:00
|
|
|
if (port::kLittleEndian) {
|
2019-05-07 01:58:38 +08:00
|
|
|
// Fast path for little-endian CPUs. All major compilers optimize this to a
|
|
|
|
// single mov (x86_64) / ldr (ARM) instruction.
|
2011-03-19 06:37:00 +08:00
|
|
|
uint32_t result;
|
2019-05-07 01:58:38 +08:00
|
|
|
std::memcpy(&result, buffer, sizeof(uint32_t));
|
2011-03-19 06:37:00 +08:00
|
|
|
return result;
|
|
|
|
}
|
2019-05-07 01:58:38 +08:00
|
|
|
|
|
|
|
// Platform-independent code.
|
|
|
|
// Clang and gcc optimize this to a single mov / ldr instruction.
|
|
|
|
return (static_cast<uint32_t>(buffer[0])) |
|
|
|
|
(static_cast<uint32_t>(buffer[1]) << 8) |
|
|
|
|
(static_cast<uint32_t>(buffer[2]) << 16) |
|
|
|
|
(static_cast<uint32_t>(buffer[3]) << 24);
|
2011-03-19 06:37:00 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
inline uint64_t DecodeFixed64(const char* ptr) {
|
2019-05-07 01:58:38 +08:00
|
|
|
const uint8_t* const buffer = reinterpret_cast<const uint8_t*>(ptr);
|
|
|
|
|
2011-03-19 06:37:00 +08:00
|
|
|
if (port::kLittleEndian) {
|
2019-05-07 01:58:38 +08:00
|
|
|
// Fast path for little-endian CPUs. All major compilers optimize this to a
|
|
|
|
// single mov (x86_64) / ldr (ARM) instruction.
|
2011-03-19 06:37:00 +08:00
|
|
|
uint64_t result;
|
2019-05-07 01:58:38 +08:00
|
|
|
std::memcpy(&result, buffer, sizeof(uint64_t));
|
2011-03-19 06:37:00 +08:00
|
|
|
return result;
|
|
|
|
}
|
2019-05-07 01:58:38 +08:00
|
|
|
|
|
|
|
// Platform-independent code.
|
|
|
|
// Clang and gcc optimize this to a single mov / ldr instruction.
|
|
|
|
return (static_cast<uint64_t>(buffer[0])) |
|
|
|
|
(static_cast<uint64_t>(buffer[1]) << 8) |
|
|
|
|
(static_cast<uint64_t>(buffer[2]) << 16) |
|
|
|
|
(static_cast<uint64_t>(buffer[3]) << 24) |
|
|
|
|
(static_cast<uint64_t>(buffer[4]) << 32) |
|
|
|
|
(static_cast<uint64_t>(buffer[5]) << 40) |
|
|
|
|
(static_cast<uint64_t>(buffer[6]) << 48) |
|
|
|
|
(static_cast<uint64_t>(buffer[7]) << 56);
|
2011-03-19 06:37:00 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Out-of-line helper that GetVarint32Ptr delegates to whenever its inline
// single-byte fast path does not apply. Internal; not meant to be called
// directly.
const char* GetVarint32PtrFallback(const char* p, const char* limit,
                                   uint32_t* value);

// Inline front end for varint32 parsing over the byte range [p..limit-1].
// If the first byte is readable and has its high bit (0x80) clear, that byte
// is the whole value: it is stored in *value and p + 1 is returned. Every
// other case, including an empty range, is forwarded unchanged to
// GetVarint32PtrFallback and its result is returned as-is.
inline const char* GetVarint32Ptr(const char* p, const char* limit,
                                  uint32_t* value) {
  // Nothing to read: let the fallback decide the outcome.
  if (p >= limit) {
    return GetVarint32PtrFallback(p, limit, value);
  }

  // Read the first byte as unsigned so the high bit is not sign-extended.
  const unsigned char* const first = reinterpret_cast<const unsigned char*>(p);
  const uint32_t first_byte = *first;

  const bool high_bit_set = (first_byte & 128) != 0;
  if (high_bit_set) {
    return GetVarint32PtrFallback(p, limit, value);
  }

  *value = first_byte;
  return p + 1;
}
|
|
|
|
|
2011-11-01 01:22:06 +08:00
|
|
|
} // namespace leveldb
|
2011-03-19 06:37:00 +08:00
|
|
|
|
|
|
|
#endif // STORAGE_LEVELDB_UTIL_CODING_H_
|