crashpad/util/stream/base94_output_stream.cc
Mark Mentovai 6278690abe Update copyright boilerplate, 2022 edition (Crashpad)
sed -i '' -E -e 's/Copyright (.+) The Crashpad Authors\. All rights reserved\.$/Copyright \1 The Crashpad Authors/' $(git grep -El 'Copyright (.+) The Crashpad Authors\. All rights reserved\.$')

Bug: chromium:1098010
Change-Id: I8d6138469ddbe3d281a5d83f64cf918ec2491611
Reviewed-on: https://chromium-review.googlesource.com/c/crashpad/crashpad/+/3878262
Reviewed-by: Joshua Peraza <jperaza@chromium.org>
Commit-Queue: Mark Mentovai <mark@chromium.org>
2022-09-06 23:54:07 +00:00

175 lines
4.9 KiB
C++
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

// Copyright 2019 The Crashpad Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "util/stream/base94_output_stream.h"
#include <algorithm>
#include "base/check.h"
#include "base/logging.h"
#include "base/numerics/safe_conversions.h"
namespace crashpad {
namespace {
// To improve the space efficiency, we can encode 14 bits into two symbols
// if 14-bit number is less than 94^2 which is total number can be encoded
// by 2 digits of base94 number, in another word, if 13 bit number is
// smaller than 643, we could read one more bit, because even if the 14th
// bit is 1, the 14-bit number doesnt exceed the max value.
constexpr uint16_t kMaxValueOf14BitEncoding = (94 * 94 - 1) & 0x1FFF;
constexpr size_t kMaxBuffer = 4096;
inline uint8_t EncodeByte(uint8_t byte) {
DCHECK(byte < 94);
return (byte >= 94u) ? 0xff : (byte + '!');
}
inline uint8_t DecodeByte(uint8_t byte) {
DCHECK(byte >= '!' && byte <= '~');
return std::min(static_cast<uint8_t>(byte - '!'), static_cast<uint8_t>(94));
}
} // namespace
Base94OutputStream::Base94OutputStream(
Mode mode,
std::unique_ptr<OutputStreamInterface> output_stream)
: mode_(mode),
output_stream_(std::move(output_stream)),
bit_buf_(0),
bit_count_(0),
symbol_buffer_(0),
flush_needed_(false),
flushed_(false) {
buffer_.reserve(kMaxBuffer);
}
Base94OutputStream::~Base94OutputStream() {
DCHECK(!flush_needed_);
}
bool Base94OutputStream::Write(const uint8_t* data, size_t size) {
DCHECK(!flushed_);
flush_needed_ = true;
return mode_ == Mode::kEncode ? Encode(data, size) : Decode(data, size);
}
bool Base94OutputStream::Flush() {
flushed_ = true;
if (flush_needed_) {
flush_needed_ = false;
if (!((mode_ == Mode::kEncode) ? FinishEncoding() : FinishDecoding()))
return false;
}
return output_stream_->Flush();
}
bool Base94OutputStream::Encode(const uint8_t* data, size_t size) {
const uint8_t* cur = data;
while (size--) {
bit_buf_ |= *(cur++) << bit_count_;
bit_count_ += 8;
if (bit_count_ < 14)
continue;
uint16_t block;
// Check if 13-bit or 14-bit data should be encoded.
if ((bit_buf_ & 0x1FFF) > kMaxValueOf14BitEncoding) {
block = bit_buf_ & 0x1FFF;
bit_buf_ >>= 13;
bit_count_ -= 13;
} else {
block = bit_buf_ & 0x3FFF;
bit_buf_ >>= 14;
bit_count_ -= 14;
}
buffer_.push_back(EncodeByte(block % 94));
buffer_.push_back(EncodeByte(base::saturated_cast<uint8_t>(block / 94)));
if (buffer_.size() > kMaxBuffer - 2 && !WriteOutputStream())
return false;
}
return WriteOutputStream();
}
bool Base94OutputStream::Decode(const uint8_t* data, size_t size) {
const uint8_t* cur = data;
while (size--) {
if (DecodeByte(*cur) == 94) {
LOG(ERROR) << "Decode: invalid input";
return false;
}
if (symbol_buffer_ == 0) {
symbol_buffer_ = *cur;
cur++;
continue;
}
uint16_t v = DecodeByte(symbol_buffer_) + DecodeByte(*cur) * 94;
cur++;
symbol_buffer_ = 0;
bit_buf_ |= v << bit_count_;
bit_count_ += (v & 0x1FFF) > kMaxValueOf14BitEncoding ? 13 : 14;
while (bit_count_ > 7) {
buffer_.push_back(bit_buf_ & 0xff);
bit_buf_ >>= 8;
bit_count_ -= 8;
}
if (buffer_.size() > kMaxBuffer - 2) {
if (!WriteOutputStream())
return false;
}
}
return WriteOutputStream();
}
bool Base94OutputStream::FinishEncoding() {
if (bit_count_ == 0)
return true;
// Up to 13 bits data is left over.
buffer_.push_back(EncodeByte(bit_buf_ % 94));
if (bit_buf_ > 93 || bit_count_ > 8)
buffer_.push_back(EncodeByte(base::saturated_cast<uint8_t>(bit_buf_ / 94)));
bit_count_ = 0;
bit_buf_ = 0;
return WriteOutputStream();
}
bool Base94OutputStream::FinishDecoding() {
// The left over bit is padding and all zero, if there is no symbol
// unprocessed.
if (symbol_buffer_ == 0) {
DCHECK(!bit_buf_);
return true;
}
bit_buf_ |= DecodeByte(symbol_buffer_) << bit_count_;
buffer_.push_back(bit_buf_ & 0xff);
bit_buf_ >>= 8;
// The remaining bits are either encode padding or zeros from bit shift.
DCHECK(!bit_buf_);
return WriteOutputStream();
}
bool Base94OutputStream::WriteOutputStream() {
if (buffer_.empty())
return true;
bool result = output_stream_->Write(buffer_.data(), buffer_.size());
buffer_.clear();
return result;
}
} // namespace crashpad