logd: replace std::vector<uint8_t> in SerializedLogChunk

Turns out std::vector::resize() and std::vector::clear() don't
actually deallocate any memory.  std::vector::shrink_to_fit() can be
used for this but isn't a 'guarantee'.  Instead of trying to get
std::vector to play nice, this change replaces std::vector<uint8_t>
with std::unique_ptr<uint8_t[]>, which is more accurate to how I'm
using this memory anyway.

Test: logging unit tests
Change-Id: I9638e90bbf50bcf316c5aa172c8278ea945d27e7
This commit is contained in:
Tom Cherry 2020-06-24 13:51:04 -07:00
parent b07e339b53
commit b6cb992cf3
5 changed files with 98 additions and 45 deletions

View File

@ -27,7 +27,7 @@ CompressionEngine& CompressionEngine::GetInstance() {
return *engine;
}
bool ZlibCompressionEngine::Compress(std::span<uint8_t> in, std::vector<uint8_t>& out) {
bool ZlibCompressionEngine::Compress(SerializedData& in, size_t data_length, SerializedData& out) {
z_stream strm;
strm.zalloc = Z_NULL;
strm.zfree = Z_NULL;
@ -37,34 +37,34 @@ bool ZlibCompressionEngine::Compress(std::span<uint8_t> in, std::vector<uint8_t>
LOG(FATAL) << "deflateInit() failed";
}
CHECK_LE(in.size(), static_cast<int64_t>(std::numeric_limits<uint32_t>::max()));
uint32_t out_size = deflateBound(&strm, in.size());
CHECK_LE(data_length, in.size());
CHECK_LE(in.size(), std::numeric_limits<uint32_t>::max());
uint32_t deflate_bound = deflateBound(&strm, in.size());
out.resize(out_size);
strm.avail_in = in.size();
strm.next_in = const_cast<uint8_t*>(in.data());
strm.avail_out = out_size;
out.Resize(deflate_bound);
strm.avail_in = data_length;
strm.next_in = in.data();
strm.avail_out = out.size();
strm.next_out = out.data();
ret = deflate(&strm, Z_FINISH);
CHECK_EQ(ret, Z_STREAM_END);
uint32_t compressed_data_size = strm.total_out;
uint32_t compressed_size = strm.total_out;
deflateEnd(&strm);
out.resize(compressed_data_size);
out.Resize(compressed_size);
return true;
}
bool ZlibCompressionEngine::Decompress(const std::vector<uint8_t>& in, std::vector<uint8_t>& out,
size_t out_size) {
out.resize(out_size);
bool ZlibCompressionEngine::Decompress(SerializedData& in, SerializedData& out) {
z_stream strm;
strm.zalloc = Z_NULL;
strm.zfree = Z_NULL;
strm.opaque = Z_NULL;
strm.avail_in = in.size();
strm.next_in = const_cast<uint8_t*>(in.data());
strm.next_in = in.data();
strm.avail_out = out.size();
strm.next_out = out.data();
@ -79,22 +79,22 @@ bool ZlibCompressionEngine::Decompress(const std::vector<uint8_t>& in, std::vect
return true;
}
bool ZstdCompressionEngine::Compress(std::span<uint8_t> in, std::vector<uint8_t>& out) {
size_t out_size = ZSTD_compressBound(in.size());
out.resize(out_size);
bool ZstdCompressionEngine::Compress(SerializedData& in, size_t data_length, SerializedData& out) {
CHECK_LE(data_length, in.size());
out_size = ZSTD_compress(out.data(), out_size, in.data(), in.size(), 1);
size_t compress_bound = ZSTD_compressBound(data_length);
out.Resize(compress_bound);
size_t out_size = ZSTD_compress(out.data(), out.size(), in.data(), data_length, 1);
if (ZSTD_isError(out_size)) {
LOG(FATAL) << "ZSTD_compress failed: " << ZSTD_getErrorName(out_size);
}
out.resize(out_size);
out.Resize(out_size);
return true;
}
bool ZstdCompressionEngine::Decompress(const std::vector<uint8_t>& in, std::vector<uint8_t>& out,
size_t out_size) {
out.resize(out_size);
bool ZstdCompressionEngine::Decompress(SerializedData& in, SerializedData& out) {
size_t result = ZSTD_decompress(out.data(), out.size(), in.data(), in.size());
if (ZSTD_isError(result)) {
LOG(FATAL) << "ZSTD_decompress failed: " << ZSTD_getErrorName(result);

View File

@ -16,8 +16,9 @@
#pragma once
#include <span>
#include <vector>
#include <memory>
#include "SerializedData.h"
class CompressionEngine {
public:
@ -25,23 +26,20 @@ class CompressionEngine {
virtual ~CompressionEngine(){};
virtual bool Compress(std::span<uint8_t> in, std::vector<uint8_t>& out) = 0;
// Decompress the contents of `in` into `out`. `out_size` must be set to the decompressed size
// of the contents.
virtual bool Decompress(const std::vector<uint8_t>& in, std::vector<uint8_t>& out,
size_t out_size) = 0;
virtual bool Compress(SerializedData& in, size_t data_length, SerializedData& out) = 0;
// Decompress the contents of `in` into `out`. `out.size()` must be set to the decompressed
// size of the contents.
virtual bool Decompress(SerializedData& in, SerializedData& out) = 0;
};
class ZlibCompressionEngine : public CompressionEngine {
public:
bool Compress(std::span<uint8_t> in, std::vector<uint8_t>& out) override;
bool Decompress(const std::vector<uint8_t>& in, std::vector<uint8_t>& out,
size_t out_size) override;
bool Compress(SerializedData& in, size_t data_length, SerializedData& out) override;
bool Decompress(SerializedData& in, SerializedData& out) override;
};
class ZstdCompressionEngine : public CompressionEngine {
public:
bool Compress(std::span<uint8_t> in, std::vector<uint8_t>& out) override;
bool Decompress(const std::vector<uint8_t>& in, std::vector<uint8_t>& out,
size_t out_size) override;
bool Compress(SerializedData& in, size_t data_length, SerializedData& out) override;
bool Decompress(SerializedData& in, SerializedData& out) override;
};

55
logd/SerializedData.h Normal file
View File

@ -0,0 +1,55 @@
/*
* Copyright (C) 2020 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#pragma once
#include <sys/types.h>
#include <algorithm>
#include <memory>
// This class is used instead of std::string or std::vector because their clear(), erase(), etc
// functions don't actually deallocate. shrink_to_fit() does deallocate but is not guaranteed to
// work and swapping with an empty string/vector is clunky.
class SerializedData {
public:
SerializedData() {}
SerializedData(size_t size) : data_(new uint8_t[size]), size_(size) {}
void Resize(size_t new_size) {
if (size_ == 0) {
data_.reset(new uint8_t[new_size]);
size_ = new_size;
} else if (new_size == 0) {
data_.reset();
size_ = 0;
} else if (new_size != size_) {
std::unique_ptr<uint8_t[]> new_data(new uint8_t[new_size]);
size_t copy_size = std::min(size_, new_size);
memcpy(new_data.get(), data_.get(), copy_size);
data_.swap(new_data);
size_ = new_size;
}
}
uint8_t* data() { return data_.get(); }
const uint8_t* data() const { return data_.get(); }
size_t size() const { return size_; }
private:
std::unique_ptr<uint8_t[]> data_;
size_t size_ = 0;
};

View File

@ -25,14 +25,13 @@ SerializedLogChunk::~SerializedLogChunk() {
}
void SerializedLogChunk::Compress() {
if (compressed_log_.empty()) {
CompressionEngine::GetInstance().Compress({contents_.data(), write_offset_},
compressed_log_);
if (compressed_log_.size() == 0) {
CompressionEngine::GetInstance().Compress(contents_, write_offset_, compressed_log_);
LOG(INFO) << "Compressed Log, buffer max size: " << contents_.size()
<< " size used: " << write_offset_
<< " compressed size: " << compressed_log_.size();
}
contents_.resize(0);
contents_.Resize(0);
}
// TODO: Develop a better reference counting strategy to guard against the case where the writer is
@ -41,7 +40,8 @@ void SerializedLogChunk::IncReaderRefCount() {
if (++reader_ref_count_ != 1 || writer_active_) {
return;
}
CompressionEngine::GetInstance().Decompress(compressed_log_, contents_, write_offset_);
contents_.Resize(write_offset_);
CompressionEngine::GetInstance().Decompress(compressed_log_, contents_);
}
void SerializedLogChunk::DecReaderRefCount(bool compress) {
@ -90,7 +90,7 @@ bool SerializedLogChunk::ClearUidLogs(uid_t uid, log_id_t log_id, LogStatistics*
// Clear the old compressed logs and set write_offset_ appropriately for DecReaderRefCount()
// to compress the new partially cleared log.
if (new_write_offset != write_offset_) {
compressed_log_.clear();
compressed_log_.Resize(0);
write_offset_ = new_write_offset;
}

View File

@ -18,14 +18,14 @@
#include <sys/types.h>
#include <vector>
#include "LogWriter.h"
#include "SerializedData.h"
#include "SerializedLogEntry.h"
class SerializedLogChunk {
public:
explicit SerializedLogChunk(size_t size) : contents_(size) {}
SerializedLogChunk(SerializedLogChunk&& other) noexcept = default;
~SerializedLogChunk();
void Compress();
@ -66,10 +66,10 @@ class SerializedLogChunk {
private:
// The decompressed contents of this log buffer. Deallocated when the ref_count reaches 0 and
// writer_active_ is false.
std::vector<uint8_t> contents_;
SerializedData contents_;
int write_offset_ = 0;
uint32_t reader_ref_count_ = 0;
bool writer_active_ = true;
uint64_t highest_sequence_number_ = 1;
std::vector<uint8_t> compressed_log_;
SerializedData compressed_log_;
};