400 lines
8.4 KiB
C
400 lines
8.4 KiB
C
|
/* xdelta3 - delta compression tools and library -*- Mode: C++ -*-
|
||
|
Copyright 2016 Joshua MacDonald
|
||
|
|
||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
you may not use this file except in compliance with the License.
|
||
|
You may obtain a copy of the License at
|
||
|
|
||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||
|
|
||
|
Unless required by applicable law or agreed to in writing, software
|
||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
See the License for the specific language governing permissions and
|
||
|
limitations under the License.
|
||
|
*/
|
||
|
class Block;
|
||
|
class BlockIterator;
|
||
|
class TmpFile;
|
||
|
|
||
|
class Block {
|
||
|
public:
|
||
|
Block()
|
||
|
: data_(NULL),
|
||
|
data_size_(0),
|
||
|
size_(0) { }
|
||
|
|
||
|
~Block() {
|
||
|
if (data_) {
|
||
|
delete [] data_;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
size_t Size() const {
|
||
|
return size_;
|
||
|
}
|
||
|
|
||
|
uint8_t operator[](size_t i) const {
|
||
|
CHECK_LT(i, size_);
|
||
|
return data_[i];
|
||
|
}
|
||
|
|
||
|
uint8_t* Data() const {
|
||
|
if (data_ == NULL) {
|
||
|
CHECK_EQ(0, size_);
|
||
|
data_size_ = 1;
|
||
|
data_ = new uint8_t[1];
|
||
|
}
|
||
|
return data_;
|
||
|
}
|
||
|
|
||
|
// For writing to blocks
|
||
|
void Append(const uint8_t *data, size_t size) {
|
||
|
if (data_ == NULL) {
|
||
|
CHECK_EQ(0, size_);
|
||
|
CHECK_EQ(0, data_size_);
|
||
|
data_ = new uint8_t[Constants::BLOCK_SIZE];
|
||
|
data_size_ = Constants::BLOCK_SIZE;
|
||
|
}
|
||
|
|
||
|
if (size_ + size > data_size_) {
|
||
|
uint8_t *tmp = data_;
|
||
|
while (size_ + size > data_size_) {
|
||
|
data_size_ *= 2;
|
||
|
}
|
||
|
data_ = new uint8_t[data_size_];
|
||
|
memcpy(data_, tmp, size_);
|
||
|
delete [] tmp;
|
||
|
}
|
||
|
|
||
|
memcpy(data_ + size_, data, size);
|
||
|
size_ += size;
|
||
|
}
|
||
|
|
||
|
// For cleaing a block
|
||
|
void Reset() {
|
||
|
size_ = 0;
|
||
|
}
|
||
|
|
||
|
// Note: This does not benefit from -Wformat= checking, due to the
|
||
|
// enclosing template. Further, it was not used.
|
||
|
// void Print() const {
|
||
|
// xoff_t pos = 0;
|
||
|
// for (size_t i = 0; i < Size(); i++) {
|
||
|
// if (pos % 16 == 0) {
|
||
|
// DP(RINT "%5" Q "x: ", pos);
|
||
|
// }
|
||
|
// DP(RINT "%02x ", (*this)[i]);
|
||
|
// if (pos % 16 == 15) {
|
||
|
// DP(RINT "\n");
|
||
|
// }
|
||
|
// pos++;
|
||
|
// }
|
||
|
// DP(RINT "\n");
|
||
|
// }
|
||
|
|
||
|
void WriteTmpFile(TmpFile *f) const {
|
||
|
f->Append(this);
|
||
|
}
|
||
|
|
||
|
void SetSize(size_t size) {
|
||
|
uint8_t *t = NULL;
|
||
|
if (data_size_ < size) {
|
||
|
if (data_) {
|
||
|
t = data_;
|
||
|
}
|
||
|
data_ = new uint8_t[size];
|
||
|
data_size_ = size;
|
||
|
}
|
||
|
if (t && size < size_) {
|
||
|
memcpy(data_, t, size);
|
||
|
}
|
||
|
delete [] t;
|
||
|
size_ = size;
|
||
|
}
|
||
|
|
||
|
private:
|
||
|
friend class BlockIterator;
|
||
|
|
||
|
mutable uint8_t *data_;
|
||
|
mutable size_t data_size_;
|
||
|
size_t size_;
|
||
|
};
|
||
|
|
||
|
class FileSpec {
|
||
|
public:
|
||
|
FileSpec(MTRandom *rand)
|
||
|
: rand_(rand) {
|
||
|
}
|
||
|
|
||
|
// Generates a file with a known size
|
||
|
void GenerateFixedSize(xoff_t size) {
|
||
|
Reset();
|
||
|
|
||
|
for (xoff_t p = 0; p < size; ) {
|
||
|
xoff_t t = min(Constants::BLOCK_SIZE, size - p);
|
||
|
table_.insert(make_pair(p, Segment(t, rand_)));
|
||
|
p += t;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Generates a file with exponential-random distributed size
|
||
|
void GenerateRandomSize(xoff_t mean) {
|
||
|
GenerateFixedSize(rand_->ExpRand(mean));
|
||
|
}
|
||
|
|
||
|
// Returns the size of the file
|
||
|
xoff_t Size() const {
|
||
|
if (table_.empty()) {
|
||
|
return 0;
|
||
|
}
|
||
|
ConstSegmentMapIterator i = --table_.end();
|
||
|
return i->first + i->second.Size();
|
||
|
}
|
||
|
|
||
|
// Returns the number of blocks
|
||
|
xoff_t Blocks(size_t blksize = Constants::BLOCK_SIZE) const {
|
||
|
if (table_.empty()) {
|
||
|
return 0;
|
||
|
}
|
||
|
return ((Size() - 1) / blksize) + 1;
|
||
|
}
|
||
|
|
||
|
// Returns the number of segments
|
||
|
xoff_t Segments() const {
|
||
|
return table_.size();
|
||
|
}
|
||
|
|
||
|
// Create a mutation according to "what".
|
||
|
void ModifyTo(const Mutator &mutator,
|
||
|
FileSpec *modify) const {
|
||
|
modify->Reset();
|
||
|
mutator.Mutate(&modify->table_, &table_, rand_);
|
||
|
modify->CheckSegments();
|
||
|
}
|
||
|
|
||
|
void CheckSegments() const {
|
||
|
for (ConstSegmentMapIterator iter(table_.begin());
|
||
|
iter != table_.end(); ) {
|
||
|
ConstSegmentMapIterator iter0(iter++);
|
||
|
if (iter == table_.end()) {
|
||
|
break;
|
||
|
}
|
||
|
CHECK_EQ(iter0->first + iter0->second.Size(), iter->first);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void Reset() {
|
||
|
table_.clear();
|
||
|
}
|
||
|
|
||
|
void Print() const {
|
||
|
for (ConstSegmentMapIterator iter(table_.begin());
|
||
|
iter != table_.end();
|
||
|
++iter) {
|
||
|
const Segment &seg = iter->second;
|
||
|
cerr << "Segment at " << iter->first
|
||
|
<< " (" << seg.ToString() << ")" << endl;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void PrintData() const {
|
||
|
Block block;
|
||
|
for (BlockIterator iter(*this); !iter.Done(); iter.Next()) {
|
||
|
iter.Get(&block);
|
||
|
block.Print();
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void WriteTmpFile(TmpFile *f) const {
|
||
|
Block block;
|
||
|
for (BlockIterator iter(*this); !iter.Done(); iter.Next()) {
|
||
|
iter.Get(&block);
|
||
|
f->Append(&block);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void Get(Block *block, xoff_t offset, size_t size) const {
|
||
|
size_t got = 0;
|
||
|
block->SetSize(size);
|
||
|
|
||
|
ConstSegmentMapIterator pos = table_.upper_bound(offset);
|
||
|
if (pos == table_.begin()) {
|
||
|
CHECK_EQ(0, Size());
|
||
|
return;
|
||
|
}
|
||
|
--pos;
|
||
|
|
||
|
while (got < size) {
|
||
|
CHECK(pos != table_.end());
|
||
|
CHECK_GE(offset, pos->first);
|
||
|
|
||
|
const Segment &seg = pos->second;
|
||
|
|
||
|
// The position of this segment may start before this block starts,
|
||
|
// and then the position of the data may be offset from the seeding
|
||
|
// position.
|
||
|
size_t seg_offset = offset - pos->first;
|
||
|
size_t advance = min(seg.Size() - seg_offset,
|
||
|
size - got);
|
||
|
|
||
|
seg.Fill(seg_offset, advance, block->Data() + got);
|
||
|
|
||
|
got += advance;
|
||
|
offset += advance;
|
||
|
++pos;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
typedef BlockIterator iterator;
|
||
|
|
||
|
private:
|
||
|
friend class BlockIterator;
|
||
|
|
||
|
MTRandom *rand_;
|
||
|
SegmentMap table_;
|
||
|
};
|
||
|
|
||
|
class BlockIterator {
|
||
|
public:
|
||
|
explicit BlockIterator(const FileSpec& spec)
|
||
|
: spec_(spec),
|
||
|
blkno_(0),
|
||
|
blksize_(Constants::BLOCK_SIZE) { }
|
||
|
|
||
|
BlockIterator(const FileSpec& spec,
|
||
|
size_t blksize)
|
||
|
: spec_(spec),
|
||
|
blkno_(0),
|
||
|
blksize_(blksize) { }
|
||
|
|
||
|
bool Done() const {
|
||
|
return blkno_ >= spec_.Blocks(blksize_);
|
||
|
}
|
||
|
|
||
|
void Next() {
|
||
|
blkno_++;
|
||
|
}
|
||
|
|
||
|
xoff_t Blkno() const {
|
||
|
return blkno_;
|
||
|
}
|
||
|
|
||
|
xoff_t Blocks() const {
|
||
|
return spec_.Blocks(blksize_);
|
||
|
}
|
||
|
|
||
|
xoff_t Offset() const {
|
||
|
return blkno_ * blksize_;
|
||
|
}
|
||
|
|
||
|
void SetBlock(xoff_t blkno) {
|
||
|
CHECK_LE(blkno, Blocks());
|
||
|
blkno_ = blkno;
|
||
|
}
|
||
|
|
||
|
void Get(Block *block) const {
|
||
|
spec_.Get(block, blkno_ * blksize_, BytesOnBlock());
|
||
|
}
|
||
|
|
||
|
size_t BytesOnBlock() const {
|
||
|
xoff_t blocks = spec_.Blocks(blksize_);
|
||
|
xoff_t size = spec_.Size();
|
||
|
|
||
|
DCHECK((blkno_ < blocks) ||
|
||
|
(blkno_ == blocks && size % blksize_ == 0));
|
||
|
|
||
|
if (blkno_ == blocks) {
|
||
|
return 0;
|
||
|
}
|
||
|
if (blkno_ + 1 == blocks) {
|
||
|
return ((size - 1) % blksize_) + 1;
|
||
|
}
|
||
|
return blksize_;
|
||
|
}
|
||
|
|
||
|
size_t BlockSize() const {
|
||
|
return blksize_;
|
||
|
}
|
||
|
|
||
|
private:
|
||
|
const FileSpec& spec_;
|
||
|
xoff_t blkno_;
|
||
|
size_t blksize_;
|
||
|
};
|
||
|
|
||
|
class ExtFile {
|
||
|
public:
|
||
|
ExtFile() {
|
||
|
static int static_counter = 0;
|
||
|
pid_t pid = getpid();
|
||
|
char buf[64];
|
||
|
xoff_t xpid = pid;
|
||
|
snprintf(buf, 64, "/tmp/regtest.%" Q "u.%d", xpid, static_counter++);
|
||
|
filename_.append(buf);
|
||
|
unlink(filename_.c_str());
|
||
|
}
|
||
|
|
||
|
~ExtFile() {
|
||
|
unlink(filename_.c_str());
|
||
|
}
|
||
|
|
||
|
const char* Name() const {
|
||
|
return filename_.c_str();
|
||
|
}
|
||
|
|
||
|
// Check whether a real file matches a file spec.
|
||
|
bool EqualsSpec(const FileSpec &spec) const {
|
||
|
main_file t;
|
||
|
main_file_init(&t);
|
||
|
CHECK_EQ(0, main_file_open(&t, Name(), XO_READ));
|
||
|
|
||
|
Block tblock;
|
||
|
Block sblock;
|
||
|
for (BlockIterator iter(spec); !iter.Done(); iter.Next()) {
|
||
|
iter.Get(&sblock);
|
||
|
tblock.SetSize(sblock.Size());
|
||
|
size_t tread;
|
||
|
CHECK_EQ(0, main_file_read(&t,
|
||
|
tblock.Data(),
|
||
|
tblock.Size(), &tread, "read failed"));
|
||
|
CHECK_EQ(0, CmpDifferentBlockBytes(tblock, sblock));
|
||
|
}
|
||
|
|
||
|
CHECK_EQ(0, main_file_close(&t));
|
||
|
main_file_cleanup(&t);
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
protected:
|
||
|
string filename_;
|
||
|
};
|
||
|
|
||
|
class TmpFile : public ExtFile {
|
||
|
public:
|
||
|
TmpFile() {
|
||
|
main_file_init(&file_);
|
||
|
CHECK_EQ(0, main_file_open(&file_, Name(), XO_WRITE));
|
||
|
}
|
||
|
|
||
|
~TmpFile() {
|
||
|
main_file_cleanup(&file_);
|
||
|
}
|
||
|
|
||
|
void Append(const Block *block) {
|
||
|
CHECK_EQ(0, main_file_write(&file_,
|
||
|
block->Data(), block->Size(),
|
||
|
"tmpfile write failed"));
|
||
|
}
|
||
|
|
||
|
const char* Name() const {
|
||
|
if (main_file_isopen(&file_)) {
|
||
|
CHECK_EQ(0, main_file_close(&file_));
|
||
|
}
|
||
|
return ExtFile::Name();
|
||
|
}
|
||
|
|
||
|
private:
|
||
|
mutable main_file file_;
|
||
|
};
|