2016-10-30 15:48:40 -04:00
|
|
|
/*
|
|
|
|
PARTIO SOFTWARE
|
|
|
|
Copyright 2010 Disney Enterprises, Inc. All rights reserved
|
|
|
|
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
|
|
modification, are permitted provided that the following conditions are
|
|
|
|
met:
|
|
|
|
|
|
|
|
* Redistributions of source code must retain the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer.
|
|
|
|
|
|
|
|
* Redistributions in binary form must reproduce the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer in
|
|
|
|
the documentation and/or other materials provided with the
|
|
|
|
distribution.
|
|
|
|
|
|
|
|
* The names "Disney", "Walt Disney Pictures", "Walt Disney Animation
|
|
|
|
Studios" or the names of its contributors may NOT be used to
|
|
|
|
endorse or promote products derived from this software without
|
|
|
|
specific prior written permission from Walt Disney Pictures.
|
|
|
|
|
|
|
|
Disclaimer: THIS SOFTWARE IS PROVIDED BY WALT DISNEY PICTURES AND
|
|
|
|
CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING,
|
|
|
|
BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY, FITNESS
|
|
|
|
FOR A PARTICULAR PURPOSE, NONINFRINGEMENT AND TITLE ARE DISCLAIMED.
|
|
|
|
IN NO EVENT SHALL WALT DISNEY PICTURES, THE COPYRIGHT HOLDER OR
|
|
|
|
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
|
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
|
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
|
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND BASED ON ANY
|
|
|
|
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
|
|
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
|
|
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGES.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <algorithm>
|
2016-11-09 19:52:18 -05:00
|
|
|
#include <array>
|
2016-10-30 15:48:40 -04:00
|
|
|
#include <cassert>
|
2016-11-07 21:11:30 -05:00
|
|
|
#include <cstring>
|
2016-10-30 15:48:40 -04:00
|
|
|
#include <fstream>
|
|
|
|
#include <iomanip>
|
|
|
|
#include <iostream>
|
2016-10-31 21:53:22 -04:00
|
|
|
#include <iterator> // for std::back_inserter
|
2016-10-30 15:48:40 -04:00
|
|
|
#include <stdexcept>
|
|
|
|
#include <string>
|
|
|
|
|
2016-10-31 21:53:22 -04:00
|
|
|
extern "C" {
|
2016-10-31 20:48:43 -04:00
|
|
|
#include <zlib.h>
|
2016-10-31 20:55:05 -04:00
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-10-31 20:48:43 -04:00
|
|
|
#include <detail/zip.hpp>
|
2016-11-09 19:52:18 -05:00
|
|
|
#include <xlnt/utils/exceptions.hpp>
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-10-31 20:48:43 -04:00
|
|
|
namespace xlnt {
|
|
|
|
namespace detail {
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
/// Reads sizeof(T) raw bytes from `stream` and returns them as a T.
/// The bytes are taken in host byte order; no endianness conversion is performed.
/// If the stream cannot supply every byte, std::istream::read sets the stream's
/// failure flags and the bytes that were not read stay zero.
template <class T>
inline T read_int(std::istream &stream)
{
    // Value-initialise so a failed or short read never returns indeterminate data.
    T value{};
    stream.read(reinterpret_cast<char *>(&value), sizeof(T));
    return value;
}
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
/// Emits the object representation of `value` (sizeof(T) bytes, host byte order)
/// to `stream`.
template <class T>
inline void write_int(std::ostream &stream, T value)
{
    const auto *raw_bytes = reinterpret_cast<const char *>(&value);
    stream.write(raw_bytes, static_cast<std::streamsize>(sizeof(T)));
}
|
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
/// Default constructor. It does no work of its own, so every field keeps whatever
/// default the class declaration gives it.
zip_file_header::zip_file_header() = default;
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
bool zip_file_header::read(std::istream &istream, const bool global)
|
2016-10-31 22:41:20 -04:00
|
|
|
{
|
|
|
|
auto sig = read_int<std::uint32_t>(istream);
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
// read and check for local/global magic
|
2016-11-07 21:11:30 -05:00
|
|
|
if (global)
|
2016-10-31 22:41:20 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
if (sig != 0x02014b50)
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
std::cerr << "Did not find global header signature" << std::endl;
|
2016-10-31 20:48:43 -04:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
version = read_int<std::uint16_t>(istream);
|
2016-10-31 22:41:20 -04:00
|
|
|
}
|
2016-11-07 21:11:30 -05:00
|
|
|
else if (sig != 0x04034b50)
|
2016-10-31 22:41:20 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
std::cerr << "Did not find local header signature" << std::endl;
|
2016-10-31 22:41:20 -04:00
|
|
|
return false;
|
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
// Read rest of header
|
|
|
|
version = read_int<std::uint16_t>(istream);
|
|
|
|
flags = read_int<std::uint16_t>(istream);
|
|
|
|
compression_type = read_int<std::uint16_t>(istream);
|
|
|
|
stamp_date = read_int<std::uint16_t>(istream);
|
|
|
|
stamp_time = read_int<std::uint16_t>(istream);
|
|
|
|
crc = read_int<std::uint32_t>(istream);
|
|
|
|
compressed_size = read_int<std::uint32_t>(istream);
|
|
|
|
uncompressed_size = read_int<std::uint32_t>(istream);
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
auto filename_length = read_int<std::uint16_t>(istream);
|
|
|
|
auto extra_length = read_int<std::uint16_t>(istream);
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
std::uint16_t comment_length = 0;
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (global)
|
2016-10-31 22:41:20 -04:00
|
|
|
{
|
|
|
|
comment_length = read_int<std::uint16_t>(istream);
|
2016-11-07 21:11:30 -05:00
|
|
|
/*std::uint16_t disk_number_start = */ read_int<std::uint16_t>(istream);
|
|
|
|
/*std::uint16_t int_file_attrib = */ read_int<std::uint16_t>(istream);
|
|
|
|
/*std::uint32_t ext_file_attrib = */ read_int<std::uint32_t>(istream);
|
2016-10-31 22:41:20 -04:00
|
|
|
header_offset = read_int<std::uint32_t>(istream);
|
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
filename.resize(filename_length, '\0');
|
|
|
|
istream.read(&filename[0], filename_length);
|
2016-11-07 21:11:30 -05:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
extra.resize(extra_length, 0);
|
|
|
|
istream.read(reinterpret_cast<char *>(extra.data()), extra_length);
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
if (global)
|
|
|
|
{
|
|
|
|
comment.resize(comment_length, '\0');
|
|
|
|
istream.read(&comment[0], comment_length);
|
2016-10-31 20:48:43 -04:00
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-10-31 22:41:20 -04:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
void zip_file_header::Write(std::ostream &ostream, const bool global) const
|
2016-10-31 22:41:20 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
if (global)
|
|
|
|
{
|
|
|
|
write_int(ostream, static_cast<unsigned int>(0x02014b50)); // header sig
|
|
|
|
write_int(ostream, static_cast<unsigned short>(0)); // version made by
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
write_int(ostream, static_cast<unsigned int>(0x04034b50));
|
|
|
|
}
|
|
|
|
|
|
|
|
write_int(ostream, version);
|
|
|
|
write_int(ostream, flags);
|
|
|
|
write_int(ostream, compression_type);
|
|
|
|
write_int(ostream, stamp_date);
|
|
|
|
write_int(ostream, stamp_time);
|
|
|
|
write_int(ostream, crc);
|
|
|
|
write_int(ostream, compressed_size);
|
|
|
|
write_int(ostream, uncompressed_size);
|
|
|
|
write_int(ostream, static_cast<unsigned short>(filename.length()));
|
|
|
|
write_int(ostream, static_cast<unsigned short>(0)); // extra lengthx
|
|
|
|
|
|
|
|
if (global)
|
|
|
|
{
|
|
|
|
write_int(ostream, static_cast<unsigned short>(0)); // filecomment
|
|
|
|
write_int(ostream, static_cast<unsigned short>(0)); // disk# start
|
|
|
|
write_int(ostream, static_cast<unsigned short>(0)); // internal file
|
|
|
|
write_int(ostream, static_cast<unsigned int>(0)); // ext final
|
|
|
|
write_int(ostream, static_cast<unsigned int>(header_offset)); // rel offset
|
|
|
|
}
|
|
|
|
|
|
|
|
for (unsigned int i = 0; i < filename.length(); i++)
|
|
|
|
{
|
|
|
|
write_int(ostream, filename.c_str()[i]);
|
|
|
|
}
|
2016-10-31 22:41:20 -04:00
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-11-09 19:52:18 -05:00
|
|
|
/// Capacity, in bytes, of each fixed-size I/O buffer used by the zip stream buffers.
static constexpr std::size_t buffer_size{512};
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
class ZipStreambufDecompress : public std::streambuf
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
std::istream &istream;
|
2016-10-30 15:48:40 -04:00
|
|
|
|
|
|
|
z_stream strm;
|
2016-11-09 19:52:18 -05:00
|
|
|
std::array<char, buffer_size> in;
|
|
|
|
std::array<char, buffer_size> out;
|
2016-10-31 20:48:43 -04:00
|
|
|
zip_file_header header;
|
2016-11-09 19:52:18 -05:00
|
|
|
std::size_t total_read;
|
|
|
|
std::size_t total_uncompressed;
|
2016-10-30 15:48:40 -04:00
|
|
|
bool valid;
|
|
|
|
bool compressed_data;
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
static const unsigned short DEFLATE = 8;
|
|
|
|
static const unsigned short UNCOMPRESSED = 0;
|
|
|
|
|
2016-10-30 15:48:40 -04:00
|
|
|
public:
|
2016-11-07 21:11:30 -05:00
|
|
|
ZipStreambufDecompress(std::istream &stream, zip_file_header central_header)
|
|
|
|
: istream(stream), header(central_header), total_read(0), total_uncompressed(0), valid(true)
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
strm.zalloc = Z_NULL;
|
|
|
|
strm.zfree = Z_NULL;
|
|
|
|
strm.opaque = Z_NULL;
|
|
|
|
strm.avail_in = 0;
|
|
|
|
strm.next_in = Z_NULL;
|
2016-11-09 19:52:18 -05:00
|
|
|
|
|
|
|
setg(in.data(), in.data(), in.data());
|
2016-11-07 21:11:30 -05:00
|
|
|
setp(0, 0);
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-10-30 15:48:40 -04:00
|
|
|
// skip the header
|
2016-11-07 21:11:30 -05:00
|
|
|
valid = header.read(istream, false);
|
|
|
|
if (header.compression_type == DEFLATE)
|
2016-11-09 19:52:18 -05:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
compressed_data = true;
|
2016-11-09 19:52:18 -05:00
|
|
|
}
|
2016-11-07 21:11:30 -05:00
|
|
|
else if (header.compression_type == UNCOMPRESSED)
|
2016-11-09 19:52:18 -05:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
compressed_data = false;
|
2016-11-09 19:52:18 -05:00
|
|
|
}
|
2016-11-07 21:11:30 -05:00
|
|
|
else
|
|
|
|
{
|
|
|
|
compressed_data = false;
|
|
|
|
std::cerr << "ZIP: got unrecognized compressed data (Supported deflate/uncompressed)" << std::endl;
|
|
|
|
valid = false;
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-10-30 15:48:40 -04:00
|
|
|
// initialize the inflate
|
2016-11-07 21:11:30 -05:00
|
|
|
if (compressed_data && valid)
|
|
|
|
{
|
2016-11-09 19:52:18 -05:00
|
|
|
#pragma clang diagnostic push
|
|
|
|
#pragma clang diagnostic ignored "-Wold-style-cast"
|
2016-11-07 21:11:30 -05:00
|
|
|
int result = inflateInit2(&strm, -MAX_WBITS);
|
2016-11-09 19:52:18 -05:00
|
|
|
#pragma clang diagnostic pop
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (result != Z_OK)
|
|
|
|
{
|
|
|
|
std::cerr << "gzip: inflateInit2 did not return Z_OK" << std::endl;
|
|
|
|
valid = false;
|
|
|
|
}
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
header = central_header;
|
2016-10-30 15:48:40 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
virtual ~ZipStreambufDecompress()
|
2016-11-07 21:11:30 -05:00
|
|
|
{
|
2016-11-09 19:52:18 -05:00
|
|
|
if (compressed_data && valid)
|
|
|
|
{
|
|
|
|
inflateEnd(&strm);
|
|
|
|
}
|
2016-11-07 21:11:30 -05:00
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
|
|
|
int process()
|
2016-11-07 21:11:30 -05:00
|
|
|
{
|
|
|
|
if (!valid) return -1;
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (compressed_data)
|
|
|
|
{
|
|
|
|
strm.avail_out = buffer_size - 4;
|
2016-11-09 19:52:18 -05:00
|
|
|
strm.next_out = reinterpret_cast<Bytef *>(out.data() + 4);
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
while (strm.avail_out != 0)
|
|
|
|
{
|
|
|
|
if (strm.avail_in == 0)
|
2016-11-09 19:52:18 -05:00
|
|
|
{
|
|
|
|
// buffer empty, read some more from file
|
|
|
|
istream.read(in.data(), static_cast<std::streamsize>(std::min(buffer_size, header.compressed_size - total_read)));
|
|
|
|
strm.avail_in = static_cast<unsigned int>(istream.gcount());
|
2016-11-07 21:11:30 -05:00
|
|
|
total_read += strm.avail_in;
|
2016-11-09 19:52:18 -05:00
|
|
|
strm.next_in = reinterpret_cast<Bytef *>(in.data());
|
2016-11-07 21:11:30 -05:00
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
int ret = inflate(&strm, Z_NO_FLUSH); // decompress
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
switch (ret)
|
|
|
|
{
|
|
|
|
case Z_STREAM_ERROR:
|
|
|
|
std::cerr << "libz error Z_STREAM_ERROR" << std::endl;
|
|
|
|
valid = false;
|
|
|
|
return -1;
|
2016-10-30 15:48:40 -04:00
|
|
|
case Z_NEED_DICT:
|
|
|
|
case Z_DATA_ERROR:
|
2016-11-07 21:11:30 -05:00
|
|
|
case Z_MEM_ERROR:
|
|
|
|
std::cerr << "gzip error " << strm.msg << std::endl;
|
|
|
|
valid = false;
|
|
|
|
return -1;
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (ret == Z_STREAM_END) break;
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
|
|
|
auto unzip_count = buffer_size - strm.avail_out - 4;
|
2016-11-07 21:11:30 -05:00
|
|
|
total_uncompressed += unzip_count;
|
2016-11-09 19:52:18 -05:00
|
|
|
return static_cast<int>(unzip_count);
|
2016-11-07 21:11:30 -05:00
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
|
|
|
// uncompressed, so just read
|
|
|
|
istream.read(out.data() + 4, static_cast<std::streamsize>(std::min(buffer_size - 4, header.uncompressed_size - total_read)));
|
|
|
|
auto count = istream.gcount();
|
|
|
|
total_read += static_cast<std::size_t>(count);
|
|
|
|
return static_cast<int>(count);
|
2016-11-07 21:11:30 -05:00
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
|
|
|
virtual int underflow()
|
2016-11-07 21:11:30 -05:00
|
|
|
{
|
|
|
|
if (gptr() && (gptr() < egptr()))
|
|
|
|
return traits_type::to_int_type(*gptr()); // if we already have data just use it
|
2016-11-09 19:52:18 -05:00
|
|
|
auto put_back_count = gptr() - eback();
|
2016-11-07 21:11:30 -05:00
|
|
|
if (put_back_count > 4) put_back_count = 4;
|
2016-11-09 19:52:18 -05:00
|
|
|
std::memmove(out.data() + (4 - put_back_count), gptr() - put_back_count, static_cast<std::size_t>(put_back_count));
|
2016-11-07 21:11:30 -05:00
|
|
|
int num = process();
|
2016-11-09 19:52:18 -05:00
|
|
|
setg(out.data() + 4 - put_back_count, out.data() + 4, out.data() + 4 + num);
|
2016-11-07 21:11:30 -05:00
|
|
|
if (num <= 0) return EOF;
|
|
|
|
return traits_type::to_int_type(*gptr());
|
|
|
|
}
|
|
|
|
|
2016-11-09 19:52:18 -05:00
|
|
|
virtual int overflow(int c = EOF);
|
2016-10-30 15:48:40 -04:00
|
|
|
};
|
|
|
|
|
2016-11-09 19:52:18 -05:00
|
|
|
int ZipStreambufDecompress::overflow(int)
|
|
|
|
{
|
|
|
|
throw xlnt::exception("writing to read-only buffer");
|
|
|
|
}
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
class ZipStreambufCompress : public std::streambuf
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
std::ostream &ostream; // owned when header==0 (when not part of zip file)
|
2016-10-30 15:48:40 -04:00
|
|
|
|
|
|
|
z_stream strm;
|
2016-11-09 19:52:18 -05:00
|
|
|
std::array<char, buffer_size> in;
|
|
|
|
std::array<char, buffer_size> out;
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
zip_file_header *header;
|
2016-10-30 15:48:40 -04:00
|
|
|
unsigned int uncompressed_size;
|
|
|
|
unsigned int crc;
|
|
|
|
|
|
|
|
bool valid;
|
|
|
|
|
|
|
|
public:
|
2016-11-07 21:11:30 -05:00
|
|
|
ZipStreambufCompress(zip_file_header *central_header, std::ostream &stream)
|
2016-11-27 16:56:38 +01:00
|
|
|
: ostream(stream), strm({}), header(central_header), valid(true)
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
strm.zalloc = Z_NULL;
|
|
|
|
strm.zfree = Z_NULL;
|
|
|
|
strm.opaque = Z_NULL;
|
2016-11-09 19:52:18 -05:00
|
|
|
|
|
|
|
#pragma clang diagnostic push
|
|
|
|
#pragma clang diagnostic ignored "-Wold-style-cast"
|
2016-11-07 21:11:30 -05:00
|
|
|
int ret = deflateInit2(&strm, Z_DEFAULT_COMPRESSION, Z_DEFLATED, -MAX_WBITS, 8, Z_DEFAULT_STRATEGY);
|
2016-11-09 19:52:18 -05:00
|
|
|
#pragma clang diagnostic pop
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (ret != Z_OK)
|
|
|
|
{
|
|
|
|
std::cerr << "libz: failed to deflateInit" << std::endl;
|
|
|
|
valid = false;
|
|
|
|
return;
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
setg(0, 0, 0);
|
2016-11-09 19:52:18 -05:00
|
|
|
setp(in.data(), in.data() + buffer_size - 4); // we want to be 4 aligned
|
|
|
|
|
2016-10-30 15:48:40 -04:00
|
|
|
// Write appropriate header
|
2016-11-07 21:11:30 -05:00
|
|
|
if (header)
|
|
|
|
{
|
2016-11-09 19:52:18 -05:00
|
|
|
header->header_offset = static_cast<std::uint32_t>(stream.tellp());
|
2016-11-07 21:11:30 -05:00
|
|
|
header->Write(ostream, false);
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
uncompressed_size = crc = 0;
|
2016-10-30 15:48:40 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
virtual ~ZipStreambufCompress()
|
2016-11-07 21:11:30 -05:00
|
|
|
{
|
|
|
|
if (valid)
|
|
|
|
{
|
|
|
|
process(true);
|
|
|
|
deflateEnd(&strm);
|
|
|
|
if (header)
|
|
|
|
{
|
|
|
|
std::ios::streampos final_position = ostream.tellp();
|
|
|
|
header->uncompressed_size = uncompressed_size;
|
|
|
|
header->crc = crc;
|
|
|
|
ostream.seekp(header->header_offset);
|
|
|
|
header->Write(ostream, false);
|
|
|
|
ostream.seekp(final_position);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
write_int(ostream, crc);
|
|
|
|
write_int(ostream, uncompressed_size);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (!header) delete &ostream;
|
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
|
|
|
protected:
|
|
|
|
int process(bool flush)
|
2016-11-07 21:11:30 -05:00
|
|
|
{
|
|
|
|
if (!valid) return -1;
|
2016-11-09 19:52:18 -05:00
|
|
|
|
|
|
|
strm.next_in = reinterpret_cast<Bytef *>(pbase());
|
|
|
|
strm.avail_in = static_cast<unsigned int>(pptr() - pbase());
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
while (strm.avail_in != 0 || flush)
|
|
|
|
{
|
|
|
|
strm.avail_out = buffer_size;
|
2016-11-09 19:52:18 -05:00
|
|
|
strm.next_out = reinterpret_cast<Bytef *>(out.data());
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
int ret = deflate(&strm, flush ? Z_FINISH : Z_NO_FLUSH);
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (!(ret != Z_BUF_ERROR && ret != Z_STREAM_ERROR))
|
|
|
|
{
|
|
|
|
valid = false;
|
|
|
|
std::cerr << "gzip: gzip error " << strm.msg << std::endl;
|
|
|
|
;
|
|
|
|
return -1;
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
|
|
|
auto generated_output = static_cast<int>(strm.next_out - reinterpret_cast<std::uint8_t *>(out.data()));
|
|
|
|
ostream.write(out.data(), generated_output);
|
|
|
|
if (header) header->compressed_size += static_cast<unsigned int>(generated_output);
|
2016-11-07 21:11:30 -05:00
|
|
|
if (ret == Z_STREAM_END) break;
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
// update counts, crc's and buffers
|
2016-11-09 19:52:18 -05:00
|
|
|
auto consumed_input = static_cast<unsigned int>(pptr() - pbase());
|
2016-11-07 21:11:30 -05:00
|
|
|
uncompressed_size += consumed_input;
|
2016-11-09 19:52:18 -05:00
|
|
|
crc = static_cast<unsigned int>(crc32(crc, reinterpret_cast<Bytef *>(in.data()), consumed_input));
|
2016-11-07 21:11:30 -05:00
|
|
|
setp(pbase(), pbase() + buffer_size - 4);
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
return 1;
|
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
|
|
|
virtual int sync()
|
2016-11-07 21:11:30 -05:00
|
|
|
{
|
|
|
|
if (pptr() && pptr() > pbase()) return process(false);
|
|
|
|
return 0;
|
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
|
|
|
virtual int underflow()
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
2016-11-09 19:52:18 -05:00
|
|
|
throw std::runtime_error("Attempt to read write only ostream");
|
2016-10-31 20:48:43 -04:00
|
|
|
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-11-09 19:52:18 -05:00
|
|
|
virtual int overflow(int c = EOF);
|
|
|
|
};
|
|
|
|
|
|
|
|
int ZipStreambufCompress::overflow(int c)
|
|
|
|
{
|
|
|
|
if (c != EOF)
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
2016-11-09 19:52:18 -05:00
|
|
|
*pptr() = static_cast<char>(c);
|
|
|
|
pbump(1);
|
2016-10-31 20:48:43 -04:00
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
if (process(false) == EOF) return EOF;
|
|
|
|
return c;
|
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
/// Builds an input stream that reads through `buffer` and takes ownership of it.
zip_file_istream::zip_file_istream(std::unique_ptr<std::streambuf> &&buffer)
    : std::istream(buffer.get())
{
    // The base class only stores the raw pointer; keep the buffer alive in `buf`.
    buf.swap(buffer);
}
|
|
|
|
|
|
|
|
/// Nothing to do explicitly; the members clean up after themselves.
zip_file_istream::~zip_file_istream() = default;
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
/// Builds an output stream that writes through `buffer` and takes ownership of it.
zip_file_ostream::zip_file_ostream(std::unique_ptr<std::streambuf> &&buffer)
    : std::ostream(buffer.get())
{
    // The base class only stores the raw pointer; keep the buffer alive in `buf`.
    buf.swap(buffer);
}
|
2016-10-30 15:48:40 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
/// Nothing to do explicitly; the members clean up after themselves.
zip_file_ostream::~zip_file_ostream() = default;
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-12-02 14:37:50 +01:00
|
|
|
/// Prepares to write a zip archive to `stream`.
/// @throws std::runtime_error if `stream` is already in a failed state
ZipFileWriter::ZipFileWriter(std::ostream &stream)
    : tarstream_(stream)
{
    if (tarstream_.fail())
    {
        throw std::runtime_error("ZIP: Invalid file handle");
    }
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
/// Finishes the archive: completes any entry that is still open, then writes the
/// central directory (one record per entry) followed by the end-of-central-directory
/// record.
ZipFileWriter::~ZipFileWriter()
{
    // An entry stream that is still open flushes its compressed data when it is
    // destroyed. Destroy it now so that data lands before the central directory
    // instead of after it (members are destroyed only after this body has run).
    write_stream_.reset();

    // Write all file headers
    const std::ios::streampos final_position = tarstream_.tellp();

    for (const auto &file_header : file_headers_)
    {
        file_header.Write(tarstream_, true);
    }

    const std::ios::streampos central_end = tarstream_.tellp();

    // Write end of central
    write_int(tarstream_, static_cast<std::uint32_t>(0x06054b50)); // end of central directory signature
    write_int(tarstream_, static_cast<std::uint16_t>(0)); // number of this disk
    write_int(tarstream_, static_cast<std::uint16_t>(0)); // disk where the central directory starts
    write_int(tarstream_, static_cast<std::uint16_t>(file_headers_.size())); // entries on this disk
    write_int(tarstream_, static_cast<std::uint16_t>(file_headers_.size())); // entries in total
    write_int(tarstream_, static_cast<std::uint32_t>(central_end - final_position)); // size of central directory
    write_int(tarstream_, static_cast<std::uint32_t>(final_position)); // offset of central directory
    write_int(tarstream_, static_cast<std::uint16_t>(0)); // zip comment length
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
std::ostream &ZipFileWriter::open(const std::string &filename)
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-10-31 20:48:43 -04:00
|
|
|
zip_file_header header;
|
|
|
|
header.filename = filename;
|
|
|
|
file_headers_.push_back(header);
|
2016-12-02 14:37:50 +01:00
|
|
|
auto streambuf = std::make_unique<ZipStreambufCompress>(&file_headers_.back(), tarstream_);
|
2016-11-07 21:11:30 -05:00
|
|
|
auto stream = new zip_file_ostream(std::move(streambuf));
|
|
|
|
write_stream_.reset(stream);
|
|
|
|
return *write_stream_;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ZipFileWriter::close()
|
|
|
|
{
|
|
|
|
write_stream_.reset(nullptr);
|
2016-10-30 15:48:40 -04:00
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
/// Opens the zip archive held in `stream` and loads its central directory.
/// The result of read_central_header() is not checked here.
/// @throws std::runtime_error if `stream` is already in a failed state
ZipFileReader::ZipFileReader(std::istream &stream)
    : source_stream_(stream)
{
    if (stream.fail())
    {
        throw std::runtime_error("ZIP: Invalid file handle");
    }

    read_central_header();
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
/// Nothing to do explicitly; the members clean up after themselves.
ZipFileReader::~ZipFileReader() = default;
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
bool ZipFileReader::read_central_header()
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
|
|
|
// Find the header
|
|
|
|
// NOTE: this assumes the zip file header is the last thing written to file...
|
2016-11-07 21:11:30 -05:00
|
|
|
source_stream_.seekg(0, std::ios_base::end);
|
|
|
|
std::ios::streampos end_position = source_stream_.tellg();
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
auto max_comment_size = std::uint32_t(0xffff); // max size of header
|
|
|
|
auto read_size_before_comment = std::uint32_t(22);
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
std::ios::streamoff read_start = max_comment_size + read_size_before_comment;
|
2016-10-31 20:48:43 -04:00
|
|
|
|
2016-11-09 19:52:18 -05:00
|
|
|
if (read_start > end_position)
|
|
|
|
{
|
|
|
|
read_start = end_position;
|
|
|
|
}
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
source_stream_.seekg(end_position - read_start);
|
2016-10-31 20:48:43 -04:00
|
|
|
std::vector<char> buf(static_cast<std::size_t>(read_start), '\0');
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (read_start <= 0)
|
|
|
|
{
|
|
|
|
std::cerr << "ZIP: Invalid read buffer size" << std::endl;
|
|
|
|
return false;
|
|
|
|
}
|
2016-11-09 19:52:18 -05:00
|
|
|
|
2016-10-31 20:48:43 -04:00
|
|
|
source_stream_.read(buf.data(), read_start);
|
|
|
|
|
|
|
|
auto found_header = false;
|
|
|
|
std::size_t header_index = 0;
|
|
|
|
|
2016-11-09 19:52:18 -05:00
|
|
|
for (std::size_t i = 0; i < static_cast<std::size_t>(read_start - 3); ++i)
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
if (buf[i] == 0x50 && buf[i + 1] == 0x4b && buf[i + 2] == 0x05 && buf[i + 3] == 0x06)
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
|
|
|
found_header = true;
|
|
|
|
header_index = i;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (!found_header)
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
std::cerr << "ZIP: Failed to find zip header" << std::endl;
|
2016-10-31 20:48:43 -04:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-10-30 15:48:40 -04:00
|
|
|
// seek to end of central header and read
|
2016-10-31 20:48:43 -04:00
|
|
|
source_stream_.seekg(end_position - (read_start - static_cast<std::ptrdiff_t>(header_index)));
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
/*auto word = */ read_int<std::uint32_t>(source_stream_);
|
2016-10-31 20:48:43 -04:00
|
|
|
auto disk_number1 = read_int<std::uint16_t>(source_stream_);
|
|
|
|
auto disk_number2 = read_int<std::uint16_t>(source_stream_);
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (disk_number1 != disk_number2 || disk_number1 != 0)
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
std::cerr << "ZIP: multiple disk zip files are not supported" << std::endl;
|
2016-10-31 20:48:43 -04:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
auto num_files = read_int<std::uint16_t>(source_stream_); // one entry in center in this disk
|
|
|
|
auto num_files_this_disk = read_int<std::uint16_t>(source_stream_); // one entry in center
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
if (num_files != num_files_this_disk)
|
2016-10-31 20:48:43 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
std::cerr << "ZIP: multi disk zip files are not supported" << std::endl;
|
2016-10-31 20:48:43 -04:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-11-07 21:11:30 -05:00
|
|
|
/*auto size_of_header = */ read_int<std::uint32_t>(source_stream_); // size of header
|
2016-10-31 20:48:43 -04:00
|
|
|
auto header_offset = read_int<std::uint32_t>(source_stream_); // offset to header
|
|
|
|
|
2016-10-30 15:48:40 -04:00
|
|
|
// go to header and read all file headers
|
2016-10-31 20:48:43 -04:00
|
|
|
source_stream_.seekg(header_offset);
|
|
|
|
|
|
|
|
for (std::uint16_t i = 0; i < num_files; ++i)
|
|
|
|
{
|
|
|
|
zip_file_header header;
|
|
|
|
|
|
|
|
if (header.read(source_stream_, true))
|
|
|
|
{
|
|
|
|
file_headers_[header.filename] = header;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-10-30 15:48:40 -04:00
|
|
|
return true;
|
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
std::istream &ZipFileReader::open(const std::string &filename)
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-10-31 20:48:43 -04:00
|
|
|
if (!has_file(filename))
|
|
|
|
{
|
|
|
|
throw "not found";
|
2016-10-30 15:48:40 -04:00
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
auto header = file_headers_.at(filename);
|
|
|
|
source_stream_.seekg(header.header_offset);
|
2016-11-07 21:11:30 -05:00
|
|
|
auto streambuf = std::make_unique<ZipStreambufDecompress>(source_stream_, header);
|
|
|
|
read_stream_.reset(new zip_file_istream(std::move(streambuf)));
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
return *read_stream_;
|
2016-10-30 15:48:40 -04:00
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
std::vector<std::string> ZipFileReader::files() const
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-10-31 20:48:43 -04:00
|
|
|
std::vector<std::string> filenames;
|
|
|
|
std::transform(file_headers_.begin(), file_headers_.end(), std::back_inserter(filenames),
|
|
|
|
[](const std::pair<std::string, zip_file_header> &h) { return h.first; });
|
|
|
|
return filenames;
|
2016-10-30 15:48:40 -04:00
|
|
|
}
|
2016-10-31 20:48:43 -04:00
|
|
|
|
|
|
|
bool ZipFileReader::has_file(const std::string &filename) const
|
2016-10-30 15:48:40 -04:00
|
|
|
{
|
2016-11-07 21:11:30 -05:00
|
|
|
return file_headers_.count(filename) != 0;
|
2016-10-30 15:48:40 -04:00
|
|
|
}
|
|
|
|
|
2016-10-31 20:48:43 -04:00
|
|
|
} // namespace detail
|
|
|
|
} // namespace xlnt
|