xlnt/source/workbook.cpp

698 lines
18 KiB
C++
Raw Normal View History

2014-05-22 05:48:51 +08:00
#include <algorithm>
2014-06-11 05:12:15 +08:00
#include <array>
2014-06-05 06:42:17 +08:00
#include <fstream>
#include <set>
2014-05-21 22:20:30 +08:00
#include <sstream>
#include <pugixml.hpp>
2014-06-11 06:36:31 +08:00
#ifdef _WIN32
2014-06-11 05:12:15 +08:00
#include <Windows.h>
2014-06-11 06:36:31 +08:00
#endif
2014-06-11 05:12:15 +08:00
2014-08-14 06:56:34 +08:00
#include <xlnt/workbook/workbook.hpp>
#include <xlnt/common/exceptions.hpp>
#include <xlnt/drawing/drawing.hpp>
#include <xlnt/worksheet/range.hpp>
#include <xlnt/reader/reader.hpp>
#include <xlnt/common/relationship.hpp>
#include <xlnt/worksheet/worksheet.hpp>
#include <xlnt/writer/writer.hpp>
#include <xlnt/common/zip_file.hpp>
#include <xlnt/workbook/document_properties.hpp>
#include <xlnt/writer/style_writer.hpp>
2014-06-06 04:19:31 +08:00
#include "detail/cell_impl.hpp"
#include "detail/workbook_impl.hpp"
#include "detail/worksheet_impl.hpp"
2014-05-21 22:20:30 +08:00
2014-06-11 05:12:15 +08:00
/// Returns the path of the scratch file the stream/buffer overloads of
/// workbook::load and workbook::save use as an intermediate.
///
/// On Windows the file is "xlnt.xlsx" appended to the directory reported by
/// GetTempPath; on other platforms it is the fixed path "/tmp/xlsx.xlnt".
/// Throws std::runtime_error when GetTempPath fails or reports a length
/// larger than MAX_PATH.
static std::string CreateTemporaryFilename()
{
#ifdef _WIN32
    std::array<TCHAR, MAX_PATH> path_buffer;
    const DWORD length = GetTempPath(static_cast<DWORD>(path_buffer.size()), path_buffer.data());

    // The two failure conditions are mutually exclusive, so their order is irrelevant.
    if(length == 0)
    {
        throw std::runtime_error("GetTempPath failed");
    }

    if(length > MAX_PATH)
    {
        throw std::runtime_error("buffer is too small");
    }

    std::string file_path(path_buffer.begin(), path_buffer.begin() + length);
    file_path += "xlnt.xlsx";
    return file_path;
#else
    return std::string("/tmp/xlsx.xlnt");
#endif
}
2014-05-21 22:20:30 +08:00
namespace xlnt {
2014-05-31 06:42:25 +08:00
namespace detail {
2014-07-25 05:31:46 +08:00
/// Initializes the shared workbook state: active sheet index 0, with type
/// guessing and data-only mode both switched off.
workbook_impl::workbook_impl()
    : active_sheet_index_(0),
      guess_types_(false),
      data_only_(false)
{
}
2014-07-25 05:31:46 +08:00
2014-05-31 06:42:25 +08:00
} // namespace detail
/// Builds a workbook that holds one sheet titled "Sheet" and registers the
/// shared-strings, styles and theme relationships (rId2 through rId4).
workbook::workbook()
    : d_(new detail::workbook_impl())
{
    create_sheet("Sheet");

    create_relationship("rId2", "sharedStrings.xml", relationship::type::shared_strings);
    create_relationship("rId3", "styles.xml", relationship::type::styles);
    create_relationship("rId4", "theme/theme1.xml", relationship::type::theme);
}
/// Creates an iterator over the sheets of `wb`, positioned at `index`.
workbook::iterator::iterator(workbook &wb, std::size_t index)
    : wb_(wb),
      index_(index)
{
}
2014-06-11 05:12:15 +08:00
/// Copies an iterator: same workbook reference, same position.
workbook::iterator::iterator(const iterator &rhs)
    : wb_(rhs.wb_),
      index_(rhs.index_)
{
}
/// Returns the worksheet at the iterator's current position, looked up
/// through the workbook's index operator.
worksheet workbook::iterator::operator*()
{
    worksheet current = wb_[index_];
    return current;
}
/// Pre-increment: advances to the next sheet position and returns this iterator.
workbook::iterator &workbook::iterator::operator++()
{
    ++index_;
    return *this;
}
/// Post-increment: advances to the next sheet position and returns an
/// iterator that still refers to the previous position.
workbook::iterator workbook::iterator::operator++(int)
{
    iterator previous(*this);
    ++index_;
    return previous;
}
/// Two iterators are equal when they sit at the same position of the same
/// workbook.
bool workbook::iterator::operator==(const iterator &comparand) const
{
    if(index_ != comparand.index_)
    {
        return false;
    }

    return wb_ == comparand.wb_;
}
/// Creates a read-only iterator over the sheets of `wb`, positioned at `index`.
workbook::const_iterator::const_iterator(const workbook &wb, std::size_t index)
    : wb_(wb),
      index_(index)
{
}
2014-06-11 05:12:15 +08:00
/// Copies a read-only iterator: same workbook reference, same position.
workbook::const_iterator::const_iterator(const const_iterator &rhs)
    : wb_(rhs.wb_),
      index_(rhs.index_)
{
}
/// Returns the worksheet at the iterator's current position, looked up with
/// the workbook's const get_sheet_by_index.
const worksheet workbook::const_iterator::operator*()
{
    const worksheet current = wb_.get_sheet_by_index(index_);
    return current;
}
/// Pre-increment: advances to the next sheet position and returns this iterator.
workbook::const_iterator &workbook::const_iterator::operator++()
{
    ++index_;
    return *this;
}
/// Post-increment: advances to the next sheet position and returns an
/// iterator that still refers to the previous position.
workbook::const_iterator workbook::const_iterator::operator++(int)
{
    const_iterator previous(*this);
    ++index_;
    return previous;
}
/// Two read-only iterators are equal when they sit at the same position of
/// the same workbook.
bool workbook::const_iterator::operator==(const const_iterator &comparand) const
{
    if(index_ != comparand.index_)
    {
        return false;
    }

    return wb_ == comparand.wb_;
}
2014-05-21 22:20:30 +08:00
/// Returns the first sheet whose stored title equals `name`, or a
/// default-constructed worksheet when no sheet has that title.
worksheet workbook::get_sheet_by_name(const std::string &name)
{
    auto &sheets = d_->worksheets_;
    auto match = std::find_if(sheets.begin(), sheets.end(),
        [&name](detail::worksheet_impl &candidate) { return candidate.title_ == name; });

    if(match == sheets.end())
    {
        return worksheet();
    }

    return worksheet(&*match);
}
/// Returns a handle to the sheet stored at `index`.
/// The index is not range-checked here (plain subscript access).
worksheet workbook::get_sheet_by_index(std::size_t index)
{
    auto &impl = d_->worksheets_[index];
    return worksheet(&impl);
}
/// Returns a handle to the sheet stored at `index`.
/// Unlike the non-const overload this one goes through the container's
/// `at()` accessor.
const worksheet workbook::get_sheet_by_index(std::size_t index) const
{
    auto &impl = d_->worksheets_.at(index);
    return worksheet(&impl);
}
/// Returns a handle to the sheet at the stored active-sheet index.
worksheet workbook::get_active_sheet()
{
    auto &active_impl = d_->worksheets_[d_->active_sheet_index_];
    return worksheet(&active_impl);
}
bool workbook::has_named_range(const std::string &name) const
2014-05-21 22:20:30 +08:00
{
for(auto worksheet : *this)
2014-05-21 22:20:30 +08:00
{
if(worksheet.has_named_range(name))
2014-05-21 22:20:30 +08:00
{
return true;
}
}
return false;
}
/// Appends a new sheet titled "Sheet<N>", where N is the smallest positive
/// number (starting from 1) whose title is not yet taken, and registers a
/// worksheet relationship for it. Returns a handle to the new sheet.
worksheet workbook::create_sheet()
{
    int suffix = 1;
    std::string title = "Sheet" + std::to_string(suffix);

    while(get_sheet_by_name(title) != nullptr)
    {
        ++suffix;
        title = "Sheet" + std::to_string(suffix);
    }

    d_->worksheets_.push_back(detail::worksheet_impl(this, title));

    // The relationship id counts existing relationships; the target file name
    // uses the sheet count after the new sheet was appended.
    const std::string relationship_id = "rId" + std::to_string(d_->relationships_.size() + 1);
    const std::string target = "xl/worksheets/sheet" + std::to_string(d_->worksheets_.size()) + ".xml";
    create_relationship(relationship_id, target, relationship::type::worksheet);

    return worksheet(&d_->worksheets_.back());
}
/// Appends a copy of the given worksheet's data to this workbook.
/// Throws std::runtime_error if the worksheet compares equal to a sheet
/// that is already part of this workbook.
void workbook::add_sheet(xlnt::worksheet worksheet)
{
    for(auto existing : *this)
    {
        const bool already_present = (worksheet == existing);

        if(already_present)
        {
            throw std::runtime_error("worksheet already in workbook");
        }
    }

    d_->worksheets_.emplace_back(*worksheet.d_);
}
/// Adds a copy of the given worksheet to this workbook so that it ends up at
/// position `index`; sheets at `index` and beyond move one position back and
/// keep their relative order.
///
/// Throws std::runtime_error if `index` is greater than the current number of
/// sheets, or (from the single-argument overload) if the worksheet is already
/// part of this workbook.
void workbook::add_sheet(xlnt::worksheet worksheet, std::size_t index)
{
    // Validate before mutating so a bad index leaves the workbook untouched.
    if(index > d_->worksheets_.size())
    {
        throw std::runtime_error("sheet index out of range");
    }

    add_sheet(worksheet);

    // The sheet was appended at the back; rotate it into place. A plain swap
    // with the back element would move the sheet formerly at `index` to the
    // end and reorder the workbook.
    auto &sheets = d_->worksheets_;
    std::rotate(sheets.begin() + index, sheets.end() - 1, sheets.end());
}
/// Returns the zero-based position of `worksheet` within this workbook.
/// Throws std::runtime_error when no sheet of this workbook compares equal
/// to it.
int workbook::get_index(xlnt::worksheet worksheet)
{
    int position = 0;

    for(auto candidate : *this)
    {
        if(worksheet == candidate)
        {
            return position;
        }

        ++position;
    }

    throw std::runtime_error("worksheet isn't owned by this workbook");
}
void workbook::create_named_range(const std::string &name, worksheet range_owner, const range_reference &reference)
2014-05-21 22:20:30 +08:00
{
auto match = get_sheet_by_name(range_owner.get_title());
if(match != nullptr)
2014-05-21 22:20:30 +08:00
{
match.create_named_range(name, reference);
return;
2014-05-21 22:20:30 +08:00
}
throw std::runtime_error("worksheet isn't owned by this workbook");
}
void workbook::remove_named_range(const std::string &name)
2014-05-21 22:20:30 +08:00
{
for(auto ws : *this)
2014-05-21 22:20:30 +08:00
{
if(ws.has_named_range(name))
2014-05-21 22:20:30 +08:00
{
ws.remove_named_range(name);
2014-05-21 22:20:30 +08:00
return;
}
}
throw std::runtime_error("named range not found");
2014-05-21 22:20:30 +08:00
}
/// Returns the named range `name` from the first sheet that has it.
/// Throws std::runtime_error when no sheet has a named range with that name.
range workbook::get_named_range(const std::string &name)
{
    for(auto sheet : *this)
    {
        if(!sheet.has_named_range(name))
        {
            continue;
        }

        return sheet.get_named_range(name);
    }

    throw std::runtime_error("named range not found");
}
bool workbook::load(const std::istream &stream)
{
std::string temp_file = CreateTemporaryFilename();
std::ofstream tmp;
tmp.open(temp_file, std::ios::out | std::ios::binary);
tmp << stream.rdbuf();
tmp.close();
load(temp_file);
std::remove(temp_file.c_str());
return true;
}
2014-06-05 06:42:17 +08:00
bool workbook::load(const std::vector<unsigned char> &data)
{
2014-06-11 05:12:15 +08:00
std::string temp_file = CreateTemporaryFilename();
std::ofstream tmp;
tmp.open(temp_file, std::ios::out | std::ios::binary);
for(auto c : data)
2014-06-05 06:42:17 +08:00
{
2014-06-11 05:12:15 +08:00
tmp.put(c);
2014-06-05 06:42:17 +08:00
}
2014-06-11 05:12:15 +08:00
tmp.close();
load(temp_file);
std::remove(temp_file.c_str());
return true;
2014-06-05 06:42:17 +08:00
}
bool workbook::load(const std::string &filename)
2014-05-21 22:20:30 +08:00
{
2014-08-02 04:46:54 +08:00
zip_file f;
try
{
f.load(filename);
}
catch(std::exception e)
{
throw invalid_file_exception(filename);
}
2014-07-20 04:59:05 +08:00
auto content_types = reader::read_content_types(f);
auto type = reader::determine_document_type(content_types);
2014-08-02 04:46:54 +08:00
2014-05-21 22:20:30 +08:00
if(type != "excel")
{
2014-08-02 04:46:54 +08:00
throw invalid_file_exception(filename);
2014-05-21 22:20:30 +08:00
}
2014-07-20 02:43:48 +08:00
clear();
2014-07-25 05:31:46 +08:00
auto workbook_relationships = reader::read_relationships(f, "xl/workbook.xml");
for(auto relationship : workbook_relationships)
{
create_relationship(relationship.get_id(), relationship.get_target_uri(), relationship.get_type());
}
2014-05-21 22:20:30 +08:00
pugi::xml_document doc;
2014-08-01 21:44:21 +08:00
doc.load(f.read("xl/workbook.xml").c_str());
2014-05-21 22:20:30 +08:00
auto root_node = doc.child("workbook");
auto workbook_pr_node = root_node.child("workbookPr");
2014-07-20 04:59:05 +08:00
get_properties().excel_base_date = (workbook_pr_node.attribute("date1904") != nullptr && workbook_pr_node.attribute("date1904").as_int() != 0) ? calendar::mac_1904 : calendar::windows_1900;
2014-05-21 22:20:30 +08:00
auto sheets_node = root_node.child("sheets");
std::vector<std::string> shared_strings;
2014-08-02 04:46:54 +08:00
if(f.has_file("xl/sharedStrings.xml"))
2014-05-21 22:20:30 +08:00
{
2014-08-02 04:46:54 +08:00
shared_strings = xlnt::reader::read_shared_string(f.read("xl/sharedStrings.xml"));
2014-05-21 22:20:30 +08:00
}
2014-07-17 07:53:45 +08:00
std::vector<int> number_format_ids;
2014-08-02 04:46:54 +08:00
if(f.has_file("xl/styles.xml"))
2014-07-17 07:53:45 +08:00
{
2014-07-20 02:43:48 +08:00
pugi::xml_document styles_doc;
2014-08-02 04:46:54 +08:00
styles_doc.load(f.read("xl/styles.xml").c_str());
2014-07-20 02:43:48 +08:00
auto stylesheet_node = styles_doc.child("styleSheet");
auto cell_xfs_node = stylesheet_node.child("cellXfs");
for(auto xf_node : cell_xfs_node.children("xf"))
{
number_format_ids.push_back(xf_node.attribute("numFmtId").as_int());
}
2014-07-17 07:53:45 +08:00
}
2014-05-21 22:20:30 +08:00
for(auto sheet_node : sheets_node.children("sheet"))
{
std::string rel_id = sheet_node.attribute("r:id").as_string();
auto rel = std::find_if(d_->relationships_.begin(), d_->relationships_.end(),
[&](relationship &rel) { return rel.get_id() == rel_id; });
if (rel == d_->relationships_.end())
{
throw std::runtime_error("relationship not found");
}
auto ws = create_sheet(sheet_node.attribute("name").as_string(), *rel);
auto sheet_filename = rel->get_target_uri();
2014-08-01 21:44:21 +08:00
xlnt::reader::read_worksheet(ws, f.read(sheet_filename).c_str(), shared_strings, number_format_ids);
2014-05-21 22:20:30 +08:00
}
2014-06-05 06:42:17 +08:00
return true;
2014-05-21 22:20:30 +08:00
}
2014-07-25 05:31:46 +08:00
/// Stores the guess-types flag of this workbook.
void workbook::set_guess_types(bool guess)
{
    auto &state = *d_;
    state.guess_types_ = guess;
}
/// Returns the stored guess-types flag of this workbook.
bool workbook::get_guess_types() const
{
    const bool guess = d_->guess_types_;
    return guess;
}
2014-07-20 02:43:48 +08:00
/// Appends a relationship with the given id, target and type to this
/// workbook's relationship list. No uniqueness check is performed on `id`.
void workbook::create_relationship(const std::string &id, const std::string &target, relationship::type type)
{
    auto &relationships = d_->relationships_;
    relationships.push_back(relationship(type, id, target));
}
/// Returns a copy of the first relationship whose id equals `id`.
/// Throws std::runtime_error (naming the missing id) when there is none.
relationship workbook::get_relationship(const std::string &id) const
{
    for(auto &rel : d_->relationships_)
    {
        if(rel.get_id() == id)
        {
            return rel;
        }
    }

    // The exception used to carry an empty message, which made failures
    // impossible to diagnose from what() alone.
    throw std::runtime_error("relationship not found: " + id);
}
2014-05-21 22:20:30 +08:00
/// Erases the first sheet of this workbook that compares equal to `ws`.
/// Throws std::runtime_error when no such sheet exists. The relationship
/// list is not modified here.
void workbook::remove_sheet(worksheet ws)
{
    auto &sheets = d_->worksheets_;

    for(auto position = sheets.begin(); position != sheets.end(); ++position)
    {
        if(worksheet(&*position) == ws)
        {
            sheets.erase(position);
            return;
        }
    }

    throw std::runtime_error("worksheet not owned by this workbook");
}
/// Creates a new default-titled sheet and places it at position `index`;
/// sheets at `index` and beyond move one position back and keep their
/// relative order. Returns a handle to the new sheet.
///
/// Throws std::runtime_error if `index` is greater than the current number of
/// sheets.
worksheet workbook::create_sheet(std::size_t index)
{
    // Validate before mutating so a bad index leaves the workbook untouched.
    if(index > d_->worksheets_.size())
    {
        throw std::runtime_error("sheet index out of range");
    }

    create_sheet();

    // The new sheet sits at the back; rotate it into place. The former
    // swap-then-pop_back sequence destroyed the sheet that occupied `index`.
    auto &sheets = d_->worksheets_;
    std::rotate(sheets.begin() + index, sheets.end() - 1, sheets.end());

    return worksheet(&sheets[index]);
}
/// Creates a sheet titled `title` at the position encoded in the target file
/// name of `rel` (as computed by index_from_ws_filename) and returns a handle
/// to it. No new relationship is registered.
///
/// Throws std::runtime_error when that position lies beyond the newly
/// appended sheet; previously this indexed past the end of the container.
///
/// NOTE(review): when the position is below the new sheet's slot, the sheet
/// previously stored there is overwritten and discarded (swap + pop_back) -
/// confirm that replacing is the intended behaviour.
worksheet workbook::create_sheet(const std::string &title, const relationship &rel)
{
    auto &sheets = d_->worksheets_;
    sheets.push_back(detail::worksheet_impl(this, title));

    const auto index = index_from_ws_filename(rel.get_target_uri());
    const std::size_t last = sheets.size() - 1;

    if(index > last)
    {
        // Undo the append so the workbook is unchanged on failure.
        sheets.pop_back();
        throw std::runtime_error("worksheet index out of range");
    }

    if(index != last)
    {
        std::swap(sheets.back(), sheets[index]);
        sheets.pop_back();
    }

    return worksheet(&sheets[index]);
}
2014-05-21 22:20:30 +08:00
/// Creates a sheet at position `index` via the index overload, then sets its
/// title to `title`. Returns a handle to the new sheet.
worksheet workbook::create_sheet(std::size_t index, const std::string &title)
{
    auto created = create_sheet(index);
    created.set_title(title);

    return created;
}
/// Appends a new sheet titled `title`.
///
/// Throws sheet_title_exception when the title is longer than 31 characters
/// or contains any of * : / \ ? [ ]. If a sheet with that title already
/// exists, the decimal suffixes 1, 2, 3, ... are appended to `title` until an
/// unused title is found.
worksheet workbook::create_sheet(const std::string &title)
{
    const bool too_long = title.length() > 31;
    const bool has_forbidden_character = title.find_first_of("*:/\\?[]") != std::string::npos;

    if(too_long || has_forbidden_character)
    {
        throw sheet_title_exception(title);
    }

    auto &sheets = d_->worksheets_;
    auto title_in_use = [&sheets](const std::string &candidate)
    {
        return std::find_if(sheets.begin(), sheets.end(),
            [&candidate](detail::worksheet_impl &impl) { return worksheet(&impl).get_title() == candidate; })
            != sheets.end();
    };

    std::string unique_title = title;

    for(std::size_t suffix = 1; title_in_use(unique_title); ++suffix)
    {
        unique_title = title + std::to_string(suffix);
    }

    auto created = create_sheet();
    created.set_title(unique_title);

    return created;
}
/// Returns an iterator positioned at the first sheet (index 0).
workbook::iterator workbook::begin()
{
    const std::size_t first_index = 0;
    return iterator(*this, first_index);
}
/// Returns an iterator positioned one past the last sheet.
workbook::iterator workbook::end()
{
    const std::size_t sheet_count = d_->worksheets_.size();
    return iterator(*this, sheet_count);
}
/// Returns a read-only iterator positioned at the first sheet (index 0).
workbook::const_iterator workbook::cbegin() const
{
    const std::size_t first_index = 0;
    return const_iterator(*this, first_index);
}
/// Returns a read-only iterator positioned one past the last sheet.
workbook::const_iterator workbook::cend() const
{
    const std::size_t sheet_count = d_->worksheets_.size();
    return const_iterator(*this, sheet_count);
}
/// Returns the titles of all sheets, in iteration order.
std::vector<std::string> workbook::get_sheet_names() const
{
    std::vector<std::string> titles;

    for(auto sheet : *this)
    {
        titles.push_back(sheet.get_title());
    }

    return titles;
}
/// Looks a sheet up by title; equivalent to get_sheet_by_name(name).
worksheet workbook::operator[](const std::string &name)
{
    worksheet found = get_sheet_by_name(name);
    return found;
}
2014-06-11 05:12:15 +08:00
/// Returns a handle to the sheet stored at `index`.
/// The index is not range-checked here (plain subscript access).
worksheet workbook::operator[](std::size_t index)
{
    auto &impl = d_->worksheets_[index];
    return worksheet(&impl);
}
void workbook::clear()
{
d_->worksheets_.clear();
2014-07-20 02:43:48 +08:00
d_->relationships_.clear();
d_->active_sheet_index_ = 0;
d_->drawings_.clear();
2014-07-20 04:59:05 +08:00
d_->properties_ = document_properties();
2014-05-21 22:20:30 +08:00
}
2014-06-05 06:42:17 +08:00
bool workbook::save(std::vector<unsigned char> &data)
{
2014-06-11 05:12:15 +08:00
auto temp_file = CreateTemporaryFilename();
save(temp_file);
std::ifstream tmp;
tmp.open(temp_file, std::ios::in | std::ios::binary);
auto char_data = std::vector<char>((std::istreambuf_iterator<char>(tmp)),
std::istreambuf_iterator<char>());
data = std::vector<unsigned char>(char_data.begin(), char_data.end());
tmp.close();
std::remove(temp_file.c_str());
return true;
2014-06-05 06:42:17 +08:00
}
bool workbook::save(const std::string &filename)
2014-05-21 22:20:30 +08:00
{
2014-08-01 21:44:21 +08:00
zip_file f;
2014-08-01 21:44:21 +08:00
f.writestr("[Content_Types].xml", writer::write_content_types(*this));
2014-05-21 22:20:30 +08:00
2014-08-01 21:44:21 +08:00
f.writestr("docProps/app.xml", writer::write_properties_app(*this));
f.writestr("docProps/core.xml", writer::write_properties_core(get_properties()));
std::set<std::string> shared_strings_set;
for(auto ws : *this)
{
for(auto row : ws.rows())
{
for(auto cell : row)
{
if(cell.get_value().is(value::type::string))
{
shared_strings_set.insert(cell.get_value().get<std::string>());
}
}
}
}
std::vector<std::string> shared_strings(shared_strings_set.begin(), shared_strings_set.end());
2014-08-01 21:44:21 +08:00
f.writestr("xl/sharedStrings.xml", writer::write_shared_strings(shared_strings));
2014-08-01 21:44:21 +08:00
f.writestr("xl/theme/theme1.xml", writer::write_theme());
f.writestr("xl/styles.xml", style_writer(*this).write_table());
2014-08-01 21:44:21 +08:00
f.writestr("_rels/.rels", writer::write_root_rels());
f.writestr("xl/_rels/workbook.xml.rels", writer::write_workbook_rels(*this));
2014-08-01 21:44:21 +08:00
f.writestr("xl/workbook.xml", writer::write_workbook(*this));
2014-07-20 02:43:48 +08:00
for(auto relationship : d_->relationships_)
{
if(relationship.get_type() == relationship::type::worksheet)
{
auto sheet_index = index_from_ws_filename(relationship.get_target_uri());
auto ws = get_sheet_by_index(sheet_index);
f.writestr(relationship.get_target_uri(), writer::write_worksheet(ws, shared_strings));
2014-07-20 02:43:48 +08:00
}
}
2014-06-05 06:42:17 +08:00
2014-08-02 04:46:54 +08:00
f.save(filename);
2014-06-05 06:42:17 +08:00
return true;
2014-05-21 22:20:30 +08:00
}
2014-07-20 04:59:05 +08:00
/// A workbook compares equal to nullptr when it holds no implementation object.
bool workbook::operator==(std::nullptr_t) const
{
    const bool has_no_state = (d_.get() == nullptr);
    return has_no_state;
}
2014-05-21 22:20:30 +08:00
/// Identity comparison: two workbooks are equal when they refer to the very
/// same implementation object (contents are not compared).
bool workbook::operator==(const workbook &rhs) const
{
    const auto *mine = d_.get();
    const auto *theirs = rhs.d_.get();

    return mine == theirs;
}
std::vector<relationship> xlnt::workbook::get_relationships() const
{
return d_->relationships_;
2014-05-22 07:17:56 +08:00
}
/// Builds the list of content-type entries for this workbook: the two
/// extension defaults ("xml", "rels"), the workbook part, one worksheet part
/// per sheet (sheet1.xml, sheet2.xml, ...), then theme, styles, shared
/// strings and the core/app document properties.
std::vector<content_type> xlnt::workbook::get_content_types() const
{
    std::vector<content_type> content_types;

    content_types.push_back({ true, "xml", "", "application/xml" });
    content_types.push_back({ true, "rels", "", "application/vnd.openxmlformats-package.relationships+xml" });
    content_types.push_back({ false, "", "/xl/workbook.xml", "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet.main+xml" });

    // Computed once: the loop condition used to rebuild the full vector of
    // sheet titles on every iteration just to read its size.
    const std::size_t sheet_count = get_sheet_names().size();

    for(std::size_t i = 0; i < sheet_count; i++)
    {
        content_types.push_back({false, "", "/xl/worksheets/sheet" + std::to_string(i + 1) + ".xml", "application/vnd.openxmlformats-officedocument.spreadsheetml.worksheet+xml"});
    }

    content_types.push_back({false, "", "/xl/theme/theme1.xml", "application/vnd.openxmlformats-officedocument.theme+xml"});
    content_types.push_back({false, "", "/xl/styles.xml", "application/vnd.openxmlformats-officedocument.spreadsheetml.styles+xml"});
    content_types.push_back({false, "", "/xl/sharedStrings.xml", "application/vnd.openxmlformats-officedocument.spreadsheetml.sharedStrings+xml"});
    content_types.push_back({false, "", "/docProps/core.xml", "application/vnd.openxmlformats-package.core-properties+xml"});
    content_types.push_back({false, "", "/docProps/app.xml", "application/vnd.openxmlformats-officedocument.extended-properties+xml"});

    return content_types;
}
2014-07-20 04:59:05 +08:00
/// Returns a mutable reference to this workbook's document properties.
document_properties &workbook::get_properties()
{
    auto &state = *d_;
    return state.properties_;
}
/// Returns a read-only reference to this workbook's document properties.
const document_properties &workbook::get_properties() const
{
    const auto &state = *d_;
    return state.properties_;
}
2014-07-24 08:51:28 +08:00
/// Exchanges the implementation objects of two workbooks and then re-points
/// every sheet at the workbook that now holds it.
void swap(workbook &left, workbook &right)
{
    using std::swap;
    swap(left.d_, right.d_);

    // After the exchange each sheet's parent must be the workbook it now
    // lives in.
    for(auto sheet : left)
    {
        sheet.set_parent(left);
    }

    for(auto sheet : right)
    {
        sheet.set_parent(right);
    }
}
2014-07-20 04:59:05 +08:00
2014-07-24 08:51:28 +08:00
/// Copy-and-swap assignment: `other` is taken by value, its state is swapped
/// into this workbook, and the previous state goes out of scope with `other`.
workbook &workbook::operator=(workbook other)
{
    swap(*this, other);

    return *this;
}
/// Move constructor: starts as a default workbook, then swaps state with
/// `other`, which is left holding that default state.
workbook::workbook(workbook &&other)
    : workbook()
{
    swap(*this, other);
}
/// Copy constructor: starts as a default workbook, copy-assigns the other
/// workbook's implementation object over it, then sets this workbook as the
/// parent of every copied sheet.
workbook::workbook(const workbook &other)
    : workbook()
{
    *d_ = *other.d_;

    for(auto sheet : *this)
    {
        sheet.set_parent(*this);
    }
}
2014-07-25 05:31:46 +08:00
/// Returns the stored data-only flag of this workbook.
bool workbook::get_data_only() const
{
    const bool data_only = d_->data_only_;
    return data_only;
}
/// Stores the data-only flag of this workbook.
void workbook::set_data_only(bool data_only)
{
    auto &state = *d_;
    state.data_only_ = data_only;
}
/// Extracts the zero-based sheet index from a worksheet part name such as
/// "xl/worksheets/sheet3.xml" (which yields 2).
///
/// Only the last path component is examined: everything from its first '.'
/// onwards is dropped, and the trailing run of decimal digits is parsed as a
/// one-based sheet number. A name without any '/' is accepted.
///
/// Throws std::invalid_argument (from std::stoi) when the name carries no
/// trailing digits, std::out_of_range when the number does not fit an int,
/// and std::runtime_error when the number is 0, which has no zero-based
/// equivalent.
std::size_t workbook::index_from_ws_filename(const std::string &ws_filename)
{
    // Isolate the file name so dots or digits in directory names cannot
    // influence the result.
    const auto last_slash = ws_filename.find_last_of('/');
    const std::size_t name_start = (last_slash == std::string::npos) ? 0 : last_slash + 1;

    const auto dot = ws_filename.find('.', name_start);
    const std::string stem = (dot == std::string::npos)
        ? ws_filename.substr(name_start)
        : ws_filename.substr(name_start, dot - name_start);

    // Walk back over the trailing digits; the bound check keeps an all-digit
    // stem from running off the front of the string.
    std::size_t first_digit = stem.size();

    while(first_digit > 0 && isdigit(static_cast<unsigned char>(stem[first_digit - 1])))
    {
        --first_digit;
    }

    const int sheet_number = std::stoi(stem.substr(first_digit));

    if(sheet_number < 1)
    {
        throw std::runtime_error("invalid worksheet filename: " + ws_filename);
    }

    return static_cast<std::size_t>(sheet_number - 1);
}
2014-06-19 03:12:44 +08:00
}