panda3d/panda/src/express/zipArchive.cxx

/**
 * PANDA 3D SOFTWARE
 * Copyright (c) Carnegie Mellon University.  All rights reserved.
 *
 * All use of this software is subject to the terms of the revised BSD
 * license.  You should have received a copy of this license along
 * with this source code in a file named "LICENSE."
 *
 * @file zipArchive.cxx
 * @author rdb
 * @date 2019-01-20
 */

#include "zipArchive.h"

#include "config_express.h"
#include "streamWriter.h"
#include "streamReader.h"
#include "datagram.h"
#include "zStream.h"
#include "encryptStream.h"
#include "virtualFileSystem.h"
#include "virtualFile.h"

#include <algorithm>
#include <iterator>
#include <time.h>

#include "openSSLWrapper.h"

using std::streamoff;
using std::streampos;
using std::streamsize;
using std::stringstream;
using std::string;

// 1980-01-01 00:00:00
static const time_t dos_epoch = 315532800;

/**
 *
 */
ZipArchive::
ZipArchive() :
  _read_filew(_read_file),
  _read_write_filew(_read_write_file)
{
  _read = nullptr;
  _write = nullptr;
  _owns_stream = false;
  _index_changed = false;
  _needs_repack = false;
  _record_timestamp = true;
}

/**
 *
 */
ZipArchive::
~ZipArchive() {
  close();
}

/**
 * Opens the named ZipArchive on disk for reading.  The ZipArchive index is read
 * in, and the list of subfiles becomes available; individual subfiles may
 * then be extracted or read, but the list of subfiles may not be modified.
 *
 * Also see the version of open_read() which accepts an istream.  Returns true
 * on success, false on failure.
 */
bool ZipArchive::
open_read(const Filename &filename) {
  close();
  Filename fname = filename;
  fname.set_binary();

  VirtualFileSystem *vfs = VirtualFileSystem::get_global_ptr();
  PT(VirtualFile) vfile = vfs->get_file(fname);
  if (vfile == nullptr) {
    return false;
  }
  std::istream *stream = vfile->open_read_file(false);
  if (stream == nullptr) {
    return false;
  }

  _read = new IStreamWrapper(stream, true);
  _owns_stream = true;
  _filename = filename;
  return read_index();
}

/**
 * Opens an anonymous ZipArchive for reading using an istream.  There must be
 * seek functionality via seekg() and tellg() on the istream.
 *
 * If owns_pointer is true, then the ZipArchive assumes ownership of the stream
 * pointer and will delete it when the ZIP file is closed, including if this
 * function returns false.
 *
 * The given stream must be seekable.
 */
bool ZipArchive::
open_read(IStreamWrapper *stream, bool owns_pointer) {
  close();
  _read = stream;
  _owns_stream = owns_pointer;
  return read_index();
}

/**
 * Opens the named ZipArchive on disk for writing.  If there already exists a
 * file by that name, it is truncated.  The ZipArchive is then prepared for
 * accepting a brand new set of subfiles, which will be written to the
 * indicated filename.  Individual subfiles may not be extracted or read.
 *
 * Also see the version of open_write() which accepts an ostream.  Returns
 * true on success, false on failure.
 */
bool ZipArchive::
open_write(const Filename &filename) {
  close();
  Filename fname = filename;
  fname.set_binary();
  if (!fname.open_write(_write_file, true)) {
    return false;
  }
  _write = &_write_file;
  _filename = filename;
  _index_start = 0;
  _file_end = 0;
  _index_changed = true;
  return true;
}

/**
 * Opens an anonymous ZipArchive for writing using an ostream.
 *
 * If owns_pointer is true, then the ZipArchive assumes ownership of the stream
 * pointer and will delete it when the ZIP file is closed, including if this
 * function returns false.
 */
bool ZipArchive::
open_write(std::ostream *stream, bool owns_pointer) {
  close();
  _write = stream;
  _owns_stream = owns_pointer;
  _write->seekp(0, ios::beg);
  _index_start = 0;
  _file_end = 0;
  _index_changed = true;
  return true;
}

/**
 * Opens the named ZipArchive on disk for reading and writing.  If there
 * already exists a file by that name, its index is read.  Subfiles may be
 * added or removed, and the resulting changes will be written to the named
 * file.
 *
 * Also see the version of open_read_write() which accepts an iostream.
 * Returns true on success, false on failure.
 */
bool ZipArchive::
open_read_write(const Filename &filename) {
  close();
  Filename fname = filename;
  fname.set_binary();
  bool exists = fname.exists();
  if (!fname.open_read_write(_read_write_file)) {
    return false;
  }
  _read = &_read_write_filew;
  _write = &_read_write_file;
  _filename = filename;

  if (exists) {
    return read_index();
  } else {
    _index_start = 0;
    _file_end = 0;
    _index_changed = true;
    return true;
  }
}

/**
 * Opens an anonymous ZipArchive for reading and writing using an iostream.
 * There must be seek functionality via seekg()/seekp() and tellg()/tellp() on
 * the iostream.
 *
 * If owns_pointer is true, then the ZipArchive assumes ownership of the stream
 * pointer and will delete it when the ZIP file is closed, including if this
 * function returns false.
 */
bool ZipArchive::
open_read_write(std::iostream *stream, bool owns_pointer) {
  close();

  // We don't support locking when opening a file in read-write mode, because
  // we don't bother with locking on write.  But we need to have an
  // IStreamWrapper to assign to the _read member, so we create one on-the-fly
  // here.
  _read = new StreamWrapper(stream, owns_pointer);
  _write = stream;
  _owns_stream = true;  // Because we own the StreamWrapper, above.
  _write->seekp(0, ios::beg);

  // Check whether the read stream is empty.
  stream->seekg(0, ios::end);
  if (stream->tellg() == (streampos)0) {
    // The read stream is empty, which is always valid.
    _index_changed = true;
    return true;
  }

  // The read stream is not empty, so we'd better have a valid ZipArchive.
  return read_index();
}

/**
 * Verifies the integrity of the contents of the ZIP archive.
 */
bool ZipArchive::
verify() {
  nassertr_always(is_read_valid(), false);

  _read->acquire();
  std::istream *read = _read->get_istream();

  bool passes = true;

  for (Subfile *subfile : _subfiles) {
    if (!subfile->read_header(*read) ||
        !subfile->verify_data(*read)) {
      passes = false;
    }
  }

  _read->release();
  return passes;
}

/**
 * Closes the ZipArchive if it is open.  All changes are flushed to disk, and
 * the file becomes invalid for further operations until the next call to
 * open().
 */
void ZipArchive::
close() {
  flush();

  if (_owns_stream) {
    // We prefer to delete the IStreamWrapper over the ostream, if possible.
    if (_read != nullptr) {
      // Only delete it if no SubStream is still referencing it.
      if (!_read->unref()) {
        delete _read;
      }
    } else if (_write != nullptr) {
      delete _write;
    }
  }

  _read = nullptr;
  _write = nullptr;
  _owns_stream = false;
  _index_start = 0;
  _file_end = 0;
  _index_changed = false;
  _needs_repack = false;

  _read_file.close();
  _write_file.close();
  _read_write_file.close();
  _filename = Filename();

  clear_subfiles();
}

/**
 * Adds a file on disk as a subfile to the ZipArchive.  The file named by
 * filename will be read and added to the ZipArchive immediately, but the index
 * will not be updated until you call flush().  If there already exists a
 * subfile with the indicated name, it is replaced without examining its
 * contents (but see also update_subfile).
 *
 * Returns the subfile name on success (it might have been modified slightly),
 * or empty string on failure.
 */
std::string ZipArchive::
add_subfile(const std::string &subfile_name, const Filename &filename,
            int compression_level) {
  nassertr(is_write_valid(), std::string());

#ifndef HAVE_ZLIB
  express_cat.warning()
    << "zlib not compiled in; unable to modify ZIP file.\n";
  return std::string();
#endif

  VirtualFileSystem *vfs = VirtualFileSystem::get_global_ptr();
  PT(VirtualFile) vfile = vfs->get_file(filename);
  if (vfile == nullptr) {
    return std::string();
  }

  std::istream *in = vfs->open_read_file(filename, false);
  if (in == nullptr) {
    return std::string();
  }

  std::string name = add_subfile(subfile_name, in, compression_level);
  vfs->close_read_file(in);
  return name;
}

/**
 * Adds a file from a stream as a subfile to the ZipArchive.  The indicated
 * istream will be read and its contents added to the end of the current ZIP
 * file immediately.
 *
 * Note that the istream must remain untouched and unused by any other code
 * until flush() is called.  At that time, the index of the ZIP archive will be
 * rewritten to the end of the file.
 *
 * Returns the subfile name on success (it might have been modified slightly),
 * or empty string on failure.
 */
std::string ZipArchive::
add_subfile(const std::string &subfile_name, std::istream *subfile_data,
            int compression_level) {
  nassertr(is_write_valid(), string());

#ifndef HAVE_ZLIB
  express_cat.warning()
    << "zlib not compiled in; unable to modify ZIP file.\n";
  return std::string();
#endif

  std::string name = standardize_subfile_name(subfile_name);
  if (!name.empty()) {
    Subfile *subfile = new Subfile(subfile_name, compression_level);

    // Write it straight away, overwriting the index at the end of the file.
    // This index will be rewritten at the next call to flush() or close().
    std::streampos fpos = _index_start;
    _write->seekp(fpos);

    if (!subfile->write_header(*_write, fpos)) {
      delete subfile;
      return "";
    }

    if (!subfile->write_data(*_write, subfile_data, fpos, compression_level)) {
      // Failed to write the data.
      delete subfile;
      return "";
    }

    if (fpos > _index_start) {
      _index_start = fpos;
    }
    add_new_subfile(subfile, compression_level);
  }

  return name;
}

/**
 * Adds a file on disk to the subfile.  If a subfile already exists with the
 * same name, its contents are compared byte-for-byte to the disk file, and it
 * is replaced only if it is different; otherwise, the ZIP file is left
 * unchanged.
 *
 * Either Filename:::set_binary() or set_text() must have been called
 * previously to specify the nature of the source file.  If set_text() was
 * called, the text flag will be set on the subfile.
 */
string ZipArchive::
update_subfile(const std::string &subfile_name, const Filename &filename,
               int compression_level) {
  nassertr(is_write_valid(), string());

#ifndef HAVE_ZLIB
  express_cat.warning()
    << "zlib not compiled in; unable to modify ZIP file.\n";
  return std::string();
#endif

  if (!filename.exists()) {
    return string();
  }
  std::string name = standardize_subfile_name(subfile_name);
  if (!name.empty()) {
    int index = find_subfile(name);
    if (index >= 0) {
      // The subfile already exists; compare it to the source file.
      if (compare_subfile(index, filename)) {
        // The files are identical; do nothing.
        return name;
      }
    }

    // The subfile does not already exist or it is different from the source
    // file.  Add the new source file.
    Subfile *subfile = new Subfile(name, compression_level);
    add_new_subfile(subfile, compression_level);
  }

  return name;
}

/**
 * Ensures that any changes made to the ZIP archive have been synchronized to
 * disk.  In particular, this causes the central directory to be rewritten at
 * the end of the file.
 *
 * This may result in a suboptimal packing in the ZIP file, especially if
 * existing files were changed or files were removed.  To guarantee that the
 * file is as compact as it can be, call repack() instead of flush().
 *
 * It is not necessary to call flush() explicitly unless you are concerned
 * about reading the recently-added subfiles immediately.
 *
 * Returns true on success, false on failure.
 */
bool ZipArchive::
flush() {
  if (!is_write_valid()) {
    return false;
  }

  nassertr(_write != nullptr, false);

  // First, mark out all of the removed subfiles.
  for (Subfile *subfile : _removed_subfiles) {
    delete subfile;
  }
  _removed_subfiles.clear();

  if (_index_changed) {
    std::streampos fpos = _index_start;
    _write->seekp(fpos);
    if (!write_index(*_write, fpos)) {
      express_cat.info()
        << "Unable to write updated central directory to ZIP archive " << _filename << ".\n";
      close();
      return false;
    }
    _index_changed = false;
  }

  _write->flush();
  return true;
}

/**
 * Forces a complete rewrite of the ZipArchive and all of its contents, so that
 * the files are tightly packed in the file without any gaps.  This is useful to
 * do after removing files, to ensure that the file size is minimized.
 *
 * It is only valid to call this if the ZipArchive was opened using
 * open_read_write() and an explicit filename, rather than an iostream.  Also,
 * we must have write permission to the directory containing the ZipArchive.
 *
 * Returns true on success, false on failure.
 */
bool ZipArchive::
repack() {
  nassertr(is_write_valid() && is_read_valid(), false);
  nassertr(!_filename.empty(), false);

  // First, we open a temporary filename to copy the ZipArchive to.
  Filename dirname = _filename.get_dirname();
  if (dirname.empty()) {
    dirname = ".";
  }
  Filename temp_filename = Filename::temporary(dirname, "ziptemp");
  temp_filename.set_binary();
  pofstream temp;
  if (!temp_filename.open_write(temp)) {
    express_cat.info()
      << "Unable to open temporary file " << temp_filename << "\n";
    return false;
  }

  // Now we scrub our internal structures so it looks like we're a brand new
  // ZipArchive.
  for (Subfile *subfile : _removed_subfiles) {
    delete subfile;
  }
  _removed_subfiles.clear();

  // And we write our contents to our new temporary file.
  //_write = &temp;

  bool success = true;

  _read->acquire();
  std::istream &read = *_read->get_istream();

  // Copy over all of the subfiles.
  std::streampos fpos = 0;

  for (Subfile *subfile : _subfiles) {
    if (!subfile->read_header(read)) {
      success = false;
      continue;
    }

    // We don't need to write a data descriptor, since at this point we know
    // the checksum and sizes.
    subfile->_flags &= ~SF_data_descriptor;

    if (!subfile->write_header(temp, fpos)) {
      success = false;
      continue;
    }

    static const size_t buffer_size = 4096;
    char buffer[buffer_size];
    uint64_t num_bytes = subfile->_data_length;
    fpos += num_bytes;

    while (num_bytes >= buffer_size) {
      read.read(buffer, buffer_size);
      temp.write(buffer, buffer_size);
      num_bytes -= buffer_size;
    }
    if (num_bytes > 0) {
      read.read(buffer, num_bytes);
      temp.write(buffer, num_bytes);
    }
  }
  _read->release();

  // Write the central directory at the end of the file.
  success = success && write_index(temp, fpos);

  if (!success) {
    express_cat.error()
      << "Failed to write repacked archive to " << temp_filename << ".\n";
    temp.close();
    temp_filename.unlink();
    return false;
  }

  // Now close everything, and move the temporary file back over our original
  // file.
  Filename orig_name = _filename;
  temp.close();
  close();
  orig_name.unlink();
  if (!temp_filename.rename_to(orig_name)) {
    express_cat.info()
      << "Unable to rename temporary file " << temp_filename << " to "
      << orig_name << ".\n";
    return false;
  }

  if (!open_read_write(orig_name)) {
    express_cat.info()
      << "Unable to read newly repacked " << _filename
      << ".\n";
    return false;
  }

  return true;
}

/**
 * Returns the number of subfiles within the ZipArchive.  The subfiles may be
 * accessed in alphabetical order by iterating through [0 ..
 * get_num_subfiles()).
 */
int ZipArchive::
get_num_subfiles() const {
  return _subfiles.size();
}

/**
 * Returns the index of the subfile with the indicated name, or -1 if the
 * named subfile is not within the ZipArchive.
 */
int ZipArchive::
find_subfile(const std::string &subfile_name) const {
  Subfile find_subfile;
  find_subfile._name = standardize_subfile_name(subfile_name);
  Subfiles::const_iterator fi;
  fi = _subfiles.find(&find_subfile);
  if (fi == _subfiles.end()) {
    // Not present.
    return -1;
  }
  return (fi - _subfiles.begin());
}

/**
 * Returns true if the indicated subfile name is the directory prefix to one
 * or more files within the ZipArchive.  That is, the ZipArchive contains at
 * least one file named "subfile_name/...".
 */
bool ZipArchive::
has_directory(const std::string &subfile_name) const {
  string prefix = subfile_name;
  if (!prefix.empty()) {
    prefix += '/';
  }
  Subfile find_subfile;
  find_subfile._name = prefix;
  Subfiles::const_iterator fi;
  fi = _subfiles.upper_bound(&find_subfile);
  if (fi == _subfiles.end()) {
    // Not present.
    return false;
  }

  // At least one subfile exists whose name sorts after prefix.  If it
  // contains prefix as the initial substring, then we have a match.
  Subfile *subfile = (*fi);
  return (subfile->_name.length() > prefix.length() &&
          subfile->_name.substr(0, prefix.length()) == prefix);
}

/**
 * Considers subfile_name to be the name of a subdirectory within the
 * ZipArchive, but not a file itself; fills the given vector up with the sorted
 * list of subdirectories or files within the named directory.
 *
 * Note that directories do not exist explicitly within a ZipArchive; this just
 * checks for the existence of files with the given initial prefix.
 *
 * Returns true if successful, false otherwise.
 */
bool ZipArchive::
scan_directory(vector_string &contents, const std::string &subfile_name) const {
  string prefix = subfile_name;
  if (!prefix.empty()) {
    prefix += '/';
  }
  Subfile find_subfile;
  find_subfile._name = prefix;
  Subfiles::const_iterator fi;
  fi = _subfiles.upper_bound(&find_subfile);

  string previous = "";
  while (fi != _subfiles.end()) {
    Subfile *subfile = (*fi);
    if (!(subfile->_name.length() > prefix.length() &&
          subfile->_name.substr(0, prefix.length()) == prefix)) {
      // We've reached the end of the list of subfiles beneath the indicated
      // directory prefix.
      return true;
    }

    size_t slash = subfile->_name.find('/', prefix.length());
    string basename = subfile->_name.substr(prefix.length(), slash - prefix.length());
    if (basename != previous) {
      contents.push_back(basename);
      previous = basename;
    }
    ++fi;
  }

  return true;
}

/**
 * Removes the nth subfile from the ZipArchive.  This will cause all subsequent
 * index numbers to decrease by one.  The file will not actually be removed
 * from the disk until the next call to flush().
 *
 * Note that this does not actually remove the data from the indicated
 * subfile; it simply removes it from the index.  The ZipArchive will not be
 * reduced in size after this operation, until the next call to repack().
 */
void ZipArchive::
remove_subfile(int index) {
  nassertv(is_write_valid());
  nassertv(index >= 0 && index < (int)_subfiles.size());
  Subfile *subfile = _subfiles[index];
  //subfile->_flags |= SF_deleted;
  _removed_subfiles.push_back(subfile);
  _subfiles.erase(_subfiles.begin() + index);

  // We'll need to rewrite the index to remove it.  The packing is also
  // suboptimal now, so a repack would be good.
  _index_changed = true;
  _needs_repack = true;
}

/**
 * Returns the name of the nth subfile.
 */
const string &ZipArchive::
get_subfile_name(int index) const {
#ifndef NDEBUG
  static string empty_string;
  nassertr(index >= 0 && index < (int)_subfiles.size(), empty_string);
#endif
  return _subfiles[index]->_name;
}

/**
 * Returns the uncompressed data length of the nth subfile.
 */
size_t ZipArchive::
get_subfile_length(int index) const {
  nassertr(index >= 0 && index < (int)_subfiles.size(), 0);
  return _subfiles[index]->_uncompressed_length;
}

/**
 * Returns the modification time of the nth subfile.  If this is called on an
 * older .zip file, which did not store individual timestamps in the file (or
 * if get_record_timestamp() is false), this will return the modification time
 * of the overall ZIP file.
 */
time_t ZipArchive::
get_subfile_timestamp(int index) const {
  nassertr(index >= 0 && index < (int)_subfiles.size(), 0);
  return _subfiles[index]->_timestamp;
}

/**
 * Returns true if the indicated subfile has been compressed when stored
 * within the archive, false otherwise.
 */
bool ZipArchive::
is_subfile_compressed(int index) const {
  nassertr(index >= 0 && index < (int)_subfiles.size(), false);
  return _subfiles[index]->is_compressed();
}

/**
 * Returns true if the indicated subfile has been encrypted when stored within
 * the archive, false otherwise.
 */
bool ZipArchive::
is_subfile_encrypted(int index) const {
  nassertr(index >= 0 && index < (int)_subfiles.size(), false);
  return _subfiles[index]->is_encrypted();
}

/**
 * Returns the starting byte position within the ZipArchive at which the
 * indicated subfile begins.  This may be used, with
 * get_subfile_internal_length(), for low-level access to the subfile, but
 * usually it is better to use open_read_subfile() instead (which
 * automatically decrypts and/or uncompresses the subfile data).
 */
streampos ZipArchive::
get_subfile_internal_start(int index) const {
  nassertr(index >= 0 && index < (int)_subfiles.size(), 0);
  _read->acquire();
  _subfiles[index]->read_header(*_read->get_istream());
  std::streampos data_start = _read->get_istream()->tellg();
  _read->release();
  return data_start;
}

/**
 * Returns the number of bytes the indicated subfile consumes within the
 * archive.  For compressed subfiles, this will generally be smaller than
 * get_subfile_length(); for encrypted (but noncompressed) subfiles, it may be
 * slightly different, for noncompressed and nonencrypted subfiles, it will be
 * equal.
 */
size_t ZipArchive::
get_subfile_internal_length(int index) const {
  nassertr(index >= 0 && index < (int)_subfiles.size(), 0);
  return _subfiles[index]->_data_length;
}

/**
 * Returns an istream that may be used to read the indicated subfile.  You may
 * seek() within this istream to your heart's content; even though it will be
 * a reference to the already-opened pfstream of the ZipArchive itself, byte 0
 * appears to be the beginning of the subfile and EOF appears to be the end of
 * the subfile.
 *
 * The returned istream will have been allocated via new; you should pass the
 * pointer to close_read_subfile() when you are finished with it to delete it
 * and release its resources.
 *
 * Any future calls to repack() or close() (or the ZipArchive destructor) will
 * invalidate all currently open subfile pointers.
 *
 * The return value will be NULL if the stream cannot be opened for some
 * reason.
 */
std::istream *ZipArchive::
open_read_subfile(int index) {
  nassertr(is_read_valid(), nullptr);
  nassertr(index >= 0 && index < (int)_subfiles.size(), nullptr);
  Subfile *subfile = _subfiles[index];

  return open_read_subfile(subfile);
}

/**
 * Closes a file opened by a previous call to open_read_subfile().  This
 * really just deletes the istream pointer, but it is recommended to use this
 * interface instead of deleting it explicitly, to help work around compiler
 * issues.
 */
void ZipArchive::
close_read_subfile(std::istream *stream) {
  if (stream != nullptr) {
    // For some reason--compiler bug in gcc 3.2?--explicitly deleting the
    // stream pointer does not call the appropriate global delete function;
    // instead apparently calling the system delete function.  So we call the
    // delete function by hand instead.
#if !defined(WIN32_VC) && !defined(USE_MEMORY_NOWRAPPERS) && defined(REDEFINE_GLOBAL_OPERATOR_NEW)
    stream->~istream();
    (*global_operator_delete)(stream);
#else
    delete stream;
#endif
  }
}

/**
 * Extracts the nth subfile into a file with the given name.
 */
bool ZipArchive::
extract_subfile(int index, const Filename &filename) {
  nassertr(is_read_valid(), false);
  nassertr(index >= 0 && index < (int)_subfiles.size(), false);

  filename.make_dir();

  Filename fname = filename;
  if (!filename.is_text()) {
    fname.set_binary();
  }

  pofstream out;
  if (!fname.open_write(out, true)) {
    express_cat.info()
      << "Unable to write to file " << filename << "\n";
    return false;
  }

  return extract_subfile_to(index, out);
}

/**
 * Extracts the nth subfile to the indicated ostream.
 */
bool ZipArchive::
extract_subfile_to(int index, std::ostream &out) {
  nassertr(is_read_valid(), false);
  nassertr(index >= 0 && index < (int)_subfiles.size(), false);

  std::istream *in = open_read_subfile(index);
  if (in == nullptr) {
    return false;
  }

  static const size_t buffer_size = 4096;
  char buffer[buffer_size];

  in->read(buffer, buffer_size);
  size_t count = in->gcount();
  while (count != 0) {
    out.write(buffer, count);
    in->read(buffer, buffer_size);
    count = in->gcount();
  }

  bool failed = (in->fail() && !in->eof());
  close_read_subfile(in);
  nassertr(!failed, false);

  return (!out.fail());
}

/**
 * Performs a byte-for-byte comparison of the indicated file on disk with the
 * nth subfile.  Returns true if the files are equivalent, or false if they
 * are different (or the file is missing).
 *
 * If Filename::set_binary() or set_text() has already been called, it
 * specifies the nature of the source file.  If this is different from the
 * text flag of the subfile, the comparison will always return false.  If this
 * has not been specified, it will be set from the text flag of the subfile.
 */
bool ZipArchive::
compare_subfile(int index, const Filename &filename) {
  nassertr(is_read_valid(), false);
  nassertr(index >= 0 && index < (int)_subfiles.size(), false);

  if (!filename.exists()) {
    express_cat.info()
      << "File is missing: " << filename << "\n";
    return false;
  }

  std::istream *in1 = open_read_subfile(index);
  if (in1 == nullptr) {
    return false;
  }

  pifstream in2;

  if (!filename.open_read(in2)) {
    express_cat.info()
      << "Cannot read " << filename << "\n";
    return false;
  }

  if (filename.is_binary()) {
    // Check the file size.
    in2.seekg(0, ios::end);
    streampos file_size = in2.tellg();

    if (file_size != (streampos)get_subfile_length(index)) {
      // The files have different sizes.
      close_read_subfile(in1);
      return false;
    }
  }

  // Check the file data, byte-for-byte.
  in2.seekg(0);
  int byte1 = in1->get();
  int byte2 = in2.get();
  while (!in1->fail() && !in2.fail()) {
    if (byte1 != byte2) {
      close_read_subfile(in1);
      return false;
    }
    byte1 = in1->get();
    byte2 = in2.get();
  }

  bool failed = (in1->fail() && !in1->eof()) || (in2.fail() && !in2.eof());
  close_read_subfile(in1);

  nassertr(!failed, false);

  return true;
}

/**
 *
 */
void ZipArchive::
output(std::ostream &out) const {
  out << "ZipArchive " << _filename << ", " << get_num_subfiles()
      << " subfiles.\n";
}

/**
 * Shows a list of all subfiles within the ZipArchive.
 */
void ZipArchive::
ls(std::ostream &out) const {
  int num_subfiles = get_num_subfiles();
  for (int i = 0; i < num_subfiles; i++) {
    string subfile_name = get_subfile_name(i);
    out << subfile_name << "\n";
  }
}

/**
 * Sets the string which is appended to the very end of the ZIP archive.
 * This string may not be longer than 65535 characters.
 */
void ZipArchive::
set_comment(const std::string &comment) {
  nassertv(comment.size() <= 65535);

  if (_comment != comment) {
    _comment = comment;
    _index_changed = true;
  }
}

/**
 * Fills a string with the entire contents of the indicated subfile.
 */
bool ZipArchive::
read_subfile(int index, string &result) {
  result = string();

  // We use a temporary pvector, because dynamic accumulation of a pvector
  // seems to be many times faster than that of a string, at least on the
  // Windows implementation of STL.
  vector_uchar pv;
  if (!read_subfile(index, pv)) {
    return false;
  }

  if (!pv.empty()) {
    result.append((const char *)&pv[0], pv.size());
  }

  return true;
}

/**
 * Fills a pvector with the entire contents of the indicated subfile.
 */
bool ZipArchive::
read_subfile(int index, vector_uchar &result) {
  nassertr(is_read_valid(), false);
  nassertr(index >= 0 && index < (int)_subfiles.size(), false);
  result.clear();

  // Now look up the particular Subfile we are reading.
  nassertr(is_read_valid(), false);
  nassertr(index >= 0 && index < (int)_subfiles.size(), false);
  Subfile *subfile = _subfiles[index];

  result.reserve(subfile->_uncompressed_length);

  bool success = true;
  if (subfile->is_compressed() || subfile->is_encrypted()) {
    // If the subfile is encrypted or compressed, we can't read it directly.
    // Fall back to the generic implementation.
    std::istream *in = open_read_subfile(index);
    if (in == nullptr) {
      return false;
    }

    success = VirtualFile::simple_read_file(in, result);
    close_read_subfile(in);

  } else {
    // But if the subfile is just a plain file, we can just read the data
    // directly from the ZipArchive, without paying the cost of an ISubStream.
    static const size_t buffer_size = 4096;
    char buffer[buffer_size];

    _read->acquire();
    if (!subfile->read_header(*_read->get_istream())) {
      _read->release();
      express_cat.error()
        << "Failed to read local header of "
        << _filename << "/" << subfile->_name << "\n";
      return false;
    }
    std::istream &read = *_read->get_istream();
    /*std::streampos data_start =*/ read.tellg();

    size_t bytes_to_go = subfile->_uncompressed_length;
    read.read(buffer, std::min(bytes_to_go, buffer_size));
    size_t read_bytes = read.gcount();

    while (read_bytes > 0) {
      result.insert(result.end(), buffer, buffer + read_bytes);

      bytes_to_go -= read_bytes;
      if (bytes_to_go == 0) {
        break;
      }

      read.read(buffer, std::min(bytes_to_go, buffer_size));
      read_bytes = read.gcount();
    }

    _read->release();
    success = (bytes_to_go == 0);
  }

  if (!success) {
    std::ostringstream message;
    message << "I/O error reading from " << get_filename() << " at "
            << get_subfile_name(index);
    nassert_raise(message.str());
    return false;
  }

  return true;
}

/**
 * Adds a newly-allocated Subfile pointer to the ZipArchive.
 */
void ZipArchive::
add_new_subfile(Subfile *subfile, int compression_level) {
  // We'll need to rewrite the index after this.
  _index_changed = true;

  std::pair<Subfiles::iterator, bool> insert_result = _subfiles.insert(subfile);
  if (!insert_result.second) {
    // Hmm, unable to insert.  There must already be a subfile by that name.
    // Add it to the _removed_subfiles list, so we can remove the old one.
    std::swap(subfile, *insert_result.first);
    _removed_subfiles.push_back(subfile);

    // Since we're removing a subfile and adding the new one at the end, we've
    // got empty space.  A repack would be good.
    _needs_repack = true;
  }
}

/**
 * This variant of open_read_subfile() is used internally only, and accepts a
 * pointer to the internal Subfile object, which is assumed to be valid and
 * written to the multifile.
 */
std::istream *ZipArchive::
open_read_subfile(Subfile *subfile) {
  // Read the header first.
  _read->acquire();
  if (!subfile->read_header(*_read->get_istream())) {
    _read->release();
    express_cat.error()
      << "Failed to read local header of "
      << _filename << "/" << subfile->_name << "\n";
    return nullptr;
  }
  std::streampos data_start = _read->get_istream()->tellg();
  _read->release();

  // Return an ISubStream object that references into the open ZipArchive
  // istream.
  nassertr(data_start != (streampos)0, nullptr);
  std::istream *stream =
    new ISubStream(_read, data_start,
                   data_start + (streampos)subfile->_data_length);

  if (subfile->is_compressed()) {
#ifndef HAVE_ZLIB
    express_cat.error()
      << "zlib not compiled in; cannot read compressed multifiles.\n";
    return nullptr;
#else  // HAVE_ZLIB
    // Oops, the subfile is compressed.  So actually, return an
    // IDecompressStream that wraps around the ISubStream.
    IDecompressStream *wrapper = new IDecompressStream(stream, true, -1, false);
    stream = wrapper;
#endif  // HAVE_ZLIB
  }

  if (stream->fail()) {
    // Hmm, some inexplicable problem.
    delete stream;
    return nullptr;
  }

  return stream;
}

/**
 * Returns the standard form of the subfile name.
 */
string ZipArchive::
standardize_subfile_name(const std::string &subfile_name) const {
  Filename name = subfile_name;
  name.standardize();
  if (name.empty() || name == "/") {
    // Invalid empty name.
    return string();
  }

  if (name[0] == '/') {
    return name.get_fullpath().substr(1);
  } else if (name.length() > 2 && name[0] == '.' && name[1] == '/') {
    return name.get_fullpath().substr(2);
  } else {
    return name.get_fullpath();
  }
}

/**
 * Removes the set of subfiles from the tables and frees their associated
 * memory.
 */
void ZipArchive::
clear_subfiles() {
  for (Subfile *subfile : _removed_subfiles) {
    delete subfile;
  }
  _removed_subfiles.clear();

  for (Subfile *subfile : _subfiles) {
    delete subfile;
  }
  _subfiles.clear();
}

/**
 * Reads the ZipArchive header and index.  Returns true if successful, false if
 * the ZipArchive is not valid.
 *
 * Assumes that the get pointer is at the end of the file.
 */
bool ZipArchive::
read_index() {
  nassertr(_read != nullptr, false);

  // We acquire the IStreamWrapper lock for the duration of this method.
  _read->acquire();
  std::istream *read = _read->get_istream();

  // ZIP files need to be read from the end.
  read->seekg(-2, std::ios::end);
  if (read->fail()) {
    express_cat.info()
      << "Unable to seek ZIP archive " << _filename << ".\n";
    _read->release();
    close();
    return false;
  }

  std::streampos fpos = read->tellg();
  _file_end = fpos + (std::streamoff)2;

  uint64_t cdir_entries = 0;
  uint64_t cdir_offset = 0;
  uint64_t cdir_size = 0;
  uint32_t comment_length = 0;
  std::streampos eocd_offset = 0;
  bool found = false;

  // Seek backwards until we have found the the end-of-directory record.
  StreamReader reader(read, false);
  while (comment_length <= 0xffff && fpos >= 20) {
    if (reader.get_uint16() == comment_length) {
      // This field references the distance to the end of the .zip file, so it
      // could be the comment length field at the end of the record.  Skip to the
      // beginning of the record to see if the signature matches.
      read->seekg(-22, std::ios::cur);
      if (reader.get_uint32() == 0x06054b50) {
        // Yes, got it.
        eocd_offset = read->tellg() - (std::streamoff)4;
        reader.skip_bytes(6);
        cdir_entries = reader.get_uint16();
        cdir_size = reader.get_uint32();
        cdir_offset = reader.get_uint32();
        if (comment_length > 0) {
          _comment = reader.get_fixed_string(comment_length);
        } else {
          _comment.clear();
        }
        found = true;
        break;
      }
    }

    comment_length += 2;
    read->seekg(-2, std::ios::cur);
    fpos -= 2;
  }

  if (!found) {
    express_cat.info()
      << "Unable to find end-of-directory record in ZIP archive " << _filename << ".\n";
    _read->release();
    close();
    return false;
  }

  // Now look for a ZIP64 end-of-central-directory locator.
  if (eocd_offset >= 20) {
    uint64_t eocd64_offset = 0;
    read->seekg(eocd_offset - (std::streamoff)20);
    if (reader.get_uint32() == 0x07064b50) {
      reader.skip_bytes(4); // disk no
      eocd64_offset = reader.get_uint64();
      reader.skip_bytes(4); // disk count

      read->seekg(eocd64_offset);
      if (reader.get_uint32() == 0x06064b50) {
        reader.skip_bytes(20);
        cdir_entries = reader.get_uint64();
        cdir_size = reader.get_uint64();
        cdir_offset = reader.get_uint64();
      } else {
        express_cat.info()
          << "Unable to read ZIP64 end-of-directory record in ZIP archive "
          << _filename << ".\n";
      }
    }
  }

  _index_start = cdir_offset;

  // Find the central directory.
  read->seekg((std::streampos)cdir_offset);
  if (read->fail()) {
    express_cat.info()
      << "Unable to locate central directory in ZIP archive " << _filename << ".\n";
    _read->release();
    close();
    return false;
  }

  _record_timestamp = false;

  for (size_t i = 0; i < cdir_entries; ++i) {
    Subfile *subfile = new Subfile;
    if (!subfile->read_index(*read)) {
      express_cat.info()
        << "Failed to read central directory for " << _filename << ".\n";
      _read->release();
      close();
      return false;
    }

    if (subfile->_timestamp != dos_epoch) {
      // If all subfiles have the timestamp set to the DOS epoch, we apparently
      // don't care about preserving timestamps.
      _record_timestamp = true;
    }
    _subfiles.push_back(subfile);
  }

  // Sort the subfiles.
  size_t before_size = _subfiles.size();
  _subfiles.sort();
  size_t after_size = _subfiles.size();

  // If these don't match, the same filename appeared twice in the index,
  // which shouldn't be possible.
  nassertr(before_size == after_size, false);

  _read->release();
  return true;
}

/**
 * Writes the index of the ZIP archive at the current put position.
 */
bool ZipArchive::
write_index(std::ostream &write, std::streampos &fpos) {
  nassertr(write.tellp() == fpos, false);

  _index_start = fpos;

  for (Subfile *subfile : _subfiles) {
    if (!subfile->write_index(write, fpos)) {
      express_cat.info()
        << "Failed to write central directory entry for "
        << _filename << "/" << subfile->_name << ".\n";
      _read->release();
      close();
      return false;
    }
  }

  size_t cdir_entries = _subfiles.size();
  std::streamoff cdir_size = fpos - _index_start;

  StreamWriter writer(write);

  if (_index_start >= 0xffffffff ||
      cdir_size >= 0xffffffff ||
      cdir_entries >= 0xffff) {
    // Write a ZIP64 end-of-central-directory record.
    writer.add_uint32(0x06064b50);
    writer.add_uint64(44); // size of the rest of the record (w/o first 12 bytes)
    writer.add_uint16(45); // version number that produced this file
    writer.add_uint16(45); // version number needed to read this file
    writer.add_uint32(0);
    writer.add_uint32(0);
    writer.add_uint64(cdir_entries);
    writer.add_uint64(cdir_entries);
    writer.add_uint64(cdir_size);
    writer.add_uint64(_index_start);
    nassertr(write.tellp() == fpos + std::streamoff(12 + 44), false);

    // And write the ZIP64 end-of-central-directory-record locator.
    writer.add_uint32(0x07064b50);
    writer.add_uint32(0);
    writer.add_uint64(fpos);
    writer.add_uint32(1); // number of disks
  }

  // Write the end of central directory record.
  writer.add_uint32(0x06054b50);
  writer.add_uint16(0);
  writer.add_uint16(0);
  writer.add_uint16(std::min((size_t)0xffffu, cdir_entries));
  writer.add_uint16(std::min((size_t)0xffffu, cdir_entries));
  writer.add_uint32(std::min((std::streamoff)0xffffffffu, cdir_size));
  writer.add_uint32(std::min((std::streampos)0xffffffffu, _index_start));
  writer.add_uint16(_comment.size());
  writer.append_data(_comment);

  if (write.fail()) {
    express_cat.warning()
      << "Unable to write central directory for " << _filename << ".\n";
    close();
    return false;
  }

  fpos = write.tellp();
  if (fpos < _file_end) {
    // We didn't hit the end of the file writing the index.  This is a problem
    // because readers start looking for the EOCD record at the end of the file.
    // We'll have to shift the whole index forwards.  Unfortunately it's hard to
    // anticipate having to do this ahead of time.
    fpos = _index_start + (_file_end - fpos);
    _needs_repack = true;
    write.seekp(fpos);
    return write_index(write, fpos);
  }

  _file_end = fpos;
  return true;
}

/**
 * Creates a new subfile record.
 */
ZipArchive::Subfile::
Subfile(const std::string &name, int compression_level) :
  _name(name),
  _timestamp(dos_epoch),
  _compression_method((compression_level > 0) ? CM_deflate : CM_store)
{
  // If the name contains any non-ASCII characters, we set the UTF-8 flag.
  for (char c : name) {
    if (c & ~0x7f) {
      _flags |= SF_utf8_encoding;
      break;
    }
  }

  if (compression_level > 6) {
    _flags |= SF_deflate_best;
  } else if (compression_level > 1 && compression_level < 6) {
    _flags |= SF_deflate_fast;
  } else if (compression_level == 1) {
    _flags |= SF_deflate_fastest;
  }
}

/**
 * Reads the index record for the Subfile from the indicated istream.  Assumes
 * the istream has already been positioned to the indicated stream position,
 * fpos, the start of the index record.  Returns true on success.
 */
bool ZipArchive::Subfile::
read_index(std::istream &read) {
  StreamReader reader(read);

  if (reader.get_uint32() != 0x02014b50) {
    return false;
  }

  uint16_t version = reader.get_uint8();
  _system = reader.get_uint8();
  uint16_t min_version = reader.get_uint16();
  _flags = reader.get_uint16();
  _compression_method = (CompressionMethod)reader.get_uint16();
  {
    // Convert from DOS/FAT timestamp to UNIX timestamp.
    uint16_t mtime = reader.get_uint16();
    uint16_t mdate = reader.get_uint16();

    struct tm time = {};
    time.tm_sec  =  (mtime & 0b0000000000011111u) << 1;
    time.tm_min  =  (mtime & 0b0000011111100000u) >> 5;
    time.tm_hour =  (mtime & 0b1111100000000000u) >> 11;
    time.tm_mday =  (mdate & 0b0000000000011111u);
    time.tm_mon  = ((mdate & 0b0000000111100000u) >> 5) - 1;
    time.tm_year = ((mdate & 0b1111111000000000u) >> 9) + 80;
    time.tm_isdst = -1;
    _timestamp = mktime(&time);
  }
  _checksum = reader.get_uint32();
  _data_length = reader.get_uint32();
  _uncompressed_length = reader.get_uint32();
  size_t name_length = reader.get_uint16();
  size_t extra_length = reader.get_uint16();
  size_t comment_length = reader.get_uint16();
  /*size_t disk_number =*/ reader.get_uint16();
  _internal_attribs = reader.get_uint16();
  _external_attribs = reader.get_uint32();
  _header_start = (std::streampos)reader.get_uint32();

  std::string name = reader.get_fixed_string(name_length);

  // Read the extra fields, which may include a UNIX timestamp, which can be
  // specified with greater precision than a DOS timestamp.
  while (extra_length >= 4) {
    uint16_t const tag = reader.get_uint16();
    uint16_t const size = reader.get_uint16();
    if (tag == 0x0001) {
      // ZIP64 extended info.
      int size_left = size;
      if (_uncompressed_length == 0xffffffffu && size_left >= 8) {
        _uncompressed_length = reader.get_uint64();
        size_left -= 8;
      }
      if (_data_length == 0xffffffffu && size_left >= 8) {
        _data_length = reader.get_uint64();
        size_left -= 8;
      }
      if (_header_start == 0xffffffffu && size_left >= 8) {
        _header_start = reader.get_uint64();
        size_left -= 8;
      }
      reader.skip_bytes(size_left);
    } else if (tag == 0x5455 && size == 5) {
      reader.skip_bytes(1);
      _timestamp = reader.get_uint32();
    } else {
      reader.skip_bytes(size);
    }
    extra_length -= 4 + size;
  }
  // Skip leftover bytes in the extra field not large enough to contain a proper
  // extra tag.  This may be the case for Android .apk files processed with
  // zipalign, which uses this for alignment.
  reader.skip_bytes(extra_length);

  std::string comment = reader.get_fixed_string(comment_length);

  if (_flags & SF_utf8_encoding) {
    _name = std::move(name);
    _comment = std::move(comment);
  } else {
    _name = TextEncoder::reencode_text(name, TextEncoder::E_cp437, TextEncoder::E_utf8);
    _comment = TextEncoder::reencode_text(comment, TextEncoder::E_cp437, TextEncoder::E_utf8);
  }

  return true;
}

/**
 * Reads the header record for the Subfile from the indicated istream.
 */
bool ZipArchive::Subfile::
read_header(std::istream &read) {
  read.seekg(_header_start);
  if (read.fail()) {
    return false;
  }

  // First, get the next stream position.  We do this separately, because if
  // it is zero, we don't get anything else.
  StreamReader reader(read);

  uint32_t signature = reader.get_uint32();
  if (signature != 0x04034b50) {
    //0x02014b50
    express_cat.warning()
      << "ZIP subfile " << _name << " header does not contain expected signature\n";
    return false;
  }

  // We skip most of the stuff in the local file header, since most of this is
  // duplicated in the central directory.
  reader.get_uint16();
  int flags = reader.get_uint16();

  if (flags != _flags) {
    express_cat.warning()
      << "ZIP subfile " << _name << " flags mismatch between file header and index record\n";
  }
  _flags = flags;

  if (reader.get_uint16() != (uint16_t)_compression_method) {
    express_cat.warning()
      << "ZIP subfile " << _name << " compression method mismatch between file header and index record\n";
    return false;
  }

  reader.get_uint32();

  if (flags & SF_data_descriptor) {
    // Ignore these fields, the real values will follow the file.
    reader.skip_bytes(4 * 3);
  } else {
    if (reader.get_uint32() != _checksum) {
      express_cat.warning()
        << "ZIP subfile " << _name << " CRC32 mismatch between file header and index record\n";
      return false;
    }

    // Compressed and uncompressed size
    uint32_t data_length = reader.get_uint32();
    uint32_t uncompressed_length = reader.get_uint32();

    if ((data_length != 0xffffffffu && data_length != _data_length) ||
        (uncompressed_length != 0xffffffffu && uncompressed_length != _uncompressed_length)) {
      express_cat.warning()
        << "ZIP subfile " << _name << " length mismatch between file header and index record\n";
      return false;
    }
  }

  size_t name_length = reader.get_uint16();
  size_t extra_length = reader.get_uint16();

  std::string name = reader.get_fixed_string(name_length);
  if ((flags & SF_utf8_encoding) == 0) {
    name = TextEncoder::reencode_text(name, TextEncoder::E_cp437, TextEncoder::E_utf8);
  }

  if (extra_length < 4) {
    reader.skip_bytes(extra_length);
  } else if (extra_length > 0) {
    for (int i = 0; i < extra_length;) {
      size_t length = reader.get_uint16();
      i += 4;
      reader.skip_bytes(length);
      i += length;
    }
  }

  if (name != _name) {
    express_cat.warning()
      << "Name of ZIP subfile \"" << _name << "\" in index record does not match "
         "name in file header \"" << name << "\"\n";
    return false;
  }

  //_data_start = read.tellg();
  return true;
}

/**
 * Called after read_header to verify the integrity of the data.
 * If ZLib support is not enabled, this does not verify the checksum or the
 * compression.
 */
bool ZipArchive::Subfile::
verify_data(std::istream &read) {
  //nassertr(read.tellg() == _data_start, false);

  static const size_t buffer_size = 4096;
  char buffer[buffer_size];

#ifdef HAVE_ZLIB
  unsigned long crc = crc32(0L, Z_NULL, 0);
  IDecompressStream wrapper;

  std::istream *data_stream;
  if (_compression_method == CM_store) {
    data_stream = &read;
  }
  else if (_compression_method == CM_deflate) {
    wrapper.open(&read, false, _data_length, false);
    data_stream = &wrapper;
  }
  else {
    express_cat.warning()
      << "Unable to verify ZIP subfile \"" << _name << "\": compression method "
      << (int)_compression_method << " not supported.\n";
    return false;
  }

  size_t bytes_to_go = _uncompressed_length;
  data_stream->read(buffer, std::min(bytes_to_go, buffer_size));
  size_t read_bytes = data_stream->gcount();

  while (read_bytes > 0) {
    crc = crc32(crc, (unsigned char *)buffer, read_bytes);

    bytes_to_go -= read_bytes;
    if (bytes_to_go == 0) {
      break;
    }

    data_stream->read(buffer, std::min(bytes_to_go, buffer_size));
    read_bytes = data_stream->gcount();
  }

  if (data_stream == &wrapper) {
    wrapper.close();
  }

  if (bytes_to_go > 0) {
    express_cat.warning()
      << "Reached end of compressed data verifying ZIP subfile " << _name << ".\n";
    return false;
  }

  if (crc != _checksum) {
    express_cat.warning()
      << "ZIP file member " << _name << " is corrupted.\n";
    return false;
  }
#else
  read.ignore(_data_length);

  if (read.eof()) {
    express_cat.warning()
      << "Reached EOF verifying ZIP subfile " << _name << ".\n";
    return false;
  }
#endif

  // If we are expecting a data descriptor, verify that it matches what is in
  // the index entry.
  if (_flags & SF_data_descriptor) {
    StreamReader reader(read);
    uint32_t checksum = reader.get_uint32();
    if (checksum == 0x08074b50) {
      // There is an optional data descriptor signature.
      if (_checksum == 0x08074b50) {
        // The CRC32 happens to match the data descriptor signature by accident.
        // Since the data descriptor signature is optional, we can't know for
        // sure which is which, so let's just not bother validating this.
        return true;
      }
      checksum = reader.get_uint32();
    }
    uint32_t data_length = reader.get_uint32();
    uint32_t uncompressed_length = reader.get_uint32();
    if (checksum != _checksum ||
        data_length != _data_length ||
        uncompressed_length != _uncompressed_length) {
      express_cat.warning()
        << "ZIP file member " << _name << " has mismatched data descriptor.\n";
      return false;
    }
  }

  return true;
}

/**
 * Writes the index record for the Subfile to the indicated ostream.  Assumes
 * the istream has already been positioned to the indicated stream position,
 * fpos, the start of the index record, and that this is the effective end of
 * the file.  Returns true on success.
 *
 * The _index_start member is updated by this operation.
 */
bool ZipArchive::Subfile::
write_index(std::ostream &write, streampos &fpos) {
  nassertr(write.tellp() == fpos, false);

  StreamWriter writer(write);
  writer.add_uint32(0x02014b50);

  bool zip64_length =
    (_data_length >= 0xffffffffu || _uncompressed_length >= 0xffffffffu);
  bool zip64_offset = (_header_start >= 0xffffffffu);
  size_t extra_length = zip64_length * 16 + zip64_offset * 8;

  if (zip64_length || zip64_offset) {
    writer.add_uint8(45);
    writer.add_uint8(_system);
    writer.add_uint16((_flags & SF_strong_encryption) ? 50 : 45);
  } else {
    // We just write 2.0 if it we support DEFLATE compression, 1.0 otherwise.
#ifdef HAVE_ZLIB
    writer.add_uint8(20);
    writer.add_uint8(_system);
    writer.add_uint16((_flags & SF_strong_encryption) ? 50 : (is_compressed() ? 20 : 10));
#else
    writer.add_uint8(10);
    writer.add_uint8(_system);
    writer.add_uint16((_flags & SF_strong_encryption) ? 50 : 10);
#endif
  }

  writer.add_uint16(_flags);
  writer.add_uint16((uint16_t)_compression_method);

  if (_timestamp > dos_epoch) {
    // Convert from UNIX timestamp to DOS/FAT timestamp.
    struct tm *time = localtime(&_timestamp);
    writer.add_uint16((time->tm_sec >> 1)
                    | (time->tm_min << 5)
                    | (time->tm_hour << 11));
    writer.add_uint16(time->tm_mday
                    | ((time->tm_min + 1) << 5)
                    | ((time->tm_year - 1980) << 9));
  } else {
    // January 1, 1980
    writer.add_uint16(0);
    writer.add_uint16(33);
  }

  std::string encoded_name;
  std::string encoded_comment;
  if (_flags & SF_utf8_encoding) {
    encoded_name = _name;
    encoded_comment = _comment;
 } else {
    encoded_name = TextEncoder::reencode_text(_name, TextEncoder::E_utf8, TextEncoder::E_cp437);
    encoded_comment = TextEncoder::reencode_text(_comment, TextEncoder::E_utf8, TextEncoder::E_cp437);
  }

  writer.add_uint32(_checksum);
  if (zip64_length) {
    writer.add_uint32(0xffffffffu);
    writer.add_uint32(0xffffffffu);
  } else {
    writer.add_uint32(_data_length);
    writer.add_uint32(_uncompressed_length);
  }
  writer.add_uint16(encoded_name.size());
  writer.add_uint16(extra_length);
  writer.add_uint16(encoded_comment.size());
  writer.add_uint16(0); // disk number start
  writer.add_uint16(_internal_attribs);
  writer.add_uint32(_external_attribs);
  writer.add_uint32(zip64_offset ? 0xffffffffu : (uint32_t)_header_start);

  writer.append_data(encoded_name);

  // Write any extra fields.
  if (zip64_length || zip64_offset) {
    writer.add_uint16(0x0001);
    writer.add_uint16(zip64_length * 16 + zip64_offset * 8);
    if (zip64_length) {
      writer.add_uint64(_data_length);
      writer.add_uint64(_uncompressed_length);
    }
    if (zip64_offset) {
      writer.add_uint64(_header_start);
    }
  }

  writer.append_data(encoded_comment);

  fpos += 46 + extra_length + encoded_name.size() + encoded_comment.size();
  nassertr(write.tellp() == fpos, false);
  return !write.fail();
}

/**
 * Writes the local file header to the indicated ostream.  This immediately
 * precedes the data, so should be followed up by a call to write_data.
 *
 * Assumes that the file is currently positioned at the given fpos pointer, and
 * advances it by the amount of bytes written to the output (which may be longer
 * than the actual size of the subfile).
 */
bool ZipArchive::Subfile::
write_header(std::ostream &write, std::streampos &fpos) {
  nassertr(write.tellp() == fpos, false);

  std::string encoded_name;
  if (_flags & SF_utf8_encoding) {
    encoded_name = _name;
  } else {
    encoded_name = TextEncoder::reencode_text(_name, TextEncoder::E_utf8, TextEncoder::E_cp437);
  }

  std::streamoff header_size = 30 + encoded_name.size();

  StreamWriter writer(write);
  int modulo = (fpos + header_size) % 4;
  if (!is_compressed() && modulo != 0) {
    // Align uncompressed files to 4-byte boundary.  We don't really need to do
    // this, but it's needed when producing .apk files, and it doesn't really
    // cause harm to do it in other cases as well.
    writer.pad_bytes(4 - modulo);
    fpos += (4 - modulo);
  }

  _header_start = fpos;

  writer.add_uint32(0x04034b50);
  writer.add_uint16((_flags & SF_strong_encryption) ? 50 : (is_compressed() ? 20 : 10));

  writer.add_uint16(_flags);
  writer.add_uint16((uint16_t)_compression_method);

  if (_timestamp > 315532800) {
    // Convert from UNIX timestamp to DOS/FAT timestamp.
    struct tm *time = localtime(&_timestamp);
    writer.add_uint16((time->tm_sec >> 1)
                    | (time->tm_min << 5)
                    | (time->tm_hour << 11));
    writer.add_uint16(time->tm_mday
                    | ((time->tm_min + 1) << 5)
                    | ((time->tm_year - 1980) << 9));
  } else {
    // January 1, 1980
    writer.add_uint16(0);
    writer.add_uint16(33);
  }

  // This flag is set if we don't yet have the checksum or lengths.  We will
  // write a data descriptor after the actual data containing these values.
  if (_flags & SF_data_descriptor) {
    writer.add_uint32(0);
    writer.add_uint32(0);
    writer.add_uint32(0);
  } else {
    writer.add_uint32(_checksum);
    writer.add_uint32(_data_length);
    writer.add_uint32(_uncompressed_length);
  }

  writer.add_uint16(encoded_name.size());
  writer.add_uint16(0); // We don't write extras for now.
  writer.append_data(encoded_name);

  fpos += header_size;
  nassertr(write.tellp() == fpos, false);
  return !write.fail();
}

/**
 * Writes the data record for the Subfile to the indicated ostream: the actual
 * contents of the Subfile.  Assumes the istream has already been positioned
 * to the indicated stream position, fpos, the start of the data record, and
 * that this is the effective end of the file.  Returns the position within
 * the file of the next data record.
 *
 * The _data_start, _data_length, and _uncompressed_length members are updated
 * by this operation.
 *
 * If the "read" pointer is non-NULL, it is the readable istream of a
 * ZipArchive in which the Subfile might already be packed.  This is used for
 * reading the contents of the Subfile during a repack() operation.
 */
bool ZipArchive::Subfile::
write_data(std::ostream &write, std::istream *read, std::streampos &fpos, int compression_level) {
  nassertr(write.tellp() == fpos, false);

  if (!is_compressed()) {
    nassertr((fpos % 4) == 0, false);
  }

  //_data_start = fpos;

  std::ostream *putter = &write;
  bool delete_putter = false;

#ifndef HAVE_ZLIB
  // Without ZLIB, we can't support compression.  The flag had better not be
  // set.
  nassertr(!is_compressed(), false);
#else  // HAVE_ZLIB
  if (is_compressed()) {
    // Write it compressed.
    putter = new OCompressStream(putter, delete_putter, compression_level, false);
    delete_putter = true;
  }
#endif  // HAVE_ZLIB

  static const size_t buffer_size = 4096;
  char buffer[buffer_size];
  size_t total_count = 0;

#ifdef HAVE_ZLIB
  unsigned long crc = crc32(0L, Z_NULL, 0);
#endif

  read->read(buffer, buffer_size);
  size_t count = read->gcount();
  while (count != 0) {
#ifdef HAVE_ZLIB
    crc = crc32(crc, (unsigned char *)buffer, count);
#endif
    total_count += count;
    putter->write(buffer, count);
    read->read(buffer, buffer_size);
    count = read->gcount();
  }

  if (delete_putter) {
    delete putter;
  }

  if (is_compressed()) {
    std::streampos write_end = write.tellp();
    _data_length = (size_t)(write_end - fpos);
    fpos = write_end;
  } else {
    _data_length = total_count;
    fpos += total_count;
  }
  _uncompressed_length = total_count;
#ifdef HAVE_ZLIB
  _checksum = crc;
#endif

  //TODO: what if we need a zip64 data descriptor?
  if (_flags & SF_data_descriptor) {
    StreamWriter writer(write);
    writer.add_uint32(0x08074b50);
    writer.add_uint32(_checksum);
    writer.add_uint32(_data_length);
    writer.add_uint32(_uncompressed_length);
    fpos += 16;
  }

  nassertr(write.tellp() == fpos, false);
  return !write.fail();
}