#include "esmreader.hpp"

#include "readerscache.hpp"

// NOTE(review): the targets of the five includes below were lost when this
// file was extracted; they are reconstructed from the symbols used here
// (Files::openBinaryInputFileStream, Misc::StringUtils::ciEqual,
// boost::filesystem::path, std::stringstream, std::runtime_error).
// Confirm the project header paths against the build.
#include <components/files/openfile.hpp>
#include <components/misc/stringops.hpp>

#include <boost/filesystem/path.hpp>

#include <sstream>
#include <stdexcept>

namespace ESM
{

using namespace Misc;

// Returns a copy of the current reading context. The stored file position is
// refreshed from the stream first.
ESM_Context ESMReader::getContext()
{
    // Update the file position before returning
    mCtx.filePos = mEsm->tellg();
    return mCtx;
}

// Creates a reader with no open stream, a 50 KiB scratch buffer, no encoder
// and a cleared context whose index is 0.
ESMReader::ESMReader()
    : mRecordFlags(0)
    , mBuffer(50 * 1024)
    , mEncoder(nullptr)
    , mFileSize(0)
{
    clearCtx();
    mCtx.index = 0;
}

// Restores a context previously obtained from getContext(): reopens the file
// when the context names a different one, copies the context and seeks the
// stream to the stored position.
void ESMReader::restoreContext(const ESM_Context& rc)
{
    // Reopen the file if necessary
    if (mCtx.filename != rc.filename)
        openRaw(rc.filename);

    // Copy the data
    mCtx = rc;

    // Make sure we seek to the right place
    mEsm->seekg(mCtx.filePos);
}

// Releases the stream and resets the context and the header.
void ESMReader::close()
{
    mEsm.reset();
    clearCtx();
    mHeader.blank();
}

// Resets the file name, the remaining-byte counters, the cached-subrecord
// flag and the record/subrecord names. Other context fields (such as index)
// are left untouched.
void ESMReader::clearCtx()
{
    mCtx.filename.clear();
    mCtx.leftFile = 0;
    mCtx.leftRec = 0;
    mCtx.leftSub = 0;
    mCtx.subCached = false;
    mCtx.recName.clear();
    mCtx.subName.clear();
}

// Reads a string of `size` bytes. For header formats newer than 22 the
// length is instead read from the stream as a 32-bit value, which must not
// exceed the bytes left in the current subrecord (fail() is called
// otherwise).
std::string ESMReader::getMaybeFixedStringSize(std::size_t size)
{
    if (mHeader.mFormat > 22)
    {
        std::uint32_t storedSize = 0;
        getT(storedSize);
        if (storedSize > mCtx.leftSub)
            fail("String does not fit subrecord (" + std::to_string(storedSize) + " > "
                + std::to_string(mCtx.leftSub) + ")");
        size = static_cast<std::size_t>(storedSize);
    }

    return std::string(getStringView(size));
}

// Reads `size` bytes into the internal buffer and returns a view of them,
// cut at the first zero byte. When an encoder is set, the view returned is
// the encoder's UTF-8 conversion instead. The view refers to storage that
// is reused by later reads, so copy it if it must outlive the next call.
std::string_view ESMReader::getStringView(std::size_t size)
{
    if (mBuffer.size() <= size)
        // Add some extra padding to reduce the chance of having to resize
        // again later.
        mBuffer.resize(3 * size);

    // And make sure the string is zero terminated
    mBuffer[size] = 0;

    // read ESM data
    char* ptr = mBuffer.data();
    getExact(ptr, size);

    size = strnlen(ptr, size);

    // Convert to UTF8 and return
    if (mEncoder != nullptr)
        return mEncoder->getUtf8(std::string_view(ptr, size));

    return std::string_view(ptr, size);
}

// For every master file listed by getGameFiles(), looks for an earlier
// reader (index below this reader's own) whose file name matches
// case-insensitively and records its index in mCtx.parentFileIndices.
// When no match is found, this reader's own index is recorded instead.
void ESMReader::resolveParentFileIndices(ReadersCache& readers)
{
    mCtx.parentFileIndices.clear();
    for (const Header::MasterData& mast : getGameFiles())
    {
        const std::string& fname = mast.name;
        int index = getIndex();
        for (int i = 0; i < getIndex(); i++)
        {
            const ESM::ReadersCache::BusyItem reader = readers.get(static_cast<std::size_t>(i));
            if (reader->getFileSize() == 0)
                continue; // Content file in non-ESM format
            const std::string& candidate = reader->getName();
            std::string fnamecandidate = boost::filesystem::path(candidate).filename().string();
            if (Misc::StringUtils::ciEqual(fname, fnamecandidate))
            {
                index = i;
                break;
            }
        }
        mCtx.parentFileIndices.push_back(index);
    }
}

// Takes ownership of `stream`, records `name` as the file name and measures
// the stream size by seeking to its end and back. No header is parsed.
void ESMReader::openRaw(std::unique_ptr<std::istream>&& stream, std::string_view name)
{
    close();
    mEsm = std::move(stream);
    mCtx.filename = name;
    mEsm->seekg(0, mEsm->end);
    mCtx.leftFile = mFileSize = mEsm->tellg();
    mEsm->seekg(0, mEsm->beg);
}

// Opens `filename` as a binary input stream and hands it to the stream
// overload of openRaw().
void ESMReader::openRaw(std::string_view filename)
{
    openRaw(Files::openBinaryInputFileStream(std::string(filename)), filename);
}

// Opens the stream like openRaw(), then requires the first record to be
// named "TES3" (fail() otherwise) and loads the file header from it.
void ESMReader::open(std::unique_ptr<std::istream>&& stream, const std::string& name)
{
    openRaw(std::move(stream), name);

    if (getRecName() != "TES3")
        fail("Not a valid Morrowind file");

    getRecHeader();

    mHeader.load(*this);
}

// Opens `file` as a binary input stream and hands it to the stream overload
// of open().
void ESMReader::open(const std::string& file)
{
    open(Files::openBinaryInputFileStream(file), file);
}

// Reads the string of the next subrecord if it is named `name`; returns an
// empty string otherwise.
std::string ESMReader::getHNOString(NAME name)
{
    if (isNextSub(name))
        return getHString();
    return "";
}

// Skips the string of the next subrecord if it is named `name`.
void ESMReader::skipHNOString(NAME name)
{
    if (isNextSub(name))
        skipHString();
}

// Reads the string of the next subrecord, which must be named `name`
// (getSubNameIs() fails otherwise).
std::string ESMReader::getHNString(NAME name)
{
    getSubNameIs(name);
    return getHString();
}

// Reads the subrecord header and returns the subrecord contents as a string.
std::string ESMReader::getHString()
{
    getSubHeader();

    // Hack to make MultiMark.esp load. Zero-length strings do not
    // occur in any of the official mods, but MultiMark makes use of
    // them. For some reason, they break the rules, and contain a byte
    // (value 0) even if the header says there is no data. If
    // Morrowind accepts it, so should we.
    if (mCtx.leftSub == 0 && hasMoreSubs() && !mEsm->peek())
    {
        // Skip the following zero byte
        mCtx.leftRec--;
        char c;
        getT(c);
        return std::string();
    }

    return getString(mCtx.leftSub);
}

// Reads the subrecord header and skips the subrecord contents, applying the
// same zero-length workaround as getHString().
void ESMReader::skipHString()
{
    getSubHeader();

    // Hack to make MultiMark.esp load. Zero-length strings do not
    // occur in any of the official mods, but MultiMark makes use of
    // them. For some reason, they break the rules, and contain a byte
    // (value 0) even if the header says there is no data. If
    // Morrowind accepts it, so should we.
    if (mCtx.leftSub == 0 && hasMoreSubs() && !mEsm->peek())
    {
        // Skip the following zero byte
        mCtx.leftRec--;
        skipT<char>();
        return;
    }

    skip(mCtx.leftSub);
}

// Reads the subrecord header and then exactly `size` bytes into `p`. Reports
// a size mismatch when the subrecord size differs from `size`.
void ESMReader::getHExact(void* p, int size)
{
    getSubHeader();
    if (size != static_cast<int>(mCtx.leftSub))
        reportSubSizeMismatch(size, mCtx.leftSub);
    getExact(p, size);
}

// Read the given number of bytes from a named subrecord
void ESMReader::getHNExact(void* p, int size, NAME name)
{
    getSubNameIs(name);
    getHExact(p, size);
}

// Get the next subrecord name and check if it matches the parameter
void ESMReader::getSubNameIs(NAME name)
{
    getSubName();
    if (mCtx.subName != name)
        fail("Expected subrecord " + name.toString() + " but got " + mCtx.subName.toString());
}

// Returns true when the next subrecord is named `name`. Returns false when
// the record has no more subrecords or the name differs; in the latter case
// the name stays cached for the next reader.
bool ESMReader::isNextSub(NAME name)
{
    if (!hasMoreSubs())
        return false;

    getSubName();

    // If the name didn't match, then mark it as 'cached' so it's
    // available for the next call to getSubName.
    mCtx.subCached = (mCtx.subName != name);

    // If subCached is false, then subName == name.
    return !mCtx.subCached;
}

// Like isNextSub(), but always leaves the name cached, so the subrecord is
// not consumed even when it matches.
bool ESMReader::peekNextSub(NAME name)
{
    if (!hasMoreSubs())
        return false;

    getSubName();

    mCtx.subCached = true;
    return mCtx.subName == name;
}

// Read subrecord name. This gets called a LOT, so I've optimized it
// slightly.
void ESMReader::getSubName()
{
    // If the name has already been read, do nothing
    if (mCtx.subCached)
    {
        mCtx.subCached = false;
        return;
    }

    // No explicit bounds check here; presumably a short read is caught when
    // the subrecord data is read afterwards.
    const std::size_t subNameSize = decltype(mCtx.subName)::sCapacity;
    getExact(mCtx.subName.mData, static_cast<int>(subNameSize));
    mCtx.leftRec -= static_cast<std::uint32_t>(subNameSize);
}

// Reads the subrecord header and skips the subrecord contents.
void ESMReader::skipHSub()
{
    getSubHeader();
    skip(mCtx.leftSub);
}

// Skips a subrecord and reports a mismatch when its size differs from `size`.
// NOTE(review): the arguments to reportSubSizeMismatch are in the opposite
// order to the call in getHExact() — confirm against its declaration.
void ESMReader::skipHSubSize(int size)
{
    skipHSub();
    if (static_cast<int>(mCtx.leftSub) != size)
        reportSubSizeMismatch(mCtx.leftSub, size);
}

// Skips subrecords until one named `name` is next or the record is exhausted.
void ESMReader::skipHSubUntil(NAME name)
{
    while (hasMoreSubs() && !isNextSub(name))
    {
        // isNextSub() cached the non-matching name; drop the cache so that
        // skipHSub() continues with this subrecord's header.
        mCtx.subCached = false;
        skipHSub();
    }
    // Re-mark the current name as cached so that the next getSubName()
    // returns it again.
    if (hasMoreSubs())
        mCtx.subCached = true;
}

// Reads the size of the current subrecord into mCtx.leftSub and deducts both
// the size field and the subrecord contents from mCtx.leftRec.
void ESMReader::getSubHeader()
{
    if (mCtx.leftRec < sizeof(mCtx.leftSub))
        fail("End of record while reading sub-record header");

    // Get subrecord size
    getT(mCtx.leftSub);
    mCtx.leftRec -= sizeof(mCtx.leftSub);

    // Adjust number of record bytes left
    // NOTE(review): this check compares the subrecord size against the bytes
    // left in the record; the message wording speaks of record and file.
    if (mCtx.leftRec < mCtx.leftSub)
        fail("Record size is larger than rest of file");
    mCtx.leftRec -= mCtx.leftSub;
}

// Reads the name of the next record and deducts it from the bytes left in
// the file. Fails when there are no more records.
NAME ESMReader::getRecName()
{
    if (!hasMoreRecs())
        fail("No more records, getRecName() failed");
    getName(mCtx.recName);
    mCtx.leftFile -= decltype(mCtx.recName)::sCapacity;

    // Make sure we don't carry over any old cached subrecord
    // names. This can happen in some cases when we skip parts of a
    // record.
    mCtx.subCached = false;

    return mCtx.recName;
}

// Skips whatever is left of the current record.
void ESMReader::skipRecord()
{
    skip(mCtx.leftRec);
    mCtx.leftRec = 0;
    mCtx.subCached = false;
}

// Reads the three 32-bit record header fields: the record size goes to
// mCtx.leftRec, the last field is returned through `flags`.
void ESMReader::getRecHeader(uint32_t& flags)
{
    // General error checking
    if (mCtx.leftFile < 3 * sizeof(uint32_t))
        fail("End of file while reading record header");
    if (mCtx.leftRec)
        fail("Previous record contains unread bytes");

    getUint(mCtx.leftRec);
    getUint(flags); // This header entry is always zero
    getUint(flags);
    mCtx.leftFile -= 3 * sizeof(uint32_t);

    // Check that sizes add up
    if (mCtx.leftFile < mCtx.leftRec)
        reportSubSizeMismatch(mCtx.leftFile, mCtx.leftRec);

    // Adjust number of bytes left in file
    mCtx.leftFile -= mCtx.leftRec;
}

/*************************************************************************
 *
 *  Lowest level data reading and misc methods
 *
 *************************************************************************/

// Reads `size` bytes and returns them as a string, cut at the first zero
// byte and converted by the encoder when one is set. A negative `size` is
// reported through fail() instead of being converted to a huge unsigned
// buffer size.
std::string ESMReader::getString(int size)
{
    if (size < 0)
        fail("Negative string size: " + std::to_string(size));

    // Buffer handling, termination and encoding are shared with
    // getStringView(); only the copy into an owning string happens here.
    return std::string(getStringView(static_cast<std::size_t>(size)));
}

// Throws std::runtime_error with `msg` plus the current file, record and
// subrecord names and, when a stream is open, the current stream offset.
[[noreturn]] void ESMReader::fail(const std::string& msg)
{
    std::stringstream ss;

    ss << "ESM Error: " << msg;
    ss << "\n File: " << mCtx.filename;
    ss << "\n Record: " << mCtx.recName.toStringView();
    ss << "\n Subrecord: " << mCtx.subName.toStringView();
    if (mEsm.get())
        ss << "\n Offset: 0x" << std::hex << mEsm->tellg();
    throw std::runtime_error(ss.str());
}

}