2012-09-23 18:41:41 +00:00
|
|
|
#include "esmreader.hpp"
|
2011-04-06 16:11:08 +00:00
|
|
|
|
2015-02-22 13:19:00 +00:00
|
|
|
#include <stdexcept>
|
2013-01-01 23:13:36 +00:00
|
|
|
|
2011-04-06 16:11:08 +00:00
|
|
|
namespace ESM
|
|
|
|
{
|
|
|
|
|
2011-06-19 16:14:03 +00:00
|
|
|
using namespace Misc;
|
|
|
|
|
2013-12-16 10:39:24 +00:00
|
|
|
std::string ESMReader::getName() const
|
|
|
|
{
|
|
|
|
return mCtx.filename;
|
|
|
|
}
|
|
|
|
|
2011-04-06 16:11:08 +00:00
|
|
|
// Returns a copy of the reader context. The stored file position is
// refreshed from the stream first, so the copy reflects the current offset.
ESM_Context ESMReader::getContext()
{
    // Ask the stream where we are; the context does not track this itself.
    mCtx.filePos = mEsm->tellg();

    return mCtx;
}
|
|
|
|
|
2013-05-16 16:50:26 +00:00
|
|
|
// Builds a reader with no stream attached: counters are zeroed, the
// reader-list and encoder pointers are null, and the scratch buffer used by
// getString() starts out with 50*1024 elements.
ESMReader::ESMReader()
    : mIdx(0),
      mRecordFlags(0),
      mBuffer(50*1024),
      mGlobalReaderList(NULL),
      mEncoder(NULL),
      mFileSize(0)
{
}
|
|
|
|
|
2013-03-12 13:33:35 +00:00
|
|
|
int ESMReader::getFormat() const
|
|
|
|
{
|
|
|
|
return mHeader.mFormat;
|
|
|
|
}
|
|
|
|
|
2011-04-06 16:11:08 +00:00
|
|
|
void ESMReader::restoreContext(const ESM_Context &rc)
|
|
|
|
{
|
|
|
|
// Reopen the file if necessary
|
|
|
|
if (mCtx.filename != rc.filename)
|
|
|
|
openRaw(rc.filename);
|
|
|
|
|
|
|
|
// Copy the data
|
|
|
|
mCtx = rc;
|
|
|
|
|
|
|
|
// Make sure we seek to the right place
|
2015-02-22 13:12:05 +00:00
|
|
|
mEsm->seekg(mCtx.filePos);
|
2011-04-06 16:11:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::close()
|
|
|
|
{
|
2015-02-22 13:12:05 +00:00
|
|
|
mEsm.reset();
|
2011-04-06 16:11:08 +00:00
|
|
|
mCtx.filename.clear();
|
|
|
|
mCtx.leftFile = 0;
|
|
|
|
mCtx.leftRec = 0;
|
|
|
|
mCtx.leftSub = 0;
|
|
|
|
mCtx.subCached = false;
|
|
|
|
mCtx.recName.val = 0;
|
|
|
|
mCtx.subName.val = 0;
|
|
|
|
}
|
|
|
|
|
2015-02-22 13:12:05 +00:00
|
|
|
// Attaches the reader to an already opened stream without parsing anything.
// The stream's total size is recorded both as mFileSize and as the number of
// bytes left in the file.
void ESMReader::openRaw(Files::IStreamPtr _esm, const std::string& name)
{
    // Start from a clean state; this also drops any previously open stream.
    close();

    mEsm = _esm;
    mCtx.filename = name;

    // Measure the stream by seeking to its end, then rewind to the start.
    mEsm->seekg(0, mEsm->end);
    mFileSize = mEsm->tellg();
    mCtx.leftFile = mFileSize;
    mEsm->seekg(0, mEsm->beg);
}
|
|
|
|
|
2015-02-22 13:12:05 +00:00
|
|
|
void ESMReader::openRaw(const std::string& filename)
|
|
|
|
{
|
|
|
|
openRaw(Files::openConstrainedFileStream(filename.c_str()), filename);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Attaches the reader to `_esm` and loads the file header. Fails when the
// first record name is not "TES3".
void ESMReader::open(Files::IStreamPtr _esm, const std::string &name)
{
    openRaw(_esm, name);

    // The very first record must carry the TES3 name.
    if (getRecName() != "TES3")
    {
        fail("Not a valid Morrowind file");
    }

    // Consume the record header, then let the header object read its fields.
    getRecHeader();
    mHeader.load(*this);
}
|
|
|
|
|
|
|
|
void ESMReader::open(const std::string &file)
|
|
|
|
{
|
2015-02-22 13:12:05 +00:00
|
|
|
open (Files::openConstrainedFileStream (file.c_str ()), file);
|
2011-04-06 16:11:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
int64_t ESMReader::getHNLong(const char *name)
|
|
|
|
{
|
|
|
|
int64_t val;
|
|
|
|
getHNT(val, name);
|
|
|
|
return val;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string ESMReader::getHNOString(const char* name)
|
|
|
|
{
|
|
|
|
if (isNextSub(name))
|
|
|
|
return getHString();
|
|
|
|
return "";
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string ESMReader::getHNString(const char* name)
|
|
|
|
{
|
|
|
|
getSubNameIs(name);
|
|
|
|
return getHString();
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string ESMReader::getHString()
|
|
|
|
{
|
|
|
|
getSubHeader();
|
|
|
|
|
|
|
|
// Hack to make MultiMark.esp load. Zero-length strings do not
|
|
|
|
// occur in any of the official mods, but MultiMark makes use of
|
|
|
|
// them. For some reason, they break the rules, and contain a byte
|
|
|
|
// (value 0) even if the header says there is no data. If
|
|
|
|
// Morrowind accepts it, so should we.
|
|
|
|
if (mCtx.leftSub == 0)
|
|
|
|
{
|
|
|
|
// Skip the following zero byte
|
|
|
|
mCtx.leftRec--;
|
|
|
|
char c;
|
2015-01-31 18:38:42 +00:00
|
|
|
getExact(&c, 1);
|
2011-04-06 16:11:08 +00:00
|
|
|
return "";
|
|
|
|
}
|
|
|
|
|
|
|
|
return getString(mCtx.leftSub);
|
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::getHExact(void*p, int size)
|
|
|
|
{
|
|
|
|
getSubHeader();
|
|
|
|
if (size != static_cast<int> (mCtx.leftSub))
|
2015-01-20 18:12:07 +00:00
|
|
|
{
|
|
|
|
std::stringstream error;
|
|
|
|
error << "getHExact(): size mismatch (requested " << size << ", got " << mCtx.leftSub << ")";
|
|
|
|
fail(error.str());
|
|
|
|
}
|
2011-04-06 16:11:08 +00:00
|
|
|
getExact(p, size);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Read the given number of bytes from a named subrecord
|
|
|
|
void ESMReader::getHNExact(void*p, int size, const char* name)
|
|
|
|
{
|
|
|
|
getSubNameIs(name);
|
|
|
|
getHExact(p, size);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Get the next subrecord name and check if it matches the parameter
|
|
|
|
void ESMReader::getSubNameIs(const char* name)
|
|
|
|
{
|
|
|
|
getSubName();
|
|
|
|
if (mCtx.subName != name)
|
|
|
|
fail(
|
|
|
|
"Expected subrecord " + std::string(name) + " but got "
|
|
|
|
+ mCtx.subName.toString());
|
|
|
|
}
|
|
|
|
|
|
|
|
bool ESMReader::isNextSub(const char* name)
|
|
|
|
{
|
|
|
|
if (!mCtx.leftRec)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
getSubName();
|
|
|
|
|
|
|
|
// If the name didn't match, then mark the it as 'cached' so it's
|
|
|
|
// available for the next call to getSubName.
|
|
|
|
mCtx.subCached = (mCtx.subName != name);
|
|
|
|
|
|
|
|
// If subCached is false, then subName == name.
|
|
|
|
return !mCtx.subCached;
|
|
|
|
}
|
|
|
|
|
2015-06-21 16:18:24 +00:00
|
|
|
bool ESMReader::peekNextSub(const char *name)
|
|
|
|
{
|
|
|
|
if (!mCtx.leftRec)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
getSubName();
|
|
|
|
|
|
|
|
mCtx.subCached = true;
|
|
|
|
return mCtx.subName == name;
|
|
|
|
}
|
|
|
|
|
2011-04-06 16:11:08 +00:00
|
|
|
// Read subrecord name. This gets called a LOT, so I've optimized it
|
|
|
|
// slightly.
|
|
|
|
void ESMReader::getSubName()
|
|
|
|
{
|
|
|
|
// If the name has already been read, do nothing
|
|
|
|
if (mCtx.subCached)
|
|
|
|
{
|
|
|
|
mCtx.subCached = false;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
// reading the subrecord data anyway.
|
2015-01-31 18:38:42 +00:00
|
|
|
getExact(mCtx.subName.name, 4);
|
2011-04-06 16:11:08 +00:00
|
|
|
mCtx.leftRec -= 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool ESMReader::isEmptyOrGetName()
|
|
|
|
{
|
|
|
|
if (mCtx.leftRec)
|
|
|
|
{
|
2015-01-31 18:38:42 +00:00
|
|
|
getExact(mCtx.subName.name, 4);
|
2011-04-06 16:11:08 +00:00
|
|
|
mCtx.leftRec -= 4;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::skipHSub()
|
|
|
|
{
|
|
|
|
getSubHeader();
|
|
|
|
skip(mCtx.leftSub);
|
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::skipHSubSize(int size)
|
|
|
|
{
|
|
|
|
skipHSub();
|
|
|
|
if (static_cast<int> (mCtx.leftSub) != size)
|
|
|
|
fail("skipHSubSize() mismatch");
|
|
|
|
}
|
|
|
|
|
2015-01-19 22:29:06 +00:00
|
|
|
void ESMReader::skipHSubUntil(const char *name)
|
|
|
|
{
|
|
|
|
while (hasMoreSubs() && !isNextSub(name))
|
|
|
|
{
|
|
|
|
mCtx.subCached = false;
|
|
|
|
skipHSub();
|
|
|
|
}
|
|
|
|
if (hasMoreSubs())
|
|
|
|
mCtx.subCached = true;
|
|
|
|
}
|
|
|
|
|
2011-04-06 16:11:08 +00:00
|
|
|
void ESMReader::getSubHeader()
|
|
|
|
{
|
|
|
|
if (mCtx.leftRec < 4)
|
|
|
|
fail("End of record while reading sub-record header");
|
|
|
|
|
|
|
|
// Get subrecord size
|
|
|
|
getT(mCtx.leftSub);
|
|
|
|
|
|
|
|
// Adjust number of record bytes left
|
|
|
|
mCtx.leftRec -= mCtx.leftSub + 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::getSubHeaderIs(int size)
|
|
|
|
{
|
|
|
|
getSubHeader();
|
|
|
|
if (size != static_cast<int> (mCtx.leftSub))
|
|
|
|
fail("getSubHeaderIs(): Sub header mismatch");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Reads the name of the next record into mCtx.recName and returns it.
// Fails when hasMoreRecs() reports that no records remain.
NAME ESMReader::getRecName()
{
    if (!hasMoreRecs())
    {
        fail("No more records, getRecName() failed");
    }

    // A stale cached subrecord name can be left over when parts of a record
    // were skipped; it must not leak into the record that starts here.
    mCtx.subCached = false;

    getName(mCtx.recName);
    mCtx.leftFile -= 4;

    return mCtx.recName;
}
|
|
|
|
|
|
|
|
void ESMReader::skipRecord()
|
|
|
|
{
|
|
|
|
skip(mCtx.leftRec);
|
|
|
|
mCtx.leftRec = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::getRecHeader(uint32_t &flags)
|
|
|
|
{
|
|
|
|
// General error checking
|
|
|
|
if (mCtx.leftFile < 12)
|
|
|
|
fail("End of file while reading record header");
|
|
|
|
if (mCtx.leftRec)
|
|
|
|
fail("Previous record contains unread bytes");
|
|
|
|
|
|
|
|
getUint(mCtx.leftRec);
|
|
|
|
getUint(flags);// This header entry is always zero
|
|
|
|
getUint(flags);
|
|
|
|
mCtx.leftFile -= 12;
|
|
|
|
|
|
|
|
// Check that sizes add up
|
|
|
|
if (mCtx.leftFile < mCtx.leftRec)
|
|
|
|
fail("Record size is larger than rest of file");
|
|
|
|
|
|
|
|
// Adjust number of bytes mCtx.left in file
|
|
|
|
mCtx.leftFile -= mCtx.leftRec;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*************************************************************************
|
|
|
|
*
|
|
|
|
* Lowest level data reading and misc methods
|
|
|
|
*
|
|
|
|
*************************************************************************/
|
|
|
|
|
|
|
|
void ESMReader::getExact(void*x, int size)
|
|
|
|
{
|
2015-01-31 18:38:42 +00:00
|
|
|
try
|
|
|
|
{
|
2015-02-22 13:12:05 +00:00
|
|
|
mEsm->read((char*)x, size);
|
2015-01-31 18:38:42 +00:00
|
|
|
}
|
|
|
|
catch (std::exception& e)
|
|
|
|
{
|
|
|
|
fail(std::string("Read error: ") + e.what());
|
|
|
|
}
|
2011-04-06 16:11:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
std::string ESMReader::getString(int size)
|
|
|
|
{
|
2013-01-03 20:15:18 +00:00
|
|
|
size_t s = size;
|
|
|
|
if (mBuffer.size() <= s)
|
|
|
|
// Add some extra padding to reduce the chance of having to resize
|
|
|
|
// again later.
|
|
|
|
mBuffer.resize(3*s);
|
|
|
|
|
|
|
|
// And make sure the string is zero terminated
|
|
|
|
mBuffer[s] = 0;
|
|
|
|
|
|
|
|
// read ESM data
|
|
|
|
char *ptr = &mBuffer[0];
|
|
|
|
getExact(ptr, size);
|
2011-04-06 16:11:08 +00:00
|
|
|
|
2015-01-16 22:10:57 +00:00
|
|
|
size = strnlen(ptr, size);
|
2013-12-06 13:24:14 +00:00
|
|
|
|
2011-04-06 16:11:08 +00:00
|
|
|
// Convert to UTF8 and return
|
2013-11-19 12:46:24 +00:00
|
|
|
if (mEncoder)
|
|
|
|
return mEncoder->getUtf8(ptr, size);
|
|
|
|
|
|
|
|
return std::string (ptr, size);
|
2011-04-06 16:11:08 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::fail(const std::string &msg)
|
|
|
|
{
|
|
|
|
using namespace std;
|
|
|
|
|
|
|
|
stringstream ss;
|
|
|
|
|
|
|
|
ss << "ESM Error: " << msg;
|
|
|
|
ss << "\n File: " << mCtx.filename;
|
|
|
|
ss << "\n Record: " << mCtx.recName.toString();
|
|
|
|
ss << "\n Subrecord: " << mCtx.subName.toString();
|
2015-02-22 13:12:05 +00:00
|
|
|
if (mEsm.get())
|
|
|
|
ss << "\n Offset: 0x" << hex << mEsm->tellg();
|
2011-04-06 16:11:08 +00:00
|
|
|
throw std::runtime_error(ss.str());
|
|
|
|
}
|
|
|
|
|
2013-01-06 00:37:58 +00:00
|
|
|
// Sets the encoder that getString() uses to convert text to UTF-8. The
// pointer is stored as given; a null pointer makes getString() return the
// bytes unconverted.
void ESMReader::setEncoder(ToUTF8::Utf8Encoder* encoder)
{
    this->mEncoder = encoder;
}
|
|
|
|
|
2015-02-22 13:12:05 +00:00
|
|
|
size_t ESMReader::getFileOffset()
|
|
|
|
{
|
|
|
|
return mEsm->tellg();
|
|
|
|
}
|
|
|
|
|
|
|
|
void ESMReader::skip(int bytes)
|
|
|
|
{
|
|
|
|
mEsm->seekg(getFileOffset()+bytes);
|
|
|
|
}
|
|
|
|
|
2011-04-06 16:11:08 +00:00
|
|
|
}
|