1
0
Fork 0
mirror of https://github.com/OpenMW/openmw.git synced 2025-01-22 21:53:52 +00:00
openmw/components/esm/esm_reader.hpp

737 lines
18 KiB
C++
Raw Normal View History

#ifndef _ESM_READER_H
#define _ESM_READER_H
2010-02-16 15:03:18 +00:00
#include <string>
2010-06-27 21:43:07 +00:00
#include <libs/platform/stdint.h>
2010-02-16 19:23:54 +00:00
#include <string.h>
2010-02-16 15:03:18 +00:00
#include <assert.h>
#include <vector>
2010-02-19 08:12:49 +00:00
#include <sstream>
#include <iomanip>
#include <errno.h>
#include <iconv.h>
2010-02-16 15:03:18 +00:00
#include <libs/mangle/stream/stream.hpp>
#include <libs/mangle/stream/servers/file_stream.hpp>
#include <libs/mangle/tools/str_exception.hpp>
2010-06-28 19:44:55 +00:00
#include <components/misc/stringops.hpp>
#ifdef __APPLE__
// need our own implementation of strnlen
2010-06-03 22:56:14 +00:00
static size_t strnlen(const char *s, size_t n)
{
const char *p = (const char *)memchr(s, 0, n);
return(p ? p-s : n);
}
#endif
2010-02-19 13:23:22 +00:00
namespace ESM {
enum Version
{
VER_12 = 0x3f99999a,
VER_13 = 0x3fa66666
};
2010-02-22 20:00:38 +00:00
enum FileType
{
FT_ESP = 0, // Plugin
FT_ESM = 1, // Master
FT_ESS = 32 // Savegame
};
// Used to mark special files. The original ESM files are given
// special treatment in a few places, most noticably in loading and
// filtering out "dirtly" GMST entries correctly.
enum SpecialFile
{
SF_Other,
SF_Morrowind,
SF_Tribunal,
SF_Bloodmoon
};
2010-02-16 15:03:18 +00:00
/* A structure used for holding fixed-length strings. In the case of
LEN=4, it can be more efficient to match the string as a 32 bit
number, therefore the struct is implemented as a union with an int.
*/
template <int LEN>
union NAME_T
{
char name[LEN];
int32_t val;
bool operator==(const char *str)
{
for(int i=0; i<LEN; i++)
if(name[i] != str[i]) return false;
else if(name[i] == 0) return true;
return str[LEN] == 0;
}
bool operator!=(const char *str) { return !((*this)==str); }
bool operator==(const std::string &str)
2010-02-16 15:03:18 +00:00
{
return (*this) == str.c_str();
}
bool operator!=(const std::string &str) { return !((*this)==str); }
2010-02-16 15:03:18 +00:00
bool operator==(int v) { return v == val; }
bool operator!=(int v) { return v != val; }
2010-02-16 19:23:54 +00:00
2010-02-26 15:36:54 +00:00
std::string toString() const { return std::string(name, strnlen(name, LEN)); }
2010-02-16 15:03:18 +00:00
};
typedef NAME_T<4> NAME;
typedef NAME_T<32> NAME32;
2010-02-17 13:54:22 +00:00
typedef NAME_T<64> NAME64;
2010-02-16 15:03:18 +00:00
typedef NAME_T<256> NAME256;
2010-02-25 13:03:03 +00:00
#pragma pack(push)
#pragma pack(1)
/// File header data for all ES files
struct HEDRstruct
{
/* File format version. This is actually a float, the supported
versions are 1.2 and 1.3. These correspond to:
1.2 = 0x3f99999a and 1.3 = 0x3fa66666
*/
int version;
int type; // 0=esp, 1=esm, 32=ess
NAME32 author; // Author's name
NAME256 desc; // File description
int records; // Number of records? Not used.
};
// Defines another files (esm or esp) that this file depends upon.
struct MasterData
{
std::string name;
uint64_t size;
};
// Data that is only present in save game files
struct SaveData
{
float pos[6]; // Player position and rotation
NAME64 cell; // Cell name
float unk2; // Unknown value - possibly game time?
NAME32 player; // Player name
};
#pragma pack(pop)
/* This struct defines a file 'context' which can be saved and later
restored by an ESMReader instance. It will save the position within
a file, and when restored will let you read from that position as
if you never left it.
*/
struct ESM_Context
{
std::string filename;
uint32_t leftRec, leftSub;
size_t leftFile;
NAME recName, subName;
HEDRstruct header;
// True if subName has been read but not used.
bool subCached;
// File position. Only used for stored contexts, not regularly
// updated within the reader itself.
size_t filePos;
};
2010-02-16 15:03:18 +00:00
class ESMReader
{
public:
2010-02-16 15:03:18 +00:00
/*************************************************************************
*
* Public type definitions
*
*************************************************************************/
2010-02-17 13:54:22 +00:00
typedef std::vector<MasterData> MasterList;
2010-02-16 19:23:54 +00:00
/*************************************************************************
*
* Information retrieval
*
*************************************************************************/
2010-02-25 13:03:03 +00:00
int getVer() { return c.header.version; }
float getFVer() { return *((float*)&c.header.version); }
int getSpecial() { return spf; }
2010-02-25 13:03:03 +00:00
const std::string getAuthor() { return c.header.author.toString(); }
const std::string getDesc() { return c.header.desc.toString(); }
const SaveData &getSaveData() { return saveData; }
const MasterList &getMasters() { return masters; }
2010-02-26 15:36:54 +00:00
const NAME &retSubName() { return c.subName; }
2010-02-25 13:03:03 +00:00
uint32_t getSubSize() { return c.leftSub; }
/*************************************************************************
*
* Opening and closing
*
*************************************************************************/
2010-02-25 13:03:03 +00:00
/** Save the current file position and information in a ESM_Context
struct
*/
ESM_Context getContext()
{
// Update the file position before returning
c.filePos = esm->tell();
return c;
}
/** Restore a previously saved context */
void restoreContext(const ESM_Context &rc)
{
// Reopen the file if necessary
if(c.filename != rc.filename)
openRaw(rc.filename);
// Copy the data
c = rc;
// Make sure we seek to the right place
esm->seek(c.filePos);
}
/** Close the file, resets all information. After calling close()
the structure may be reused to load a new file.
*/
void close()
2010-02-16 15:03:18 +00:00
{
esm.reset();
2010-02-25 13:03:03 +00:00
c.filename.clear();
c.leftFile = 0;
c.leftRec = 0;
c.leftSub = 0;
c.subCached = false;
c.recName.val = 0;
c.subName.val = 0;
}
2010-02-19 08:12:49 +00:00
/// Raw opening. Opens the file and sets everything up but doesn't
/// parse the header.
void openRaw(Mangle::Stream::StreamPtr _esm, const std::string &name)
2010-06-28 19:44:55 +00:00
{
close();
esm = _esm;
2010-02-25 13:03:03 +00:00
c.filename = name;
c.leftFile = esm->size();
2010-02-16 15:03:18 +00:00
// Flag certain files for special treatment, based on the file
// name.
2010-02-25 13:03:03 +00:00
const char *cstr = c.filename.c_str();
if(iends(cstr, "Morrowind.esm")) spf = SF_Morrowind;
else if(iends(cstr, "Tribunal.esm")) spf = SF_Tribunal;
else if(iends(cstr, "Bloodmoon.esm")) spf = SF_Bloodmoon;
else spf = SF_Other;
2010-02-19 08:12:49 +00:00
}
/// Load ES file from a new stream, parses the header. Closes the
/// currently open file first, if any.
2010-02-19 08:12:49 +00:00
void open(Mangle::Stream::StreamPtr _esm, const std::string &name)
{
openRaw(_esm, name);
2010-02-16 19:23:54 +00:00
2010-02-16 15:03:18 +00:00
if(getRecName() != "TES3")
fail("Not a valid Morrowind file");
getRecHeader();
2010-02-16 19:23:54 +00:00
// Get the header
2010-02-25 13:03:03 +00:00
getHNT(c.header, "HEDR", 300);
2010-02-16 19:23:54 +00:00
2010-02-25 13:03:03 +00:00
if(c.header.version != VER_12 &&
c.header.version != VER_13)
2010-02-16 19:23:54 +00:00
fail("Unsupported file format version");
while(isNextSub("MAST"))
{
MasterData m;
m.name = getHString();
m.size = getHNLong("DATA");
masters.push_back(m);
2010-02-16 19:23:54 +00:00
}
2010-02-25 13:03:03 +00:00
if(c.header.type == FT_ESS)
2010-02-17 13:54:22 +00:00
{
// Savegame-related data
// Player position etc
2010-02-18 13:58:50 +00:00
getHNT(saveData, "GMDT", 124);
2010-02-17 13:54:22 +00:00
/* Image properties, five ints. Is always:
Red-mask: 0xff0000
Blue-mask: 0x00ff00
Green-mask: 0x0000ff
Alpha-mask: 0x000000
Bpp: 32
*/
getSubNameIs("SCRD");
skipHSubSize(20);
/* Savegame screenshot:
128x128 pixels * 4 bytes per pixel
*/
getSubNameIs("SCRS");
skipHSubSize(65536);
}
2010-02-16 15:03:18 +00:00
}
void open(const std::string &file)
2010-02-16 15:03:18 +00:00
{
using namespace Mangle::Stream;
open(StreamPtr(new FileStream(file)), file);
}
2010-02-19 08:12:49 +00:00
void openRaw(const std::string &file)
{
using namespace Mangle::Stream;
openRaw(StreamPtr(new FileStream(file)), file);
}
2010-02-16 19:23:54 +00:00
/*************************************************************************
*
* Medium-level reading shortcuts
*
*************************************************************************/
// Read data of a given type, stored in a subrecord of a given name
template <typename X>
void getHNT(X &x, const char* name)
{
getSubNameIs(name);
getHT(x);
}
// Optional version of getHNT
template <typename X>
void getHNOT(X &x, const char* name)
{
if(isNextSub(name))
getHT(x);
}
2010-02-18 13:58:50 +00:00
// Version with extra size checking, to make sure the compiler
// doesn't mess up our struct padding.
template <typename X>
void getHNT(X &x, const char* name, int size)
{
assert(sizeof(X) == size);
getSubNameIs(name);
getHT(x);
}
2010-02-17 13:54:22 +00:00
int64_t getHNLong(const char *name)
{
int64_t val;
getHNT(val, name);
return val;
}
2010-02-16 19:23:54 +00:00
// Get data of a given type/size, including subrecord header
template <typename X>
void getHT(X &x)
{
getSubHeader();
2010-02-25 13:03:03 +00:00
if(c.leftSub != sizeof(X))
2010-02-16 19:23:54 +00:00
fail("getHT(): subrecord size mismatch");
getT(x);
}
2010-02-20 20:55:51 +00:00
// Version with extra size checking, to make sure the compiler
// doesn't mess up our struct padding.
template <typename X>
void getHT(X &x, int size)
{
assert(sizeof(X) == size);
getHT(x);
}
2010-02-18 13:58:50 +00:00
// Read a string by the given name if it is the next record.
std::string getHNOString(const char* name)
{
if(isNextSub(name))
return getHString();
return "";
}
// Read a string with the given sub-record name
std::string getHNString(const char* name)
{
getSubNameIs(name);
return getHString();
}
2010-02-18 13:58:50 +00:00
// Read a string, including the sub-record header (but not the name)
std::string getHString()
2010-02-17 13:54:22 +00:00
{
getSubHeader();
// Hack to make MultiMark.esp load. Zero-length strings do not
// occur in any of the official mods, but MultiMark makes use of
// them. For some reason, they break the rules, and contain a byte
// (value 0) even if the header says there is no data. If
// Morrowind accepts it, so should we.
2010-02-25 13:03:03 +00:00
if(c.leftSub == 0)
2010-02-17 13:54:22 +00:00
{
// Skip the following zero byte
2010-02-25 13:03:03 +00:00
c.leftRec--;
2010-02-17 13:54:22 +00:00
char c;
esm->read(&c,1);
return "";
}
2010-02-25 13:03:03 +00:00
return getString(c.leftSub);
2010-02-17 13:54:22 +00:00
}
// Read the given number of bytes from a subrecord
void getHExact(void*p, int size)
{
getSubHeader();
if(size !=static_cast<int> (c.leftSub))
fail("getHExact() size mismatch");
getExact(p,size);
}
// Read the given number of bytes from a named subrecord
void getHNExact(void*p, int size, const char* name)
{
getSubNameIs(name);
getHExact(p,size);
}
2010-02-16 15:03:18 +00:00
/*************************************************************************
*
2010-02-17 13:54:22 +00:00
* Low level sub-record methods
2010-02-16 15:03:18 +00:00
*
*************************************************************************/
2010-02-16 19:23:54 +00:00
// Get the next subrecord name and check if it matches the parameter
void getSubNameIs(const char* name)
{
getSubName();
2010-02-25 13:03:03 +00:00
if(c.subName != name)
fail("Expected subrecord " + std::string(name) + " but got " + c.subName.toString());
2010-02-16 19:23:54 +00:00
}
2010-02-17 13:54:22 +00:00
/** Checks if the next sub record name matches the parameter. If it
does, it is read into 'subName' just as if getSubName() was
called. If not, the read name will still be available for future
calls to getSubName(), isNextSub() and getSubNameIs().
*/
bool isNextSub(const char* name)
2010-02-16 15:03:18 +00:00
{
2010-02-25 13:03:03 +00:00
if(!c.leftRec) return false;
2010-02-17 13:54:22 +00:00
getSubName();
// If the name didn't match, then mark the it as 'cached' so it's
// available for the next call to getSubName.
2010-02-25 13:03:03 +00:00
c.subCached = (c.subName != name);
2010-02-17 13:54:22 +00:00
// If subCached is false, then subName == name.
2010-02-25 13:03:03 +00:00
return !c.subCached;
2010-02-16 15:03:18 +00:00
}
2010-02-17 13:54:22 +00:00
// Read subrecord name. This gets called a LOT, so I've optimized it
// slightly.
2010-02-16 19:23:54 +00:00
void getSubName()
{
2010-02-17 13:54:22 +00:00
// If the name has already been read, do nothing
2010-02-25 13:03:03 +00:00
if(c.subCached)
2010-02-17 13:54:22 +00:00
{
2010-02-25 13:03:03 +00:00
c.subCached = false;
2010-02-17 13:54:22 +00:00
return;
}
2010-02-16 19:23:54 +00:00
// Don't bother with error checking, we will catch an EOF upon
// reading the subrecord data anyway.
2010-02-25 13:03:03 +00:00
esm->read(c.subName.name, 4);
c.leftRec -= 4;
2010-02-16 19:23:54 +00:00
}
2010-02-26 15:36:54 +00:00
// This is specially optimized for LoadINFO.
bool isEmptyOrGetName()
{
if(c.leftRec)
{
esm->read(c.subName.name, 4);
c.leftRec -= 4;
return false;
}
return true;
}
2010-02-17 13:54:22 +00:00
// Skip current sub record, including header (but not including
// name.)
void skipHSub()
{
getSubHeader();
2010-02-25 13:03:03 +00:00
skip(c.leftSub);
2010-02-17 13:54:22 +00:00
}
// Skip sub record and check its size
void skipHSubSize(int size)
{
skipHSub();
if(static_cast<int> (c.leftSub) != size)
2010-02-17 13:54:22 +00:00
fail("skipHSubSize() mismatch");
}
/* Sub-record header. This updates leftRec beyond the current
2010-02-16 19:23:54 +00:00
sub-record as well. leftSub contains size of current sub-record.
*/
void getSubHeader()
{
2010-02-25 13:03:03 +00:00
if(c.leftRec < 4)
2010-02-16 19:23:54 +00:00
fail("End of record while reading sub-record header");
2010-02-17 13:54:22 +00:00
// Get subrecord size
2010-02-25 13:03:03 +00:00
getT(c.leftSub);
2010-02-16 19:23:54 +00:00
// Adjust number of record bytes left
2010-02-25 13:03:03 +00:00
c.leftRec -= c.leftSub + 4;
2010-02-16 19:23:54 +00:00
2010-02-17 13:54:22 +00:00
// Check that sizes added up
2010-02-25 13:03:03 +00:00
if(c.leftRec < 0)
2010-02-16 19:23:54 +00:00
fail("Not enough bytes left in record for this subrecord.");
}
/** Get sub header and check the size
*/
void getSubHeaderIs(int size)
{
getSubHeader();
if(size != static_cast<int> (c.leftSub))
fail("getSubHeaderIs(): Sub header mismatch");
}
2010-02-17 13:54:22 +00:00
/*************************************************************************
*
* Low level record methods
*
*************************************************************************/
// Get the next record name
NAME getRecName()
{
if(!hasMoreRecs())
fail("No more records, getRecName() failed");
2010-02-25 13:03:03 +00:00
getName(c.recName);
c.leftFile -= 4;
2010-02-19 08:12:49 +00:00
// Make sure we don't carry over any old cached subrecord
// names. This can happen in some cases when we skip parts of a
// record.
2010-02-25 13:03:03 +00:00
c.subCached = false;
2010-02-19 08:12:49 +00:00
2010-02-25 13:03:03 +00:00
return c.recName;
2010-02-17 13:54:22 +00:00
}
// Skip the rest of this record. Assumes the name and header have
// already been read
void skipRecord()
{
2010-02-25 13:03:03 +00:00
skip(c.leftRec);
c.leftRec = 0;
}
// Skip an entire record, including the header (but not the name)
void skipHRecord()
{
2010-02-25 13:03:03 +00:00
if(!c.leftFile) return;
getRecHeader();
skipRecord();
}
2010-02-16 15:03:18 +00:00
/* Read record header. This updatesleftFile BEYOND the data that
follows the header, ie beyond the entire record. You should use
leftRec to orient yourself inside the record itself.
*/
void getRecHeader() { uint32_t u; getRecHeader(u); }
2010-02-16 15:03:18 +00:00
void getRecHeader(uint32_t &flags)
{
// General error checking
2010-02-25 13:03:03 +00:00
if(c.leftFile < 12)
2010-02-16 15:03:18 +00:00
fail("End of file while reading record header");
2010-02-25 13:03:03 +00:00
if(c.leftRec)
2010-02-16 15:03:18 +00:00
fail("Previous record contains unread bytes");
2010-02-25 13:03:03 +00:00
getUint(c.leftRec);
2010-02-16 15:03:18 +00:00
getUint(flags);// This header entry is always zero
getUint(flags);
2010-02-25 13:03:03 +00:00
c.leftFile -= 12;
2010-02-16 15:03:18 +00:00
// Check that sizes add up
2010-02-25 13:03:03 +00:00
if(c.leftFile < c.leftRec)
2010-02-16 15:03:18 +00:00
fail("Record size is larger than rest of file");
2010-02-25 13:03:03 +00:00
// Adjust number of bytes c.left in file
c.leftFile -= c.leftRec;
2010-02-16 15:03:18 +00:00
}
2010-02-25 13:03:03 +00:00
bool hasMoreRecs() { return c.leftFile > 0; }
bool hasMoreSubs() { return c.leftRec > 0; }
2010-02-16 15:03:18 +00:00
2010-02-17 13:54:22 +00:00
/*************************************************************************
*
* Lowest level data reading and misc methods
*
*************************************************************************/
2010-02-16 19:23:54 +00:00
template <typename X>
2010-02-18 13:58:50 +00:00
void getT(X &x) { getExact(&x, sizeof(X)); }
void getExact(void*x, int size)
2010-02-17 13:54:22 +00:00
{
2010-02-18 13:58:50 +00:00
int t = esm->read(x, size);
if(t != size)
2010-02-17 13:54:22 +00:00
fail("Read error");
}
2010-02-16 19:23:54 +00:00
void getName(NAME &name) { getT(name); }
void getUint(uint32_t &u) { getT(u); }
2010-02-16 15:03:18 +00:00
2010-02-17 13:54:22 +00:00
// Read the next size bytes and return them as a string
std::string getString(int size)
{
// Not very optimized, but we can fix that later
2010-02-17 13:54:22 +00:00
char *ptr = new char[size];
esm->read(ptr,size);
// Remove any zero terminators
for(int i=0; i<size; i++)
if(ptr[i] == 0)
size = i;
// Convert to std::string and return
std::string res(ptr,size);
2010-02-17 13:54:22 +00:00
delete[] ptr;
return convertToUTF8(res);
}
// Convert a string from ISO-8859-1 encoding to UTF-8
std::string convertToUTF8(std::string input)
{
std::string output = "";
//create convert description
iconv_t cd = iconv_open("UTF-8", "ISO-8859-1");
if (cd == (iconv_t)-1) //error handling
{
std::string errMsg = "Creating description for UTF-8 converting failed: ";
switch (errno) //detailed error messages (maybe it contains too much detail :)
{
case EMFILE:
errMsg += "{OPEN_MAX} files descriptors are currently open in the calling process.";
case ENFILE:
errMsg += "Too many files are currently open in the system.";
case ENOMEM:
errMsg +="Insufficient storage space is available.";
case EINVAL:
errMsg += "The conversion specified by fromcode and tocode is not supported by the implementation.";
default:
errMsg += "Unknown Error\n";
}
fail(errMsg);
}
else
{
const size_t inputSize = input.size();
if (inputSize) //input is not empty
{
//convert function doesn't accept const char *, therefore copy content into an char *
std::vector<char> inputBuffer(input.begin(), input.end());
char *inputBufferBegin = &inputBuffer[0];
size_t inputBytesLeft = inputSize; //bytes to convert
static const size_t outputSize = 1000;
size_t outputBytesLeft;
char outputBuffer[outputSize];
char *outputBufferBegin;
while (inputBytesLeft > 0 )
{
outputBytesLeft = outputSize;
outputBufferBegin = outputBuffer;
if (iconv(cd, &inputBufferBegin, &inputBytesLeft, &outputBufferBegin, &outputBytesLeft) == (size_t)-1)
{
switch (errno)
{
case E2BIG: //outputBuffer is full
output += std::string(outputBuffer, outputSize);
break;
case EILSEQ:
fail("Iconv: Invalid multibyte sequence.\n");
break;
case EINVAL:
fail("Iconv: Incomplete multibyte sequence.\n");
break;
default:
fail("Iconv: Unknown Error\n");
}
}
}
//read only relevant bytes from outputBuffer
output += std::string(outputBuffer, outputSize - outputBytesLeft);
}
}
iconv_close (cd);
return output;
2010-02-17 13:54:22 +00:00
}
void skip(int bytes) { esm->seek(esm->tell()+bytes); }
2010-02-19 08:12:49 +00:00
uint64_t getOffset() { return esm->tell(); }
2010-02-16 15:03:18 +00:00
/// Used for error handling
void fail(const std::string &msg)
{
2010-02-19 08:12:49 +00:00
using namespace std;
stringstream ss;
ss << "ESM Error: " << msg;
2010-02-25 13:03:03 +00:00
ss << "\n File: " << c.filename;
ss << "\n Record: " << c.recName.toString();
ss << "\n Subrecord: " << c.subName.toString();
2010-02-19 08:12:49 +00:00
if(esm != NULL)
ss << "\n Offset: 0x" << hex << esm->tell();
throw str_exception(ss.str());
2010-02-16 15:03:18 +00:00
}
private:
Mangle::Stream::StreamPtr esm;
2010-02-16 15:03:18 +00:00
2010-02-25 13:03:03 +00:00
ESM_Context c;
2010-02-25 13:03:03 +00:00
// Special file signifier (see SpecialFile enum above)
int spf;
SaveData saveData;
MasterList masters;
};
2010-02-19 13:23:22 +00:00
}
#endif