/* Copyright (C) 2010 Wildfire Games. * This file is part of 0 A.D. * * 0 A.D. is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 2 of the License, or * (at your option) any later version. * * 0 A.D. is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with 0 A.D. If not, see . */ #include "precompiled.h" #include "BinarySerializer.h" #include "SerializedScriptTypes.h" #include "lib/byte_order.h" #include "lib/utf8.h" #include "ps/CLogger.h" #include "ps/utf16string.h" #include "scriptinterface/ScriptInterface.h" #include "scriptinterface/AutoRooters.h" // Shut up some warnings triggered by jsobj.h #if MSC_VERSION # pragma warning(push) # pragma warning(disable:4512) // assignment operator could not be generated # pragma warning(disable:4800) // forcing value to bool 'true' or 'false' (performance warning) #endif #include "js/jsobj.h" #if MSC_VERSION # pragma warning(pop) #endif CBinarySerializer::CBinarySerializer(ScriptInterface& scriptInterface) : m_ScriptInterface(scriptInterface), m_ScriptBackrefsNext(1), m_Rooter(scriptInterface) { } /* The Put* implementations here are designed for subclasses that want an efficient, portable, deserializable representation. (Subclasses with different requirements should override these methods.) Numbers are converted to little-endian byte strings, for portability and efficiency. Data is not aligned, for storage efficiency. */ void CBinarySerializer::PutNumber(const char* name, uint8_t value) { Put(name, (const u8*)&value, sizeof(uint8_t)); } void CBinarySerializer::PutNumber(const char* name, int32_t value) { int32_t v = (i32)to_le32((u32)value); Put(name, (const u8*)&v, sizeof(int32_t)); } void CBinarySerializer::PutNumber(const char* name, uint32_t value) { uint32_t v = to_le32(value); Put(name, (const u8*)&v, sizeof(uint32_t)); } void CBinarySerializer::PutNumber(const char* name, float value) { Put(name, (const u8*)&value, sizeof(float)); } void CBinarySerializer::PutNumber(const char* name, double value) { Put(name, (const u8*)&value, sizeof(double)); } void CBinarySerializer::PutNumber(const char* name, fixed value) { PutNumber(name, value.GetInternalValue()); } void CBinarySerializer::PutBool(const char* name, bool value) { NumberU8(name, value ? 1 : 0, 0, 1); } void CBinarySerializer::PutString(const char* name, const std::string& value) { // TODO: should intern strings, particularly to save space with script property names PutNumber("string length", (uint32_t)value.length()); Put(name, (u8*)value.data(), value.length()); } void CBinarySerializer::PutScriptVal(const char* UNUSED(name), jsval value) { HandleScriptVal(value); } //////////////////////////////////////////////////////////////// void CBinarySerializer::HandleScriptVal(jsval val) { JSContext* cx = m_ScriptInterface.GetContext(); switch (JS_TypeOfValue(cx, val)) { case JSTYPE_VOID: { NumberU8_Unbounded("type", SCRIPT_TYPE_VOID); break; } case JSTYPE_NULL: // This type is never actually returned (it's a JS2 feature) { NumberU8_Unbounded("type", SCRIPT_TYPE_NULL); break; } case JSTYPE_OBJECT: { if (JSVAL_IS_NULL(val)) { NumberU8_Unbounded("type", SCRIPT_TYPE_NULL); break; } JSObject* obj = JSVAL_TO_OBJECT(val); // If we've already serialized this object, just output a reference to it u32 tag = GetScriptBackrefTag(obj); if (tag) { NumberU8_Unbounded("type", SCRIPT_TYPE_BACKREF); NumberU32_Unbounded("tag", tag); break; } if (JS_IsArrayObject(cx, obj)) { NumberU8_Unbounded("type", SCRIPT_TYPE_ARRAY); // TODO: probably should have a more efficient storage format } else { NumberU8_Unbounded("type", SCRIPT_TYPE_OBJECT); // if (JS_GetClass(cx, obj)) // { // LOGERROR("Cannot serialise JS objects of type 'object' with a class"); // throw PSERROR_Serialize_InvalidScriptValue(); // } // TODO: ought to complain only about non-standard classes // TODO: probably ought to do something cleverer for classes, prototypes, etc // (See Trac #406, #407) } // Find all properties (ordered by insertion time) // JS_Enumerate is a bit slow (lots of memory allocation), so do the enumeration manually // (based on the code from JS_Enumerate, using the probably less stable JSObject API): // (Note that we don't do any rooting, because we assume nothing is going to trigger GC. // I'm not absolute certain that's necessarily a valid assumption.) jsval iter_state, num_properties; if (!obj->enumerate(cx, JSENUMERATE_INIT, &iter_state, &num_properties)) throw PSERROR_Serialize_ScriptError("enumerate INIT failed"); debug_assert(JSVAL_TO_INT(num_properties) >= 0); size_t n = (size_t)JSVAL_TO_INT(num_properties); // Note: num_properties might be 0 if the object doesn't know in advance how many to enumerate; // we can't distinguish that from really having 0 properties without performing the actual iteration, // so just assume the object always returns the correct count NumberU32_Unbounded("num props", (uint32_t)n); jsid id; for (size_t i = 0; i < n; ++i) { if (!obj->enumerate(cx, JSENUMERATE_NEXT, &iter_state, &id)) throw PSERROR_Serialize_ScriptError("enumerate NEXT failed"); if (JSVAL_IS_NULL(iter_state)) throw PSERROR_Serialize_ScriptError("enumerate NEXT gave unexpected null"); jsval idval, propval; // Get the property name as a string if (!JS_IdToValue(cx, id, &idval)) throw PSERROR_Serialize_ScriptError("JS_IdToValue failed"); JSString* idstr = JS_ValueToString(cx, idval); if (!idstr) throw PSERROR_Serialize_ScriptError("JS_ValueToString failed"); ScriptString("prop name", idstr); // Use LookupProperty instead of GetProperty to avoid the danger of getters // (they might delete values and trigger GC) if (!JS_LookupPropertyById(cx, obj, id, &propval)) throw PSERROR_Serialize_ScriptError("JS_LookupPropertyById failed"); HandleScriptVal(propval); } // Check we really reached the end of the iteration if (!obj->enumerate(cx, JSENUMERATE_NEXT, &iter_state, &id)) throw PSERROR_Serialize_ScriptError("enumerate NEXT failed"); if (!JSVAL_IS_NULL(iter_state)) throw PSERROR_Serialize_ScriptError("enumerate NEXT didn't give unexpected null"); break; } case JSTYPE_FUNCTION: { LOGERROR(L"Cannot serialise JS objects of type 'function'"); throw PSERROR_Serialize_InvalidScriptValue(); } case JSTYPE_STRING: { NumberU8_Unbounded("type", SCRIPT_TYPE_STRING); ScriptString("string", JSVAL_TO_STRING(val)); break; } case JSTYPE_NUMBER: { // For efficiency, handle ints and doubles separately. if (JSVAL_IS_INT(val)) { NumberU8_Unbounded("type", SCRIPT_TYPE_INT); // jsvals are limited to JSVAL_INT_BITS == 31 bits, even on 64-bit platforms NumberI32("value", (int32_t)JSVAL_TO_INT(val), JSVAL_INT_MIN, JSVAL_INT_MAX); } else { debug_assert(JSVAL_IS_DOUBLE(val)); NumberU8_Unbounded("type", SCRIPT_TYPE_DOUBLE); jsdouble* dbl = JSVAL_TO_DOUBLE(val); NumberDouble_Unbounded("value", *dbl); } break; } case JSTYPE_BOOLEAN: { NumberU8_Unbounded("type", SCRIPT_TYPE_BOOLEAN); JSBool b = JSVAL_TO_BOOLEAN(val); NumberU8_Unbounded("value", b ? 1 : 0); break; } case JSTYPE_XML: { LOGERROR(L"Cannot serialise JS objects of type 'xml'"); throw PSERROR_Serialize_InvalidScriptValue(); } default: { debug_warn(L"Invalid TypeOfValue"); throw PSERROR_Serialize_InvalidScriptValue(); } } } void CBinarySerializer::ScriptString(const char* name, JSString* string) { jschar* chars = JS_GetStringChars(string); size_t length = JS_GetStringLength(string); #if BYTE_ORDER != LITTLE_ENDIAN #error TODO: probably need to convert JS strings to little-endian #endif // Serialize strings directly as UTF-16, to avoid expensive encoding conversions NumberU32_Unbounded("string length", (uint32_t)length); RawBytes(name, (const u8*)chars, length*2); } u32 CBinarySerializer::GetScriptBackrefTag(JSObject* obj) { // To support non-tree structures (e.g. "var x = []; var y = [x, x];"), we need a way // to indicate multiple references to one object(/array). So every time we serialize a // new object, we give it a new non-zero tag; when we serialize it a second time we just // refer to that tag. // // The tags are stored in a map. Maybe it'd be more efficient to store it inline in the object // somehow? but this works okay for now std::pair it = m_ScriptBackrefs.insert(std::make_pair(obj, m_ScriptBackrefsNext)); // If it was already there, return the tag if (!it.second) return it.first->second; // If it was newly inserted, we need to make sure it gets rooted // for the duration that it's in m_ScriptBackrefs m_Rooter.Push(it.first->first); m_ScriptBackrefsNext++; // Return a non-tag number so callers know they need to serialize the object return 0; }