Index: pkg/serialization/lib/src/format.dart |
diff --git a/pkg/serialization/lib/src/format.dart b/pkg/serialization/lib/src/format.dart |
new file mode 100644 |
index 0000000000000000000000000000000000000000..791cc83404d64bb227c4cd3c8e42e226f9330595 |
--- /dev/null |
+++ b/pkg/serialization/lib/src/format.dart |
@@ -0,0 +1,561 @@ |
+part of serialization; |
+ |
+/** |
+ * An abstract class for serialization formats. Subclasses define how data |
+ * is read or written to a particular output mechanism. |
+ */ |
+abstract class Format { |
+ |
+ const Format(); |
+ |
+ /** |
+ * Return true if this format stores primitives in their own area and uses |
+ * references to them (e.g. [SimpleFlatFormat]) and false if primitives |
+ * are stored directly (e.g. [SimpleJsonFormat], [SimpleMapFormat]). |
+ */ |
+ bool get shouldUseReferencesForPrimitives => false; |
+ |
+ /** |
+ * Generate output for [w] and return it. The particular form of the output |
+ * will depend on the format. The format can assume that [w] has data |
+ * generated by rules in a series of lists, and that each list will contain |
+ * either primitives (null, bool, num, String), Lists or Maps. The Lists or |
+ * Maps may contain any of the same things recursively, or may contain |
+ * Reference objects. For lists and maps the rule will tell us if they can |
+ * be of variable length or not. The format is allowed to operate |
+ * destructively on the rule data. |
+ */ |
+ generateOutput(Writer w); |
+ |
+ /** |
+ * Read the data from [input] in the context of [reader] and return it as a |
+ * Map with entries for "roots", "data" and "rules", which the reader knows |
+ * how to interpret. The type of [input] will depend on the particular format. |
+ */ |
+ Map<String, dynamic> read(input, Reader reader); |
+} |
+ |
+/** |
+ * This is the most basic format, which provides the internal representation |
+ * of the serialization, exposing the Reference objects. |
+ */ |
+class InternalMapFormat extends Format { |
+ const InternalMapFormat(); |
+ |
+ /** |
+ * Generate output for this format from [w] and return it as a nested Map |
+ * structure. The top level has |
+ * 3 fields, "rules" which may hold a definition of the rules used, |
+ * "data" which holds the serialized data, and "roots", which holds |
+ * [Reference] objects indicating the root objects. Note that roots are |
+ * necessary because the data is not organized in the same way as the object |
+ * structure, it's a list of lists holding self-contained maps which only |
+ * refer to other parts via [Reference] objects. |
+ */ |
+ Map<String, dynamic> generateOutput(Writer w) { |
+ var result = { |
+ "rules" : w.serializedRules(), |
+ "data" : w.states, |
+ "roots" : w._rootReferences() |
+ }; |
+ return result; |
+ } |
+ |
+ /** |
+ * Read serialized data written from this format |
+ * and return the nested Map representation described in [generateOutput]. If |
+ * the data also includes rule definitions, then these will replace the rules |
+ * in the [Serialization] for [reader]. |
+ */ |
+ Map<String, dynamic> read(Map<String, dynamic> topLevel, Reader reader) { |
+ var ruleString = topLevel["rules"]; |
+ reader.readRules(ruleString); |
+ reader._data = topLevel["data"]; |
+ topLevel["roots"] = topLevel["roots"]; |
+ return topLevel; |
+ } |
+} |
+ |
+/** |
+ * A format that stores the data in maps which can be converted into a JSON |
+ * string or passed through an isolate. Note that this consists of maps, but |
+ * that they don't follow the original object structure or look like the nested |
+ * maps of a [json] representation. They are flat, and [Reference] objects |
+ * are converted into a map form that will not make sense to |
+ * anything but this format. For simple acyclic JSON that other programs |
+ * can read, use [SimpleJsonFormat]. This is the default format, and is |
+ * easier to read than the more efficient [SimpleFlatFormat]. |
+ */ |
+class SimpleMapFormat extends InternalMapFormat { |
+ |
+ const SimpleMapFormat(); |
+ |
+ /** |
+ * Generate output for this format from [w] and return it as a String which |
+ * is the [json] representation of a nested Map structure. The top level has |
+ * 3 fields, "rules" which may hold a definition of the rules used, |
+ * "data" which holds the serialized data, and "roots", which holds |
+ * [Reference] objects indicating the root objects. Note that roots are |
+ * necessary because the data is not organized in the same way as the object |
+ * structure, it's a list of lists holding self-contained maps which only |
+ * refer to other parts via [Reference] objects. |
+ * This effectively defines a custom JSON serialization format, although |
+ * the details of the format vary depending which rules were used. |
+ */ |
+ Map<String, dynamic> generateOutput(Writer w) { |
+ forAllStates(w, (x) => x is Reference, referenceToMap); |
+ var result = super.generateOutput(w); |
+ result["roots"] = result["roots"].map( |
+ (x) => x is Reference ? referenceToMap(x) : x).toList(); |
+ return result; |
+ } |
+ |
+ /** |
+ * Convert the data generated by the rules to have maps with the fields |
+ * of [Reference] objects instead of the [Reference] so that the structure |
+ * can be serialized between isolates and json easily. |
+ */ |
+ void forAllStates(ReaderOrWriter w, bool predicate(value), |
+ void transform(value)) { |
+ for (var eachRule in w.rules) { |
+ var ruleData = w.states[eachRule.number]; |
+ for (var data in ruleData) { |
+ keysAndValues(data).forEach((key, value) { |
+ if (predicate(value)) { |
+ data[key] = transform(value); |
+ } |
+ }); |
+ } |
+ } |
+ } |
+ |
+ /** Convert the reference to a [json] serializable form. */ |
+ Map<String, int> referenceToMap(Reference ref) => ref == null ? null : |
+ { |
+ "__Ref" : 0, |
+ "rule" : ref.ruleNumber, |
+ "object" : ref.objectNumber |
+ }; |
+ |
+ /** |
+ * Convert the [referenceToMap] form for a reference back to a [Reference] |
+ * object. |
+ */ |
+ Reference mapToReference(ReaderOrWriter parent, Map<String, int> ref) => |
+ ref == null ? null : new Reference(parent, ref["rule"], ref["object"]); |
+ |
+ /** |
+ * Read serialized data written in this format |
+ * and return the nested Map representation described in [generateOutput]. If |
+ * the data also includes rule definitions, then these will replace the rules |
+ * in the [Serialization] for [reader]. |
+ */ |
+ Map<String, dynamic> read(Map<String, dynamic> topLevel, Reader reader) { |
+ super.read(topLevel, reader); |
+ forAllStates(reader, |
+ (ref) => ref is Map && ref["__Ref"] != null, |
+ (ref) => mapToReference(reader, ref)); |
+ topLevel["roots"] = topLevel["roots"] |
+ .map((x) => x is Map<String, int> ? mapToReference(reader, x) : x) |
+ .toList(); |
+ return topLevel; |
+ } |
+} |
+ |
+/** |
+ * A format for "normal" [json] representation of objects. It stores |
+ * the fields of the objects as nested maps, and doesn't allow cycles. This can |
+ * be useful in talking to existing APIs that expect [json] format data. The |
+ * output will be either a simple object (string, num, bool), a List, or a Map, |
+ * with nesting of those. |
+ * Note that since the classes of objects aren't normally stored, this isn't |
+ * enough information to read back the objects. However, if the |
+ * If the [storeRoundTripInfo] field of the format is set to true, then this |
+ * will store the rule number along with the data, allowing reconstruction. |
+ */ |
+class SimpleJsonFormat extends SimpleMapFormat { |
+ |
+ /** |
+ * Indicate if we should store rule numbers with map/list data so that we |
+ * will know how to reconstruct it with a read operation. If we don't, this |
+ * will be more compliant with things that expect known format JSON as input, |
+ * but we won't be able to read back the objects. |
+ */ |
+ final bool storeRoundTripInfo; |
+ |
+ /** |
+ * If we store the rule numbers, what key should we use to store them. |
+ */ |
+ static const String RULE = "_rule"; |
+ static const String RULES = "_rules"; |
+ static const String DATA = "_data"; |
+ static const String ROOTS = "_root"; |
+ |
+ const SimpleJsonFormat({this.storeRoundTripInfo : false}); |
+ |
+ /** |
+ * Generate output for this format from [w] and return it as |
+ * the [json] representation of a nested Map structure. |
+ */ |
+ generateOutput(Writer w) { |
+ jsonify(w); |
+ var root = w._rootReferences().first; |
+ if (root is Reference) root = w.stateForReference(root); |
+ if (w.selfDescribing && storeRoundTripInfo) { |
+ root = new Map() |
+ ..[RULES] = w.serializedRules() |
+ ..[DATA] = root; |
+ } |
+ return root; |
+ } |
+ |
+ /** |
+ * Convert the data generated by the rules to have nested maps instead |
+ * of Reference objects and to add rule numbers if [storeRoundTripInfo] |
+ * is true. |
+ */ |
+ void jsonify(Writer w) { |
+ for (var eachRule in w.rules) { |
+ var ruleData = w.states[eachRule.number]; |
+ jsonifyForRule(ruleData, w, eachRule); |
+ } |
+ } |
+ |
+ /** |
+ * For a particular [rule] modify the [ruleData] to conform to this format. |
+ */ |
+ void jsonifyForRule(List ruleData, Writer w, SerializationRule rule) { |
+ for (var i = 0; i < ruleData.length; i++) { |
+ var each = ruleData[i]; |
+ if (each is List) { |
+ jsonifyEntry(each, w); |
+ if (storeRoundTripInfo) ruleData[i].add(rule.number); |
+ } else if (each is Map) { |
+ jsonifyEntry(each, w); |
+ if (storeRoundTripInfo) each[RULE] = rule.number; |
+ } |
+ } |
+ } |
+ |
+ /** |
+ * For one particular entry, which is either a Map or a List, update it |
+ * to turn References into a nested List/Map. |
+ */ |
+ void jsonifyEntry(map, Writer w) { |
+ // Note, if this is a Map, and the key might be a reference, we need to |
+ // bend over backwards to avoid concurrent modifications. Non-string keys |
+ // won't actually work if we try to write this to json, but might happen |
+ // if e.g. sending between isolates. |
+ var updates = new Map(); |
+ keysAndValues(map).forEach((key, value) { |
+ if (value is Reference) updates[key] = w.stateForReference(value); |
+ }); |
+ updates.forEach((k, v) => map[k] = v); |
+ } |
+ |
+ /** |
+ * Read serialized data saved in this format, which should look like |
+ * either a simple type, a List or a Map and return the Map |
+ * representation that the reader expects, with top-level |
+ * entries for "rules", "data", and "roots". Nested lists/maps will be |
+ * converted into Reference objects. Note that if the data was not written |
+ * with [storeRoundTripInfo] true this will fail. |
+ */ |
+ Map<String, dynamic> read(data, Reader reader) { |
+ var result = new Map(); |
+ // Check the case of having been written without additional data and |
+ // read as if it had been written with storeRoundTripData set. |
+ if (reader.selfDescribing && !(data.containsKey(DATA))) { |
+ throw new SerializationException("Missing $DATA entry, " |
+ "may mean this was written and read with different values " |
+ "of selfDescribing."); |
+ } |
+ // If we are self-describing, we should have separate rule and data |
+ // sections. If not, we assume that we have just the data at the top level. |
+ var rules = reader.selfDescribing ? data[RULES] : null; |
+ var actualData = reader.selfDescribing ? data[DATA] : data; |
+ reader.readRules(rules); |
+ var ruleData = new List.generate(reader.rules.length, (_) => []); |
+ var top = recursivelyFixUp(actualData, reader, ruleData); |
+ result["data"] = ruleData; |
+ result["roots"] = [top]; |
+ return result; |
+ } |
+ |
+ /** |
+ * Convert nested references in [input] into [Reference] objects. |
+ */ |
+ recursivelyFixUp(input, Reader r, List result) { |
+ var data = input; |
+ if (isPrimitive(data)) { |
+ result[r._primitiveRule().number].add(data); |
+ return data; |
+ } |
+ var ruleNumber; |
+ // If we've added the rule number on as the last item in a list we have |
+ // to get rid of it or it will be interpreted as extra data. For a map |
+ // the library will be ok, but we need to get rid of the extra key before |
+ // the data is shown to the user, so we destructively modify. |
+ if (data is List) { |
+ ruleNumber = data.last; |
+ data = data.take(data.length - 1).toList(); |
+ } else if (data is Map) { |
+ ruleNumber = data.remove(RULE); |
+ } else { |
+ throw new SerializationException("Invalid data format"); |
+ } |
+ // Do not use map or other lazy operations for this. They do not play |
+ // well with a function that destructively modifies its arguments. |
+ var newData = mapValues(data, (each) => recursivelyFixUp(each, r, result)); |
+ result[ruleNumber].add(newData); |
+ return new Reference(r, ruleNumber, result[ruleNumber].length - 1); |
+ } |
+} |
+ |
+/** |
+ * Writes to a simple mostly-flat format. Details are subject to change. |
+ * Right now this produces a List containing null, num, and String. This is |
+ * more space-efficient than the map formats, but much less human-readable. |
+ * Simple usage is to turn this into JSON for transmission. |
+ */ |
+class SimpleFlatFormat extends Format { |
+ bool get shouldUseReferencesForPrimitives => true; |
+ |
+ /** |
+ * For each rule we store data to indicate whether it will be reconstructed |
+ * as a primitive, a list or a map. |
+ */ |
+ static const int STORED_AS_LIST = 1; |
+ static const int STORED_AS_MAP = 2; |
+ static const int STORED_AS_PRIMITIVE = 3; |
+ |
+ const SimpleFlatFormat(); |
+ |
+ /** |
+ * Generate output for this format from [w]. This will return a List with |
+ * three entries, corresponding to the "rules", "data", and "roots" from |
+ * [SimpleMapFormat]. The data is stored as a single List containing |
+ * primitives. |
+ */ |
+ List generateOutput(Writer w) { |
+ var result = new List(3); |
+ var flatData = []; |
+ for (var eachRule in w.rules) { |
+ var ruleData = w.states[eachRule.number]; |
+ flatData.add(ruleData.length); |
+ writeStateInto(eachRule, ruleData, flatData); |
+ } |
+ result[0] = w.serializedRules(); |
+ result[1] = flatData; |
+ result[2] = []; |
+ w._rootReferences().forEach((x) => x.writeToList(result[2])); |
+ return result; |
+ } |
+ |
+ /** |
+ * Writes the data from [rule] into the [target] list. |
+ */ |
+ void writeStateInto(SerializationRule rule, List ruleData, List target) { |
+ if (!ruleData.isEmpty) { |
+ var sample = ruleData.first; |
+ if (rule.storesStateAsLists || sample is List) { |
+ writeLists(rule, ruleData, target); |
+ } else if (rule.storesStateAsMaps || sample is Map) { |
+ writeMaps(rule, ruleData, target); |
+ } else if (rule.storesStateAsPrimitives || isPrimitive(sample)) { |
+ writeObjects(ruleData, target); |
+ } else { |
+ throw new SerializationException("Invalid data format"); |
+ } |
+ } else { |
+ // If there is no data, write a zero for the length. |
+ target.add(0); |
+ } |
+ } |
+ |
+ /** |
+ * Write [entries], which contains Lists. Either the lists are variable |
+ * length, in which case we add a length field, or they are fixed length, in |
+ * which case we don't, and assume the [rule] will know how to read the |
+ * right length when we read it back. We expect everything in the list to be |
+ * a reference, which is stored as two numbers. |
+ */ |
+ void writeLists(SerializationRule rule, List<List> entries, List target) { |
+ target.add(STORED_AS_LIST); |
+ for (var eachEntry in entries) { |
+ if (rule.hasVariableLengthEntries) { |
+ target.add(eachEntry.length); |
+ } |
+ for (var eachReference in eachEntry) { |
+ writeReference(eachReference, target); |
+ } |
+ } |
+ } |
+ |
+ /** |
+ * Write [entries], which contains Maps. Either the Maps are variable |
+ * length, in which case we add a length field, or they are fixed length, in |
+ * which case we don't, and assume the [rule] will know how to read the |
+ * right length when we read it back. Then we write alternating keys and |
+ * values. We expect the values to be references, which we store as |
+ * two numbers. |
+ */ |
+ void writeMaps(SerializationRule rule, List<Map> entries, List target) { |
+ target.add(STORED_AS_MAP); |
+ for (var eachEntry in entries) { |
+ if (rule.hasVariableLengthEntries) { |
+ target.add(eachEntry.length); |
+ } |
+ eachEntry.forEach((key, value) { |
+ writeReference(key, target); |
+ writeReference(value, target); |
+ }); |
+ } |
+ } |
+ |
+ /** |
+ * Write [entries], which contains simple objects which we can put directly |
+ * into [target]. |
+ */ |
+ void writeObjects(List entries, List target) { |
+ target.add(STORED_AS_PRIMITIVE); |
+ for (var each in entries) { |
+ if (!isPrimitive(each)) throw new SerializationException("Invalid data"); |
+ } |
+ target.addAll(entries); |
+ } |
+ |
+ /** |
+ * Write [eachRef] to [target]. It will be written as two ints. If [eachRef] |
+ * is null it will be written as two nulls. |
+ */ |
+ void writeReference(Reference eachRef, List target) { |
+ // TODO(alanknight): Writing nulls is problematic in a real flat format. |
+ if (eachRef == null) { |
+ target..add(null)..add(null); |
+ } else { |
+ eachRef.writeToList(target); |
+ } |
+ } |
+ |
+ /** |
+ * Read the data from [rawInput] in the context of [r] and return it as a |
+ * Map with entries for "roots", "data" and "rules", which the reader knows |
+ * how to interpret. We expect [rawInput] to have been generated from this |
+ * format. |
+ */ |
+ Map<String, dynamic> read(List rawInput, Reader r) { |
+ // TODO(alanknight): It's annoying to have to pass the reader around so |
+ // much, consider having the format be specific to a particular |
+ // serialization operation along with the reader and having it as a field. |
+ var input = {}; |
+ input["rules"] = rawInput[0]; |
+ r.readRules(input["rules"]); |
+ |
+ var flatData = rawInput[1]; |
+ var stream = flatData.iterator; |
+ var tempData = new List(r.rules.length); |
+ for (var eachRule in r.rules) { |
+ tempData[eachRule.number] = readRuleDataFrom(stream, eachRule, r); |
+ } |
+ input["data"] = tempData; |
+ |
+ var roots = []; |
+ var rootsAsInts = rawInput[2].iterator; |
+ do { |
+ roots.add(nextReferenceFrom(rootsAsInts, r)); |
+ } while (rootsAsInts.current != null); |
+ |
+ input["roots"] = roots; |
+ return input; |
+ } |
+ |
+ /** |
+ * Read the data for [rule] from [input] and return it. |
+ */ |
+ readRuleDataFrom(Iterator input, SerializationRule rule, Reader r) { |
+ var numberOfEntries = _next(input); |
+ var entryType = _next(input); |
+ if (entryType == STORED_AS_LIST) { |
+ return readLists(input, rule, numberOfEntries, r); |
+ } |
+ if (entryType == STORED_AS_MAP) { |
+ return readMaps(input, rule, numberOfEntries, r); |
+ } |
+ if (entryType == STORED_AS_PRIMITIVE) { |
+ return readPrimitives(input, rule, numberOfEntries); |
+ } |
+ if (numberOfEntries == 0) { |
+ return []; |
+ } else { |
+ throw new SerializationException("Invalid data in serialization"); |
+ } |
+ } |
+ |
+ /** |
+ * Read data for [rule] from [input] with [length] number of entries, |
+ * creating lists from the results. |
+ */ |
+ List readLists(Iterator input, SerializationRule rule, int length, Reader r) { |
+ var ruleData = []; |
+ for (var i = 0; i < length; i++) { |
+ var subLength = |
+ rule.hasVariableLengthEntries ? _next(input) : rule.dataLength; |
+ var subList = []; |
+ ruleData.add(subList); |
+ for (var j = 0; j < subLength; j++) { |
+ subList.add(nextReferenceFrom(input, r)); |
+ } |
+ } |
+ return ruleData; |
+ } |
+ |
+ /** |
+ * Read data for [rule] from [input] with [length] number of entries, |
+ * creating maps from the results. |
+ */ |
+ List readMaps(Iterator input, SerializationRule rule, int length, Reader r) { |
+ var ruleData = []; |
+ for (var i = 0; i < length; i++) { |
+ var subLength = |
+ rule.hasVariableLengthEntries ? _next(input) : rule.dataLength; |
+ var map = new Map(); |
+ ruleData.add(map); |
+ for (var j = 0; j < subLength; j++) { |
+ var key = nextReferenceFrom(input, r); |
+ var value = nextReferenceFrom(input, r); |
+ map[key] = value; |
+ } |
+ } |
+ return ruleData; |
+ } |
+ |
+ /** |
+ * Read data for [rule] from [input] with [length] number of entries, |
+ * treating the data as primitives that can be returned directly. |
+ */ |
+ List readPrimitives(Iterator input, SerializationRule rule, int length) { |
+ var ruleData = []; |
+ for (var i = 0; i < length; i++) { |
+ ruleData.add(_next(input)); |
+ } |
+ return ruleData; |
+ } |
+ |
+ /** Read the next Reference from the input. */ |
+ Reference nextReferenceFrom(Iterator input, Reader r) { |
+ var a = _next(input); |
+ var b = _next(input); |
+ if (a == null) { |
+ return null; |
+ } else { |
+ return new Reference(r, a, b); |
+ } |
+ } |
+ |
+ /** Return the next element from the input. */ |
+ _next(Iterator input) { |
+ input.moveNext(); |
+ return input.current; |
+ } |
+} |