Optimized GC performance when loading,
greatly decreasing memory usage and improving speed by 30% or more.
This commit is contained in:
parent
915428c8ed
commit
9d68b6fa9a
|
@ -29,7 +29,7 @@ links = ../index.html Documentation home
|
||||||
# Source files or patterns to ignore. Supports regexp syntax.
|
# Source files or patterns to ignore. Supports regexp syntax.
|
||||||
# E.g; To ignore main.d and all source files in the test/ directory,
|
# E.g; To ignore main.d and all source files in the test/ directory,
|
||||||
# you would use: "main.d test/*"
|
# you would use: "main.d test/*"
|
||||||
ignore = test/*, examples/*, docsrc/*, autoddoc/*, yaml.d, unittest.d, cdc.d, dyaml/composer.d, dyaml/event.d, dyaml/parser.d, dyaml/reader.d, dyaml/scanner.d, dyaml/token.d, dyaml/util.d, dyaml/anchor.d, dyaml/emitter.d, dyaml/flags.d, dyaml/serializer.d, dyaml/sharedobject.d, dyaml/tag.d, dyaml/tagdirectives.d, dyaml/queue.d
|
ignore = test/*, examples/*, docsrc/*, autoddoc/*, yaml.d, unittest.d, cdc.d, dyaml/composer.d, dyaml/event.d, dyaml/parser.d, dyaml/reader.d, dyaml/scanner.d, dyaml/token.d, dyaml/util.d, dyaml/anchor.d, dyaml/emitter.d, dyaml/flags.d, dyaml/serializer.d, dyaml/sharedobject.d, dyaml/tag.d, dyaml/tagdirectives.d, dyaml/queue.d, dyaml/escapes.d
|
||||||
|
|
||||||
[DDOC]
|
[DDOC]
|
||||||
# Command to use to generate the documentation.
|
# Command to use to generate the documentation.
|
||||||
|
|
|
@ -26,6 +26,7 @@ import std.utf;
|
||||||
|
|
||||||
import dyaml.anchor;
|
import dyaml.anchor;
|
||||||
import dyaml.encoding;
|
import dyaml.encoding;
|
||||||
|
import dyaml.escapes;
|
||||||
import dyaml.event;
|
import dyaml.event;
|
||||||
import dyaml.exception;
|
import dyaml.exception;
|
||||||
import dyaml.flags;
|
import dyaml.flags;
|
||||||
|
@ -1343,23 +1344,6 @@ struct ScalarWriter
|
||||||
///Write text as double quoted scalar.
|
///Write text as double quoted scalar.
|
||||||
void writeDoubleQuoted()
|
void writeDoubleQuoted()
|
||||||
{
|
{
|
||||||
immutable dchar[dchar] escapeReplacements =
|
|
||||||
['\0': '0',
|
|
||||||
'\x07': 'a',
|
|
||||||
'\x08': 'b',
|
|
||||||
'\x09': 't',
|
|
||||||
'\x0A': 'n',
|
|
||||||
'\x0B': 'v',
|
|
||||||
'\x0C': 'f',
|
|
||||||
'\x0D': 'r',
|
|
||||||
'\x1B': 'e',
|
|
||||||
'\"': '\"',
|
|
||||||
'\\': '\\',
|
|
||||||
'\u0085': 'N',
|
|
||||||
'\xA0': '_',
|
|
||||||
'\u2028': 'L',
|
|
||||||
'\u2029': 'P'];
|
|
||||||
|
|
||||||
resetTextPosition();
|
resetTextPosition();
|
||||||
emitter_.writeIndicator("\"", true);
|
emitter_.writeIndicator("\"", true);
|
||||||
do
|
do
|
||||||
|
@ -1377,10 +1361,10 @@ struct ScalarWriter
|
||||||
if(c != dcharNone)
|
if(c != dcharNone)
|
||||||
{
|
{
|
||||||
auto appender = appender!string();
|
auto appender = appender!string();
|
||||||
if((c in escapeReplacements) !is null)
|
if((c in dyaml.escapes.toEscapes) !is null)
|
||||||
{
|
{
|
||||||
appender.put('\\');
|
appender.put('\\');
|
||||||
appender.put(escapeReplacements[c]);
|
appender.put(dyaml.escapes.toEscapes[c]);
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
|
|
61
dyaml/escapes.d
Normal file
61
dyaml/escapes.d
Normal file
|
@ -0,0 +1,61 @@
|
||||||
|
|
||||||
|
|
||||||
|
// Copyright Ferdinand Majerech 2011.
|
||||||
|
// Distributed under the Boost Software License, Version 1.0.
|
||||||
|
// (See accompanying file LICENSE_1_0.txt or copy at
|
||||||
|
// http://www.boost.org/LICENSE_1_0.txt)
|
||||||
|
|
||||||
|
module dyaml.escapes;
|
||||||
|
|
||||||
|
|
||||||
|
package:
|
||||||
|
|
||||||
|
///Translation table from YAML escapes to dchars.
|
||||||
|
dchar[dchar] fromEscapes;
|
||||||
|
///Translation table from dchars to YAML escapes.
|
||||||
|
dchar[dchar] toEscapes;
|
||||||
|
///Translation table from prefixes of escaped hexadecimal format characters to their lengths.
|
||||||
|
uint[dchar] escapeHexCodes;
|
||||||
|
|
||||||
|
|
||||||
|
static this()
|
||||||
|
{
|
||||||
|
fromEscapes =
|
||||||
|
['0': '\0',
|
||||||
|
'a': '\x07',
|
||||||
|
'b': '\x08',
|
||||||
|
't': '\x09',
|
||||||
|
'\t': '\x09',
|
||||||
|
'n': '\x0A',
|
||||||
|
'v': '\x0B',
|
||||||
|
'f': '\x0C',
|
||||||
|
'r': '\x0D',
|
||||||
|
'e': '\x1B',
|
||||||
|
' ': '\x20',
|
||||||
|
'\"': '\"',
|
||||||
|
'\\': '\\',
|
||||||
|
'N': '\u0085',
|
||||||
|
'_': '\xA0',
|
||||||
|
'L': '\u2028',
|
||||||
|
'P': '\u2029'];
|
||||||
|
|
||||||
|
toEscapes =
|
||||||
|
['\0': '0',
|
||||||
|
'\x07': 'a',
|
||||||
|
'\x08': 'b',
|
||||||
|
'\x09': 't',
|
||||||
|
'\x0A': 'n',
|
||||||
|
'\x0B': 'v',
|
||||||
|
'\x0C': 'f',
|
||||||
|
'\x0D': 'r',
|
||||||
|
'\x1B': 'e',
|
||||||
|
'\"': '\"',
|
||||||
|
'\\': '\\',
|
||||||
|
'\u0085': 'N',
|
||||||
|
'\xA0': '_',
|
||||||
|
'\u2028': 'L',
|
||||||
|
'\u2029': 'P'];
|
||||||
|
|
||||||
|
escapeHexCodes = ['x': 2, 'u': 4, 'U': 8];
|
||||||
|
}
|
||||||
|
|
|
@ -183,7 +183,7 @@ Event documentEndEvent(Mark start, Mark end, bool explicit)
|
||||||
* style = Scalar style.
|
* style = Scalar style.
|
||||||
*/
|
*/
|
||||||
Event scalarEvent(in Mark start, in Mark end, in Anchor anchor, in Tag tag,
|
Event scalarEvent(in Mark start, in Mark end, in Anchor anchor, in Tag tag,
|
||||||
in bool[2] implicit, in string value,
|
in Tuple!(bool, bool) implicit, in string value,
|
||||||
in ScalarStyle style = ScalarStyle.Invalid)
|
in ScalarStyle style = ScalarStyle.Invalid)
|
||||||
{
|
{
|
||||||
return Event(value, start, end, anchor, tag, EventID.Scalar, style, implicit[0],
|
return Event(value, start, end, anchor, tag, EventID.Scalar, style, implicit[0],
|
||||||
|
|
11
dyaml/node.d
11
dyaml/node.d
|
@ -1371,5 +1371,14 @@ void merge(ref Node.Pair[] pairs, ref Node.Pair toMerge)
|
||||||
*/
|
*/
|
||||||
void merge(ref Node.Pair[] pairs, Node.Pair[] toMerge)
|
void merge(ref Node.Pair[] pairs, Node.Pair[] toMerge)
|
||||||
{
|
{
|
||||||
foreach(ref pair; toMerge){merge(pairs, pair);}
|
bool eq(ref Node.Pair a, ref Node.Pair b){return a.key == b.key;}
|
||||||
|
|
||||||
|
//Preallocating to limit GC reallocations.
|
||||||
|
auto len = pairs.length;
|
||||||
|
pairs.length = len + toMerge.length;
|
||||||
|
foreach(ref pair; toMerge) if(!canFind!eq(pairs, pair))
|
||||||
|
{
|
||||||
|
pairs[len++] = pair;
|
||||||
|
}
|
||||||
|
pairs.length = len;
|
||||||
}
|
}
|
||||||
|
|
|
@ -12,6 +12,7 @@ module dyaml.parser;
|
||||||
|
|
||||||
|
|
||||||
import std.array;
|
import std.array;
|
||||||
|
import std.container;
|
||||||
import std.conv;
|
import std.conv;
|
||||||
import std.exception;
|
import std.exception;
|
||||||
import std.typecons;
|
import std.typecons;
|
||||||
|
@ -124,9 +125,10 @@ final class Parser
|
||||||
tagDirective[] tagHandles_;
|
tagDirective[] tagHandles_;
|
||||||
|
|
||||||
///Stack of states.
|
///Stack of states.
|
||||||
Event delegate()[] states_;
|
Array!(Event delegate()) states_;
|
||||||
///Stack of marks used to keep track of extents of e.g. YAML collections.
|
///Stack of marks used to keep track of extents of e.g. YAML collections.
|
||||||
Mark[] marks_;
|
Array!Mark marks_;
|
||||||
|
|
||||||
///Current state.
|
///Current state.
|
||||||
Event delegate() state_;
|
Event delegate() state_;
|
||||||
|
|
||||||
|
@ -136,6 +138,8 @@ final class Parser
|
||||||
{
|
{
|
||||||
state_ = &parseStreamStart;
|
state_ = &parseStreamStart;
|
||||||
scanner_ = scanner;
|
scanner_ = scanner;
|
||||||
|
states_.reserve(32);
|
||||||
|
marks_.reserve(32);
|
||||||
}
|
}
|
||||||
|
|
||||||
///Destroy the parser.
|
///Destroy the parser.
|
||||||
|
@ -145,9 +149,7 @@ final class Parser
|
||||||
clear(tagHandles_);
|
clear(tagHandles_);
|
||||||
tagHandles_ = null;
|
tagHandles_ = null;
|
||||||
clear(states_);
|
clear(states_);
|
||||||
states_ = null;
|
|
||||||
clear(marks_);
|
clear(marks_);
|
||||||
marks_ = null;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -228,8 +230,8 @@ final class Parser
|
||||||
{
|
{
|
||||||
enforce(states_.length > 0,
|
enforce(states_.length > 0,
|
||||||
new YAMLException("Parser: Need to pop state but no states left to pop"));
|
new YAMLException("Parser: Need to pop state but no states left to pop"));
|
||||||
const result = states_.back();
|
const result = states_.back;
|
||||||
states_.popBack;
|
states_.length = states_.length - 1;
|
||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -238,8 +240,8 @@ final class Parser
|
||||||
{
|
{
|
||||||
enforce(marks_.length > 0,
|
enforce(marks_.length > 0,
|
||||||
new YAMLException("Parser: Need to pop mark but no marks left to pop"));
|
new YAMLException("Parser: Need to pop mark but no marks left to pop"));
|
||||||
const result = marks_.back();
|
const result = marks_.back;
|
||||||
marks_.popBack;
|
marks_.length = marks_.length - 1;
|
||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -468,7 +470,7 @@ final class Parser
|
||||||
bool implicit_2 = (!implicit) && tag is null;
|
bool implicit_2 = (!implicit) && tag is null;
|
||||||
state_ = popState();
|
state_ = popState();
|
||||||
return scalarEvent(startMark, token.endMark, Anchor(anchor), Tag(tag),
|
return scalarEvent(startMark, token.endMark, Anchor(anchor), Tag(tag),
|
||||||
[implicit, implicit_2], token.value, token.style);
|
tuple(implicit, implicit_2), token.value, token.style);
|
||||||
}
|
}
|
||||||
|
|
||||||
if(scanner_.checkToken(TokenID.FlowSequenceStart))
|
if(scanner_.checkToken(TokenID.FlowSequenceStart))
|
||||||
|
@ -512,7 +514,7 @@ final class Parser
|
||||||
|
|
||||||
//Empty scalars are allowed even if a tag or an anchor is specified.
|
//Empty scalars are allowed even if a tag or an anchor is specified.
|
||||||
return scalarEvent(startMark, endMark, Anchor(anchor), Tag(tag),
|
return scalarEvent(startMark, endMark, Anchor(anchor), Tag(tag),
|
||||||
[implicit, false] , "");
|
tuple(implicit, false) , "");
|
||||||
}
|
}
|
||||||
|
|
||||||
immutable token = scanner_.peekToken();
|
immutable token = scanner_.peekToken();
|
||||||
|
@ -585,7 +587,7 @@ final class Parser
|
||||||
if(!scanner_.checkToken(TokenID.BlockEnd))
|
if(!scanner_.checkToken(TokenID.BlockEnd))
|
||||||
{
|
{
|
||||||
immutable token = scanner_.peekToken();
|
immutable token = scanner_.peekToken();
|
||||||
throw new Error("While parsing a block collection", marks_[$ - 1],
|
throw new Error("While parsing a block collection", marks_.back,
|
||||||
"expected block end, but found " ~ token.idString,
|
"expected block end, but found " ~ token.idString,
|
||||||
token.startMark);
|
token.startMark);
|
||||||
}
|
}
|
||||||
|
@ -650,7 +652,7 @@ final class Parser
|
||||||
if(!scanner_.checkToken(TokenID.BlockEnd))
|
if(!scanner_.checkToken(TokenID.BlockEnd))
|
||||||
{
|
{
|
||||||
immutable token = scanner_.peekToken();
|
immutable token = scanner_.peekToken();
|
||||||
throw new Error("While parsing a block mapping", marks_[$ - 1],
|
throw new Error("While parsing a block mapping", marks_.back,
|
||||||
"expected block end, but found: " ~ token.idString,
|
"expected block end, but found: " ~ token.idString,
|
||||||
token.startMark);
|
token.startMark);
|
||||||
}
|
}
|
||||||
|
@ -711,7 +713,7 @@ final class Parser
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
immutable token = scanner_.peekToken;
|
immutable token = scanner_.peekToken;
|
||||||
throw new Error("While parsing a flow sequence", marks_[$ - 1],
|
throw new Error("While parsing a flow sequence", marks_.back,
|
||||||
"expected ',' or ']', but got: " ~
|
"expected ',' or ']', but got: " ~
|
||||||
token.idString, token.startMark);
|
token.idString, token.startMark);
|
||||||
}
|
}
|
||||||
|
@ -818,7 +820,7 @@ final class Parser
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
immutable token = scanner_.peekToken;
|
immutable token = scanner_.peekToken;
|
||||||
throw new Error("While parsing a flow mapping", marks_[$ - 1],
|
throw new Error("While parsing a flow mapping", marks_.back,
|
||||||
"expected ',' or '}', but got: " ~
|
"expected ',' or '}', but got: " ~
|
||||||
token.idString, token.startMark);
|
token.idString, token.startMark);
|
||||||
}
|
}
|
||||||
|
@ -860,6 +862,6 @@ final class Parser
|
||||||
{
|
{
|
||||||
//PyYAML uses a Tuple!(true, false) for the second last arg here,
|
//PyYAML uses a Tuple!(true, false) for the second last arg here,
|
||||||
//but the second bool is never used after that - so we don't use it.
|
//but the second bool is never used after that - so we don't use it.
|
||||||
return scalarEvent(mark, mark, Anchor(), Tag(), [true, false], "");
|
return scalarEvent(mark, mark, Anchor(), Tag(), tuple(true, false), "");
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -138,8 +138,11 @@ final class Reader
|
||||||
{
|
{
|
||||||
updateBuffer(index + 1);
|
updateBuffer(index + 1);
|
||||||
|
|
||||||
enforce(buffer_.length >= bufferOffset_ + index + 1,
|
if(buffer_.length < bufferOffset_ + index + 1)
|
||||||
new ReaderException("Trying to read past the end of the stream"));
|
{
|
||||||
|
throw new ReaderException("Trying to read past the end of the stream");
|
||||||
|
}
|
||||||
|
|
||||||
return buffer_[bufferOffset_ + index];
|
return buffer_[bufferOffset_ + index];
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -205,6 +208,8 @@ final class Reader
|
||||||
*/
|
*/
|
||||||
void forward(size_t length = 1)
|
void forward(size_t length = 1)
|
||||||
{
|
{
|
||||||
|
//This is here due to optimization.
|
||||||
|
static newlines = "\n\u0085\u2028\u2029";
|
||||||
updateBuffer(length + 1);
|
updateBuffer(length + 1);
|
||||||
|
|
||||||
while(length > 0)
|
while(length > 0)
|
||||||
|
@ -212,9 +217,8 @@ final class Reader
|
||||||
const c = buffer_[bufferOffset_];
|
const c = buffer_[bufferOffset_];
|
||||||
++bufferOffset_;
|
++bufferOffset_;
|
||||||
++charIndex_;
|
++charIndex_;
|
||||||
//new line
|
//New line.
|
||||||
if(['\n', '\u0085', '\u2028', '\u2029'].canFind(c) ||
|
if(newlines.canFind(c) || (c == '\r' && buffer_[bufferOffset_] != '\n'))
|
||||||
(c == '\r' && buffer_[bufferOffset_] != '\n'))
|
|
||||||
{
|
{
|
||||||
++line_;
|
++line_;
|
||||||
column_ = 0;
|
column_ = 0;
|
||||||
|
@ -246,7 +250,7 @@ final class Reader
|
||||||
* If there are not enough characters in the stream, it will get
|
* If there are not enough characters in the stream, it will get
|
||||||
* as many as possible.
|
* as many as possible.
|
||||||
*
|
*
|
||||||
* Params: length = Number of characters we need to read.
|
* Params: length = Mimimum number of characters we need to read.
|
||||||
*
|
*
|
||||||
* Throws: ReaderException if trying to read past the end of the stream
|
* Throws: ReaderException if trying to read past the end of the stream
|
||||||
* or if invalid data is read.
|
* or if invalid data is read.
|
||||||
|
@ -265,10 +269,10 @@ final class Reader
|
||||||
bufferOffset_ = 0;
|
bufferOffset_ = 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
////load chars in batches of at most 64 bytes
|
////Load chars in batches of at most 1024 bytes (256 chars)
|
||||||
while(buffer_.length <= bufferOffset_ + length)
|
while(buffer_.length <= bufferOffset_ + length)
|
||||||
{
|
{
|
||||||
loadChars(16);
|
loadChars(256);
|
||||||
|
|
||||||
if(done)
|
if(done)
|
||||||
{
|
{
|
||||||
|
@ -290,10 +294,8 @@ final class Reader
|
||||||
* if nonprintable characters are detected, or
|
* if nonprintable characters are detected, or
|
||||||
* if there is an error reading from the stream.
|
* if there is an error reading from the stream.
|
||||||
*/
|
*/
|
||||||
void loadChars(in uint chars)
|
void loadChars(uint chars)
|
||||||
{
|
{
|
||||||
const oldLength = buffer_.length;
|
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Get next character from the stream.
|
* Get next character from the stream.
|
||||||
*
|
*
|
||||||
|
@ -369,15 +371,25 @@ final class Reader
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
const oldLength = buffer_.length;
|
||||||
const oldPosition = stream_.position;
|
const oldPosition = stream_.position;
|
||||||
try
|
|
||||||
|
|
||||||
|
//Preallocating memory to limit GC reallocations.
|
||||||
|
buffer_.length = buffer_.length + chars;
|
||||||
|
scope(exit)
|
||||||
{
|
{
|
||||||
foreach(i; 0 .. chars)
|
buffer_.length = buffer_.length - chars;
|
||||||
|
|
||||||
|
enforce(printable(buffer_[oldLength .. $]),
|
||||||
|
new ReaderException("Special unicode characters are not allowed"));
|
||||||
|
}
|
||||||
|
|
||||||
|
try for(uint c = 0; chars; --chars, ++c)
|
||||||
{
|
{
|
||||||
if(done){break;}
|
if(done){break;}
|
||||||
const available = stream_.available;
|
const available = stream_.available;
|
||||||
buffer_ ~= getDChar(available);
|
buffer_[oldLength + c] = getDChar(available);
|
||||||
}
|
|
||||||
}
|
}
|
||||||
catch(UtfException e)
|
catch(UtfException e)
|
||||||
{
|
{
|
||||||
|
@ -389,9 +401,6 @@ final class Reader
|
||||||
{
|
{
|
||||||
throw new ReaderException(e.msg);
|
throw new ReaderException(e.msg);
|
||||||
}
|
}
|
||||||
|
|
||||||
enforce(printable(buffer_[oldLength .. $]),
|
|
||||||
new ReaderException("Special unicode characters are not allowed"));
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
|
131
dyaml/scanner.d
131
dyaml/scanner.d
|
@ -22,6 +22,7 @@ import std.string;
|
||||||
import std.typecons;
|
import std.typecons;
|
||||||
import std.utf;
|
import std.utf;
|
||||||
|
|
||||||
|
import dyaml.escapes;
|
||||||
import dyaml.exception;
|
import dyaml.exception;
|
||||||
import dyaml.queue;
|
import dyaml.queue;
|
||||||
import dyaml.reader;
|
import dyaml.reader;
|
||||||
|
@ -140,12 +141,16 @@ final class Scanner
|
||||||
///Possible simple keys indexed by flow levels.
|
///Possible simple keys indexed by flow levels.
|
||||||
SimpleKey[uint] possibleSimpleKeys_;
|
SimpleKey[uint] possibleSimpleKeys_;
|
||||||
|
|
||||||
|
///Used for constructing strings while limiting reallocation.
|
||||||
|
Appender!(dchar[]) appender_;
|
||||||
|
|
||||||
public:
|
public:
|
||||||
///Construct a Scanner using specified Reader.
|
///Construct a Scanner using specified Reader.
|
||||||
this(Reader reader)
|
this(Reader reader)
|
||||||
{
|
{
|
||||||
//Return the next token, but do not delete it from the queue
|
//Return the next token, but do not delete it from the queue
|
||||||
reader_ = reader;
|
reader_ = reader;
|
||||||
|
appender_ = appender!(dchar[])();
|
||||||
fetchStreamStart();
|
fetchStreamStart();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -156,6 +161,7 @@ final class Scanner
|
||||||
clear(indents_);
|
clear(indents_);
|
||||||
indents_ = null;
|
indents_ = null;
|
||||||
clear(possibleSimpleKeys_);
|
clear(possibleSimpleKeys_);
|
||||||
|
clear(appender_);
|
||||||
possibleSimpleKeys_ = null;
|
possibleSimpleKeys_ = null;
|
||||||
reader_ = null;
|
reader_ = null;
|
||||||
}
|
}
|
||||||
|
@ -412,8 +418,7 @@ final class Scanner
|
||||||
removePossibleSimpleKey();
|
removePossibleSimpleKey();
|
||||||
allowSimpleKey_ = false;
|
allowSimpleKey_ = false;
|
||||||
//There's probably a saner way to clear an associated array than this.
|
//There's probably a saner way to clear an associated array than this.
|
||||||
SimpleKey[uint] empty;
|
clear(possibleSimpleKeys_);
|
||||||
possibleSimpleKeys_ = empty;
|
|
||||||
|
|
||||||
tokens_.push(streamEndToken(reader_.mark, reader_.mark));
|
tokens_.push(streamEndToken(reader_.mark, reader_.mark));
|
||||||
done_ = true;
|
done_ = true;
|
||||||
|
@ -1066,15 +1071,15 @@ final class Scanner
|
||||||
|
|
||||||
dstring lineBreak = "";
|
dstring lineBreak = "";
|
||||||
|
|
||||||
//Used to construct the result.
|
//Using appender_, so clear it when we're done.
|
||||||
auto appender = appender!string();
|
scope(exit){appender_.clear();}
|
||||||
|
|
||||||
//Scan the inner part of the block scalar.
|
//Scan the inner part of the block scalar.
|
||||||
while(reader_.column == indent && reader_.peek() != '\0')
|
while(reader_.column == indent && reader_.peek() != '\0')
|
||||||
{
|
{
|
||||||
appender.put(breaks);
|
appender_.put(breaks);
|
||||||
const bool leadingNonSpace = !" \t".canFind(reader_.peek());
|
const bool leadingNonSpace = !" \t".canFind(reader_.peek());
|
||||||
appender.put(scanToNextBreak());
|
appender_.put(scanToNextBreak());
|
||||||
lineBreak = ""d ~ scanLineBreak();
|
lineBreak = ""d ~ scanLineBreak();
|
||||||
|
|
||||||
auto scalarBreaks = scanBlockScalarBreaks(indent);
|
auto scalarBreaks = scanBlockScalarBreaks(indent);
|
||||||
|
@ -1089,9 +1094,9 @@ final class Scanner
|
||||||
if(style == ScalarStyle.Folded && lineBreak == "\n" &&
|
if(style == ScalarStyle.Folded && lineBreak == "\n" &&
|
||||||
leadingNonSpace && !" \t".canFind(reader_.peek()))
|
leadingNonSpace && !" \t".canFind(reader_.peek()))
|
||||||
{
|
{
|
||||||
if(breaks.length == 0){appender.put(' ');}
|
if(breaks.length == 0){appender_.put(' ');}
|
||||||
}
|
}
|
||||||
else{appender.put(lineBreak);}
|
else{appender_.put(lineBreak);}
|
||||||
////this is Clark Evans's interpretation (also in the spec
|
////this is Clark Evans's interpretation (also in the spec
|
||||||
////examples):
|
////examples):
|
||||||
//
|
//
|
||||||
|
@ -1099,18 +1104,18 @@ final class Scanner
|
||||||
//{
|
//{
|
||||||
// if(breaks.length == 0)
|
// if(breaks.length == 0)
|
||||||
// {
|
// {
|
||||||
// if(!" \t"d.canFind(reader_.peek())){appender.put(' ');}
|
// if(!" \t"d.canFind(reader_.peek())){appender_.put(' ');}
|
||||||
// else{chunks ~= lineBreak;}
|
// else{chunks ~= lineBreak;}
|
||||||
// }
|
// }
|
||||||
//}
|
//}
|
||||||
//else{appender.put(lineBreak);}
|
//else{appender_.put(lineBreak);}
|
||||||
}
|
}
|
||||||
else{break;}
|
else{break;}
|
||||||
}
|
}
|
||||||
if(chomping != Chomping.Strip){appender.put(lineBreak);}
|
if(chomping != Chomping.Strip){appender_.put(lineBreak);}
|
||||||
if(chomping == Chomping.Keep){appender.put(breaks);}
|
if(chomping == Chomping.Keep){appender_.put(breaks);}
|
||||||
|
|
||||||
return scalarToken(startMark, endMark, to!string(appender.data), style);
|
return scalarToken(startMark, endMark, to!string(cast(dstring)appender_.data), style);
|
||||||
}
|
}
|
||||||
|
|
||||||
///Scan chomping and indentation indicators of a scalar token.
|
///Scan chomping and indentation indicators of a scalar token.
|
||||||
|
@ -1214,45 +1219,25 @@ final class Scanner
|
||||||
const startMark = reader_.mark;
|
const startMark = reader_.mark;
|
||||||
const quote = reader_.get();
|
const quote = reader_.get();
|
||||||
|
|
||||||
auto appender = appender!dstring();
|
//Using appender_, so clear it when we're done.
|
||||||
appender.put(scanFlowScalarNonSpaces(quotes, startMark));
|
scope(exit){appender_.clear();}
|
||||||
|
|
||||||
|
//Puts scanned data to appender_.
|
||||||
|
scanFlowScalarNonSpaces(quotes, startMark);
|
||||||
while(reader_.peek() != quote)
|
while(reader_.peek() != quote)
|
||||||
{
|
{
|
||||||
appender.put(scanFlowScalarSpaces(startMark));
|
//Puts scanned data to appender_.
|
||||||
appender.put(scanFlowScalarNonSpaces(quotes, startMark));
|
scanFlowScalarSpaces(startMark);
|
||||||
|
scanFlowScalarNonSpaces(quotes, startMark);
|
||||||
}
|
}
|
||||||
reader_.forward();
|
reader_.forward();
|
||||||
|
|
||||||
return scalarToken(startMark, reader_.mark, to!string(appender.data), quotes);
|
return scalarToken(startMark, reader_.mark, to!string(cast(dstring)appender_.data), quotes);
|
||||||
}
|
}
|
||||||
|
|
||||||
///Scan nonspace characters in a flow scalar.
|
///Scan nonspace characters in a flow scalar.
|
||||||
dstring scanFlowScalarNonSpaces(ScalarStyle quotes, in Mark startMark)
|
void scanFlowScalarNonSpaces(ScalarStyle quotes, in Mark startMark)
|
||||||
{
|
{
|
||||||
dchar[dchar] escapeReplacements =
|
|
||||||
['0': '\0',
|
|
||||||
'a': '\x07',
|
|
||||||
'b': '\x08',
|
|
||||||
't': '\x09',
|
|
||||||
'\t': '\x09',
|
|
||||||
'n': '\x0A',
|
|
||||||
'v': '\x0B',
|
|
||||||
'f': '\x0C',
|
|
||||||
'r': '\x0D',
|
|
||||||
'e': '\x1B',
|
|
||||||
' ': '\x20',
|
|
||||||
'\"': '\"',
|
|
||||||
'\\': '\\',
|
|
||||||
'N': '\u0085',
|
|
||||||
'_': '\xA0',
|
|
||||||
'L': '\u2028',
|
|
||||||
'P': '\u2029'];
|
|
||||||
|
|
||||||
uint[dchar] escapeCodes = ['x': 2, 'u': 4, 'U': 8];
|
|
||||||
|
|
||||||
//Can't use an Appender due to a Phobos bug, so appending to a string.
|
|
||||||
dstring result;
|
|
||||||
|
|
||||||
for(;;)
|
for(;;)
|
||||||
{
|
{
|
||||||
dchar c = reader_.peek();
|
dchar c = reader_.peek();
|
||||||
|
@ -1263,33 +1248,33 @@ final class Scanner
|
||||||
c = reader_.peek(length);
|
c = reader_.peek(length);
|
||||||
}
|
}
|
||||||
|
|
||||||
if(length > 0){result ~= reader_.get(length);}
|
if(length > 0){appender_.put(reader_.get(length));}
|
||||||
|
|
||||||
c = reader_.peek();
|
c = reader_.peek();
|
||||||
if(quotes == ScalarStyle.SingleQuoted &&
|
if(quotes == ScalarStyle.SingleQuoted &&
|
||||||
c == '\'' && reader_.peek(1) == '\'')
|
c == '\'' && reader_.peek(1) == '\'')
|
||||||
{
|
{
|
||||||
result ~= '\'';
|
appender_.put('\'');
|
||||||
reader_.forward(2);
|
reader_.forward(2);
|
||||||
}
|
}
|
||||||
else if((quotes == ScalarStyle.DoubleQuoted && c == '\'') ||
|
else if((quotes == ScalarStyle.DoubleQuoted && c == '\'') ||
|
||||||
(quotes == ScalarStyle.SingleQuoted && "\"\\".canFind(c)))
|
(quotes == ScalarStyle.SingleQuoted && "\"\\".canFind(c)))
|
||||||
{
|
{
|
||||||
result ~= c;
|
appender_.put(c);
|
||||||
reader_.forward();
|
reader_.forward();
|
||||||
}
|
}
|
||||||
else if(quotes == ScalarStyle.DoubleQuoted && c == '\\')
|
else if(quotes == ScalarStyle.DoubleQuoted && c == '\\')
|
||||||
{
|
{
|
||||||
reader_.forward();
|
reader_.forward();
|
||||||
c = reader_.peek();
|
c = reader_.peek();
|
||||||
if((c in escapeReplacements) !is null)
|
if((c in dyaml.escapes.fromEscapes) !is null)
|
||||||
{
|
{
|
||||||
result ~= escapeReplacements[c];
|
appender_.put(dyaml.escapes.fromEscapes[c]);
|
||||||
reader_.forward();
|
reader_.forward();
|
||||||
}
|
}
|
||||||
else if((c in escapeCodes) !is null)
|
else if((c in dyaml.escapes.escapeHexCodes) !is null)
|
||||||
{
|
{
|
||||||
length = escapeCodes[c];
|
length = dyaml.escapes.escapeHexCodes[c];
|
||||||
reader_.forward();
|
reader_.forward();
|
||||||
|
|
||||||
foreach(i; 0 .. length)
|
foreach(i; 0 .. length)
|
||||||
|
@ -1303,12 +1288,12 @@ final class Scanner
|
||||||
}
|
}
|
||||||
|
|
||||||
dstring hex = reader_.get(length);
|
dstring hex = reader_.get(length);
|
||||||
result ~= cast(dchar)parse!int(hex, 16);
|
appender_.put(cast(dchar)parse!int(hex, 16));
|
||||||
}
|
}
|
||||||
else if("\n\r\u0085\u2028\u2029".canFind(c))
|
else if("\n\r\u0085\u2028\u2029".canFind(c))
|
||||||
{
|
{
|
||||||
scanLineBreak();
|
scanLineBreak();
|
||||||
result ~= scanFlowScalarBreaks(startMark);
|
appender_.put(scanFlowScalarBreaks(startMark));
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
|
@ -1318,12 +1303,15 @@ final class Scanner
|
||||||
to!string(c), reader_.mark);
|
to!string(c), reader_.mark);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else{return result;}
|
else
|
||||||
|
{
|
||||||
|
return;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
///Scan space characters in a flow scalar.
|
///Scan space characters in a flow scalar.
|
||||||
dstring scanFlowScalarSpaces(in Mark startMark)
|
void scanFlowScalarSpaces(in Mark startMark)
|
||||||
{
|
{
|
||||||
uint length = 0;
|
uint length = 0;
|
||||||
while(" \t".canFind(reader_.peek(length))){++length;}
|
while(" \t".canFind(reader_.peek(length))){++length;}
|
||||||
|
@ -1334,18 +1322,16 @@ final class Scanner
|
||||||
new Error("While scanning a quoted scalar", startMark,
|
new Error("While scanning a quoted scalar", startMark,
|
||||||
"found unexpected end of stream", reader_.mark));
|
"found unexpected end of stream", reader_.mark));
|
||||||
|
|
||||||
auto appender = appender!dstring();
|
|
||||||
if("\n\r\u0085\u2028\u2029".canFind(c))
|
if("\n\r\u0085\u2028\u2029".canFind(c))
|
||||||
{
|
{
|
||||||
const lineBreak = scanLineBreak();
|
const lineBreak = scanLineBreak();
|
||||||
const breaks = scanFlowScalarBreaks(startMark);
|
const breaks = scanFlowScalarBreaks(startMark);
|
||||||
|
|
||||||
if(lineBreak != '\n'){appender.put(lineBreak);}
|
if(lineBreak != '\n'){appender_.put(lineBreak);}
|
||||||
else if(breaks.length == 0){appender.put(' ');}
|
else if(breaks.length == 0){appender_.put(' ');}
|
||||||
appender.put(breaks);
|
appender_.put(breaks);
|
||||||
}
|
}
|
||||||
else{appender.put(whitespaces);}
|
else{appender_.put(whitespaces);}
|
||||||
return appender.data;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
///Scan line breaks in a flow scalar.
|
///Scan line breaks in a flow scalar.
|
||||||
|
@ -1378,7 +1364,8 @@ final class Scanner
|
||||||
{
|
{
|
||||||
//We keep track of the allowSimpleKey_ flag here.
|
//We keep track of the allowSimpleKey_ flag here.
|
||||||
//Indentation rules are loosed for the flow context
|
//Indentation rules are loosed for the flow context
|
||||||
auto appender = appender!dstring();
|
//Using appender_, so clear it when we're done.
|
||||||
|
scope(exit){appender_.clear();}
|
||||||
const startMark = reader_.mark;
|
const startMark = reader_.mark;
|
||||||
Mark endMark = startMark;
|
Mark endMark = startMark;
|
||||||
const indent = indent_ + 1;
|
const indent = indent_ + 1;
|
||||||
|
@ -1420,8 +1407,8 @@ final class Scanner
|
||||||
if(length == 0){break;}
|
if(length == 0){break;}
|
||||||
allowSimpleKey_ = false;
|
allowSimpleKey_ = false;
|
||||||
|
|
||||||
appender.put(spaces);
|
appender_.put(spaces);
|
||||||
appender.put(reader_.get(length));
|
appender_.put(reader_.get(length));
|
||||||
|
|
||||||
endMark = reader_.mark;
|
endMark = reader_.mark;
|
||||||
|
|
||||||
|
@ -1432,7 +1419,7 @@ final class Scanner
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
return scalarToken(startMark, endMark, to!string(appender.data), ScalarStyle.Plain);
|
return scalarToken(startMark, endMark, to!string(cast(dstring)appender_.data), ScalarStyle.Plain);
|
||||||
}
|
}
|
||||||
|
|
||||||
///Scan spaces in a plain scalar.
|
///Scan spaces in a plain scalar.
|
||||||
|
@ -1516,7 +1503,8 @@ final class Scanner
|
||||||
dstring scanTagURI(string name, in Mark startMark)
|
dstring scanTagURI(string name, in Mark startMark)
|
||||||
{
|
{
|
||||||
//Note: we do not check if URI is well-formed.
|
//Note: we do not check if URI is well-formed.
|
||||||
auto appender = appender!dstring();
|
//Using appender_, so clear it when we're done.
|
||||||
|
scope(exit){appender_.clear();}
|
||||||
uint length = 0;
|
uint length = 0;
|
||||||
|
|
||||||
dchar c = reader_.peek();
|
dchar c = reader_.peek();
|
||||||
|
@ -1524,23 +1512,23 @@ final class Scanner
|
||||||
{
|
{
|
||||||
if(c == '%')
|
if(c == '%')
|
||||||
{
|
{
|
||||||
appender.put(reader_.get(length));
|
appender_.put(reader_.get(length));
|
||||||
length = 0;
|
length = 0;
|
||||||
appender.put(scanURIEscapes(name, startMark));
|
appender_.put(scanURIEscapes(name, startMark));
|
||||||
}
|
}
|
||||||
else{++length;}
|
else{++length;}
|
||||||
c = reader_.peek(length);
|
c = reader_.peek(length);
|
||||||
}
|
}
|
||||||
if(length > 0)
|
if(length > 0)
|
||||||
{
|
{
|
||||||
appender.put(reader_.get(length));
|
appender_.put(reader_.get(length));
|
||||||
length = 0;
|
length = 0;
|
||||||
}
|
}
|
||||||
enforce(appender.data.length > 0,
|
enforce(appender_.data.length > 0,
|
||||||
new Error("While parsing a " ~ name, startMark,
|
new Error("While parsing a " ~ name, startMark,
|
||||||
"expected URI, but found: " ~ to!string(c), reader_.mark));
|
"expected URI, but found: " ~ to!string(c), reader_.mark));
|
||||||
|
|
||||||
return appender.data;
|
return cast(dstring)appender_.data;
|
||||||
}
|
}
|
||||||
|
|
||||||
///Scan URI escape sequences.
|
///Scan URI escape sequences.
|
||||||
|
@ -1606,8 +1594,7 @@ final class Scanner
|
||||||
{
|
{
|
||||||
const c = reader_.peek();
|
const c = reader_.peek();
|
||||||
|
|
||||||
dchar[] plainLineBreaks = ['\r', '\n', '\u0085'];
|
if("\r\n\u0085".canFind(c))
|
||||||
if(plainLineBreaks.canFind(c))
|
|
||||||
{
|
{
|
||||||
if(reader_.prefix(2) == "\r\n"){reader_.forward(2);}
|
if(reader_.prefix(2) == "\r\n"){reader_.forward(2);}
|
||||||
else{reader_.forward();}
|
else{reader_.forward();}
|
||||||
|
|
|
@ -13,6 +13,7 @@ module dyaml.serializer;
|
||||||
|
|
||||||
import std.array;
|
import std.array;
|
||||||
import std.format;
|
import std.format;
|
||||||
|
import std.typecons;
|
||||||
|
|
||||||
import dyaml.anchor;
|
import dyaml.anchor;
|
||||||
import dyaml.emitter;
|
import dyaml.emitter;
|
||||||
|
@ -193,12 +194,13 @@ struct Serializer
|
||||||
{
|
{
|
||||||
assert(node.isType!string, "Scalar node type must be string before serialized");
|
assert(node.isType!string, "Scalar node type must be string before serialized");
|
||||||
auto value = node.as!string;
|
auto value = node.as!string;
|
||||||
Tag detectedTag = resolver_.resolve(NodeID.Scalar, Tag(null), value, true);
|
const Tag detectedTag = resolver_.resolve(NodeID.Scalar, Tag(null), value, true);
|
||||||
Tag defaultTag = resolver_.resolve(NodeID.Scalar, Tag(null), value, false);
|
const Tag defaultTag = resolver_.resolve(NodeID.Scalar, Tag(null), value, false);
|
||||||
|
bool isDetected = node.tag_ == detectedTag;
|
||||||
|
bool isDefault = node.tag_ == defaultTag;
|
||||||
|
|
||||||
emitter_.emit(scalarEvent(Mark(), Mark(), aliased, node.tag_,
|
emitter_.emit(scalarEvent(Mark(), Mark(), aliased, node.tag_,
|
||||||
[node.tag_ == detectedTag, node.tag_ == defaultTag],
|
tuple(isDetected, isDefault), value, ScalarStyle.Invalid));
|
||||||
value, ScalarStyle.Invalid));
|
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
if(node.isSequence)
|
if(node.isSequence)
|
||||||
|
|
|
@ -10,6 +10,7 @@ module dyaml.testemitter;
|
||||||
import std.algorithm;
|
import std.algorithm;
|
||||||
import std.file;
|
import std.file;
|
||||||
import std.range;
|
import std.range;
|
||||||
|
import std.typecons;
|
||||||
|
|
||||||
import dyaml.dumper;
|
import dyaml.dumper;
|
||||||
import dyaml.event;
|
import dyaml.event;
|
||||||
|
@ -163,7 +164,7 @@ void testEmitterStyles(bool verbose, string dataFilename, string canonicalFilena
|
||||||
if(event.id == EventID.Scalar)
|
if(event.id == EventID.Scalar)
|
||||||
{
|
{
|
||||||
event = scalarEvent(Mark(), Mark(), event.anchor, event.tag,
|
event = scalarEvent(Mark(), Mark(), event.anchor, event.tag,
|
||||||
[event.implicit, event.implicit_2],
|
tuple(event.implicit, event.implicit_2),
|
||||||
event.value, style);
|
event.value, style);
|
||||||
}
|
}
|
||||||
else if(event.id == EventID.SequenceStart)
|
else if(event.id == EventID.SequenceStart)
|
||||||
|
|
Loading…
Reference in a new issue