dyaml/examples/yaml_bench/yaml_bench.d
Cameron Ross e37c4daa7e switch to a non-templated Dumper struct (#234)
switch to a non-templated Dumper struct
merged-on-behalf-of: Basile-z <Basile-z@users.noreply.github.com>
2019-02-07 08:48:50 +01:00

180 lines
5.8 KiB
D

module dyaml.yaml_bench;
//Benchmark that loads, and optionally extracts data from and/or emits a YAML file.
import std.algorithm;
import std.conv;
import std.datetime.systime;
import std.datetime.stopwatch;
import std.file;
import std.getopt;
import std.range;
import std.stdio;
import std.string;
import dyaml;
///Get data out of every node.
/**
 * Get data out of every node.
 *
 * Walks the document recursively. Every scalar is converted to the D type
 * matching its YAML tag via `Node.as`; the converted value is discarded, as
 * the conversion itself is the work being benchmarked. Sequences and mappings
 * are descended into (for mappings, both keys and values are visited).
 *
 * Scalars with a tag not listed below are reported on standard output and
 * otherwise skipped.
 *
 * Params:
 *   document = Root node of the document to traverse.
 */
void extract(ref Node document) @safe
{
    // Visits `root` and, recursively, all of its children.
    void crawl(ref Node root) @safe
    {
        final switch (root.nodeID)
        {
            case NodeID.scalar:
                switch(root.tag)
                {
                    case "tag:yaml.org,2002:null":      auto value = root.as!YAMLNull;  break;
                    case "tag:yaml.org,2002:bool":      auto value = root.as!bool;      break;
                    case "tag:yaml.org,2002:int":       auto value = root.as!long;      break;
                    case "tag:yaml.org,2002:float":     auto value = root.as!real;      break;
                    case "tag:yaml.org,2002:binary":    auto value = root.as!(ubyte[]); break;
                    case "tag:yaml.org,2002:timestamp": auto value = root.as!SysTime;   break;
                    case "tag:yaml.org,2002:str":       auto value = root.as!string;    break;
                    default: writeln("Unrecognized tag: ", root.tag);
                }
                break;
            case NodeID.sequence:
                foreach(ref Node node; root)
                {
                    crawl(node);
                }
                break;
            case NodeID.mapping:
                foreach(ref Node key, ref Node value; root)
                {
                    crawl(key);
                    crawl(value);
                }
                break;
            case NodeID.invalid:
                // An invalid node is treated as a programming error.
                assert(0);
        }
    }
    crawl(document);
}
/**
 * Benchmark entry point.
 *
 * Parses the command line, then runs up to three timed stages `runs` times
 * each: loading (or only scanning) the YAML file, optionally dumping the
 * loaded nodes to `YAML_FILE.dump`, and optionally extracting the data from
 * every loaded node. Unless `--quiet` is given, the timings are printed to
 * standard output.
 *
 * Params:
 *   args = Command-line arguments; after option processing, `args[1]` is the
 *          path of the YAML file to benchmark.
 */
void main(string[] args) //@safe
{
    import std.array : array;

    bool get = false;
    bool dump = false;
    bool reload = false;
    bool quiet = false;
    bool verbose = false;
    bool scanOnly = false;
    uint runs = 1;

    auto help = getopt(
        args,
        "get|g", "Extract data from the file (using Node.as()).", &get,
        "dump|d", "Dump the loaded data (to YAML_FILE.dump).", &dump,
        "runs|r", "Repeat parsing the file NUM times.", &runs,
        "reload", "Reload the file from the disk on every repeat. By default,"~
                  " the file is loaded to memory once and repeatedly parsed from memory.", &reload,
        "quiet|q", "Don't print anything.", &quiet,
        "verbose|v", "Print even more.", &verbose,
        "scan-only|s", "Do not execute the entire parsing process, only scanning. Overrides '--dump'", &scanOnly
    );

    // Show usage when asked for it or when no input file was given.
    if (help.helpWanted || (args.length < 2))
    {
        defaultGetoptPrinter(
            "D:YAML benchmark\n"~
            "Copyright (C) 2011-2018 Ferdinand Majerech, Cameron \"Herringway\" Ross\n"~
            "Usage: yaml_bench [OPTION ...] [YAML_FILE]\n\n"~
            "Loads and optionally extracts data and/or dumps a YAML file.\n",
            help.options
        );
        return;
    }

    string file = args[1];

    // Time the initial read of the file (including the working-copy duplication).
    auto stopWatch = StopWatch(AutoStart.yes);
    void[] fileInMemory;
    if(!reload) { fileInMemory = std.file.read(file); }
    void[] fileWorkingCopy = fileInMemory.dup;
    auto loadTime = stopWatch.peek();
    stopWatch.reset();

    try
    {
        // Instead of constructing a resolver/constructor with each Loader,
        // construct them once to remove noise when profiling.
        auto resolver = Resolver.withDefaultResolvers;
        auto constructTime = stopWatch.peek();

        // Documents produced by the most recent loader run; consumed by the
        // dump and get stages.
        Node[] nodes;

        void runLoaderBenchmark() //@safe
        {
            // Loading the file rewrites the loaded buffer, so if we don't reload from
            // disk, we need to use a copy of the originally loaded file.
            if(reload) { fileInMemory = std.file.read(file); }
            else       { fileWorkingCopy[] = fileInMemory[]; }
            void[] fileToLoad = reload ? fileInMemory : fileWorkingCopy;

            auto loader = Loader.fromBuffer(fileToLoad);
            if(scanOnly)
            {
                loader.scanBench();
                return;
            }

            loader.resolver = resolver;
            nodes = loader.array;
        }

        void runDumpBenchmark() @safe
        {
            if(dump)
            {
                dumper().dump(File(file ~ ".dump", "w").lockingTextWriter, nodes);
            }
        }

        void runGetBenchmark() @safe
        {
            if(get) foreach(ref node; nodes)
            {
                extract(node);
            }
        }

        // One accumulated duration per stage, in the order the stages are listed.
        auto totalTime = benchmark!(runLoaderBenchmark, runDumpBenchmark, runGetBenchmark)(runs);

        if (!quiet)
        {
            auto enabledOptions =
                only(
                    get ? "Get" : "",
                    dump ? "Dump" : "",
                    reload ? "Reload" : "",
                    scanOnly ? "Scan Only": ""
                ).filter!(x => x != "");
            if (!enabledOptions.empty)
            {
                writefln!"Options enabled: %-(%s, %)"(enabledOptions);
            }

            if (verbose)
            {
                if (!reload)
                {
                    writeln("Time to load file: ", loadTime);
                }
                writeln("Time to set up resolver: ", constructTime);
            }

            writeln("Runs: ", runs);
            foreach(time, func, enabled; lockstep(totalTime[], only("Loader", "Dumper", "Get"), only(true, dump, get)))
            {
                if (enabled)
                {
                    // With `--runs 0` there is no average to report; dividing
                    // the duration by zero would crash the program.
                    if (runs > 0)
                    {
                        writeln("Average time spent on ", func, ": ", time / runs);
                    }
                    writeln("Total time spent on ", func, ": ", time);
                }
            }
        }
    }
    catch(YAMLException e)
    {
        writeln("ERROR: ", e.msg);
    }
}