UNPKG

graphy/cli.js

Version:
51.2 kBJavaScriptView Raw
#!/usr/bin/env node


/* eslint-disable global-require */
/* eslint-disable no-console */
6
/**
 * Removes the common leading indentation from a multi-line string.
 *
 * The indentation is measured on the first line that remains after dropping
 * one leading blank line, and is then stripped after every newline.
 *
 * @param {string} s_text - text to un-indent
 * @param {string} [s_indent=''] - prefix for the result; its trimmed form is
 *   also inserted after each newline that had the measured indentation
 * @returns {string} the trimmed, un-indented text prefixed with `s_indent`
 */
const gobble = (s_text, s_indent='') => {
	// measure leading whitespace, ignoring an initial blank line
	const m_pad = /^(\s+)/.exec(s_text.replace(/^([ \t]*\n)/, ''));

	// text is not indented; just trim it
	if(!m_pad) return s_indent+s_text.trim();

	// strip the measured indentation after every newline
	return s_indent+s_text.replace(new RegExp(`\\n${m_pad[1]}`, 'g'), '\n'+s_indent.trim()).trim();
};
16
17const fs =require('fs');
18const path = require('path');
19const yargs = require('yargs');
20const mk_yargs = require('yargs/yargs');
21const graphy = require('./api.js');
22const factory = require('@graphy/core.data.factory');
23const stream = require('@graphy/core.iso.stream');
24const dataset_tree = require('@graphy/memory.dataset.fast');
25
26const parse_filter = require('./quad-expression.js').parse;
27const expression_handler = require('./expression-handler.js');
28
/**
 * Replacement `pipe` method installed on quad streams (see `bypass` and
 * `map_streams`). Inserts an adapter when the destination needs one and
 * otherwise defers to the stream class's own `pipe`.
 *
 * @this {object} the source stream this function was installed on
 * @param {object} ds_out - destination stream
 * @param {object} [gc_pipe] - pipe options (e.g. `{end:false}`); forwarded to
 *   the pipe that reaches the destination so callers' options are honoured
 * @returns {object} whatever the final `pipe` call returns
 */
const F_ADAPT_STREAM = function(ds_out, gc_pipe) {
	const ds_dst = ds_out;

	// adapter to place between this stream and the destination
	let ds_adapter;

	// non-object mode
	if(!ds_dst._writableState.objectMode) {
		// transform to JSON
		ds_adapter = stream.quads_to_json();
	}
	// yes object mode and graphy writable
	else if(ds_dst.isGraphyWritable) {
		// transform to writable data events
		ds_adapter = stream.quads_to_writable();
	}
	// forward as-is to super
	else {
		return this.constructor.prototype.pipe.call(this, ds_dst, gc_pipe);
	}

	// forward output to super; the adapter ends together with this stream
	this.constructor.prototype.pipe.call(this, ds_adapter);

	// pipe adapter to destination, honouring the caller's options
	return ds_adapter.pipe(ds_dst, gc_pipe);
};
53
/**
 * Passes the inputs through unchanged, apart from installing the adapting
 * `pipe` on each of them.
 *
 * @param {object[]} a_inputs - input streams (each is mutated in place)
 * @returns {object[]} the same stream objects, in the same order
 */
const bypass = a_inputs => a_inputs.map((ds_input) => {
	// intercept pipe
	ds_input.pipe = F_ADAPT_STREAM;

	return ds_input;
});
60
/**
 * Creates one step stream per input, installs the adapting `pipe` on the
 * step and pipes the input into it.
 *
 * @param {object[]} a_inputs - input streams
 * @param {function(object): object} f_map - called with each input; returns
 *   the step stream for that input
 * @returns {object[]} the return value of each `input.pipe(step)` call
 */
const map_streams = (a_inputs, f_map) => a_inputs.map((ds_input) => {
	const ds_output = f_map(ds_input);

	// intercept pipe
	ds_output.pipe = F_ADAPT_STREAM;

	// pipe input to step and return step
	return ds_input.pipe(ds_output);
});
70
/**
 * Converts a value returned by a user callback into a term.
 *
 * @param {string|object} z_term - a concise-term (c1) string or a term object
 * @param {object} h_prefixes - prefix map handed to `factory.c1` for strings
 * @returns {object} result of `factory.c1` (strings) or `factory.fromTerm`
 */
const warp_term = (z_term, h_prefixes) => {
	// c1 string
	if('string' === typeof z_term) {
		return factory.c1(z_term, h_prefixes);
	}

	// normalize term
	return factory.fromTerm(z_term);
};
81
/**
 * Interprets a value returned by the `transform` callback and pushes the
 * quads it describes onto the transform stream.
 *
 * Accepted shapes, checked in this order:
 *  - array whose first element is an array: each element is interpreted
 *    recursively; the callback fires once all of them have completed
 *  - array of 3 or 4 terms: pushed as a single quad
 *  - string: read as TriG, pushing every quad the reader emits
 *  - object with `subject`, `predicate` and `object`: pushed as a quad
 *  - any other iterable: each yielded item is pushed as-is
 * Anything else terminates the process via `exit`. Empty arrays, and arrays
 * of any other length, push nothing.
 *
 * @param {*} z_item - value returned by the user callback
 * @param {object} h_prefixes - prefix map used to expand c1 strings
 * @param {object} ds_transform - stream that receives the quads via `push`
 * @param {function} fke_transform - completion callback; invoked exactly once
 *   per call on the paths visible here (asynchronously for the nested-array
 *   and TriG cases)
 */
const interpret_item = (z_item, h_prefixes, ds_transform, fke_transform) => {
	// array
	if(Array.isArray(z_item)) {
		// zero-length, skip
		if(!z_item.length) return fke_transform();

		// first object is also array
		if(Array.isArray(z_item[0])) {
			const nl_subs = z_item.length;

			let c_resolves = 0;

			for(const z_sub of z_item) {
				interpret_item(z_sub, h_prefixes, ds_transform, () => {  // eslint-disable-line no-loop-func
					if(++c_resolves === nl_subs) {
						fke_transform();
					}
				});
			}

			// do not consume transform synchronously
			return;
		}
		// triple/quad
		else if(3 === z_item.length || 4 === z_item.length) {
			const a_terms = z_item.map(z => warp_term(z, h_prefixes));

			ds_transform.push(factory.quad(...a_terms));
		}
	}
	// string (trig)
	else if('string' === typeof z_item) {
		graphy.content.trig.read({
			input: {
				string: z_item,

				error(e_read) {
					warn(`The 'transform' command threw an Error while trying to read the returned TriG string: '${z_item}'\n\nThe reader reported: ${e_read.stack}`);

					// done
					fke_transform();
				},
			},

			data(g_quad_read) {
				ds_transform.push(g_quad_read);
			},

			eof() {
				// done
				fke_transform();
			},
		});

		// do not consume transform synchronously
		return;
	}
	// quad
	else if(z_item.subject && z_item.predicate && z_item.object) {
		ds_transform.push(factory.fromQuad(z_item));
	}
	// iterable
	else if(z_item[Symbol.iterator]) {
		for(const g_quad_it of z_item) {
			ds_transform.push(g_quad_it);
		}
	}
	// other
	else {
		exit(`The callback function supplied to the 'transform' command returned an invalid quad value: '${z_item}'`);
	}

	// done
	fke_transform();
};
157
/**
 * N-to-1 dataset reduction: loads each input into its own dataset tree, one
 * after another, and folds the trees together with the named operation.
 *
 * @param {object} g_argv - parsed arguments; `strict` disables canonicalization
 * @param {object[]} a_inputs - quad streams, piped sequentially into trees
 * @param {function} fe_command - error callback (not used by this function)
 * @param {string} s_operation - name of the tree method to apply pairwise,
 *   e.g. 'union'
 * @returns {Promise<object[]>} single-element array holding the resulting tree
 */
const dataset_N1QQ = async(g_argv, a_inputs, fe_command, s_operation) => {
	const b_canonicalize = !g_argv.strict;

	// create trees
	const a_trees = a_inputs.map(() => dataset_tree());

	// initial tree
	let k_tree_out = a_trees[0];

	// pairwise readiness
	for(let i_input=0, nl_inputs=a_inputs.length; i_input<nl_inputs; i_input++) {
		let k_tree_b = a_trees[i_input];

		// pipe input stream to tree b
		a_inputs[i_input].pipe(k_tree_b);

		// wait for input stream to finish writing to b
		await k_tree_b.until('finish');

		// canonicalize
		if(b_canonicalize) {
			k_tree_b = a_trees[i_input] = k_tree_b.canonicalize();

			// update out ref; the first tree is the accumulator's seed
			if(!i_input) k_tree_out = k_tree_b;
		}

		// non-first input
		if(i_input) {
			// perform pairwise operation
			k_tree_out = k_tree_out[s_operation](k_tree_b);
		}
	}

	// return readable tree
	return [k_tree_out];
};
195
/**
 * Shared implementation for the 2-to-1 dataset commands: loads both inputs
 * into their own trees concurrently and, once both have emitted 'finish',
 * applies the named operation to them.
 *
 * @param {object} g_argv - parsed arguments; `strict` disables canonicalization
 * @param {object[]} a_inputs - the two quad streams, `[a, b]`
 * @param {string} s_operation - name of the tree method, invoked as `a[op](b)`
 * @param {function(*): *} f_wrap - maps the operation's result to the output
 * @returns {Promise<Array>} single-element array holding the wrapped result
 */
const dataset_21 = (g_argv, a_inputs, s_operation, f_wrap) => new Promise((fk_resolve) => {
	const b_canonicalize = !g_argv.strict;

	// one tree per side, plus a flag per side recording that it finished
	const a_trees = [dataset_tree(), dataset_tree()];
	const a_finished = [false, false];

	a_trees.forEach((k_tree, i_side) => {
		k_tree.on('finish', () => {
			// canonicalize
			if(b_canonicalize) a_trees[i_side] = a_trees[i_side].canonicalize();

			// this side is finished now
			a_finished[i_side] = true;

			// other side is already finished
			if(a_finished[0] && a_finished[1]) {
				fk_resolve([f_wrap(a_trees[0][s_operation](a_trees[1]))]);
			}
		});
	});

	// ref both input streams
	const [ds_input_a, ds_input_b] = a_inputs;

	// pipe each to its tree
	ds_input_a.pipe(a_trees[0]);
	ds_input_b.pipe(a_trees[1]);
});

/**
 * 2-to-1 dataset command whose result is itself a dataset of quads.
 *
 * @param {object} g_argv - parsed arguments; `strict` disables canonicalization
 * @param {object[]} a_inputs - the two quad streams, `[a, b]`
 * @param {function} fe_command - error callback (not used by this function)
 * @param {string} s_operation - name of the tree method, invoked as `a[op](b)`
 * @returns {Promise<object[]>} single-element array holding the result tree
 */
const dataset_21QQ = (g_argv, a_inputs, fe_command, s_operation) => dataset_21(g_argv, a_inputs, s_operation, k_result => k_result);

/**
 * 2-to-1 dataset command whose result is a plain value; the value is wrapped
 * in an `AnswerSource` so it can be piped like any other output.
 *
 * @param {object} g_argv - parsed arguments; `strict` disables canonicalization
 * @param {object[]} a_inputs - the two quad streams, `[a, b]`
 * @param {function} fe_command - error callback (not used by this function)
 * @param {string} s_operation - name of the tree method, invoked as `a[op](b)`
 * @returns {Promise<object[]>} single-element array holding an `AnswerSource`
 */
const dataset_21QR = (g_argv, a_inputs, fe_command, s_operation) => dataset_21(g_argv, a_inputs, s_operation, w_result => new AnswerSource(w_result));
277
/**
 * Object-mode readable stream that yields exactly one value and then ends.
 * When piped to a destination that is not in object mode, the value is
 * emitted as a line of JSON instead of as the raw object.
 */
class AnswerSource extends require('stream').Readable {
	/**
	 * @param {*} w_datum - the single value this stream will emit
	 */
	constructor(w_datum) {
		super({
			objectMode: true,
		});

		this._w_datum = w_datum;
	}

	// intercept pipe
	pipe(ds_dst) {
		// string out
		if(!ds_dst._writableState.objectMode) {
			// change read mode; push as JSON (shadows the prototype's `_read`)
			this._read = () => {
				this.push(JSON.stringify(this._w_datum)+'\n', 'utf8');
				this.push(null);
			};
		}

		// forward to super
		return super.pipe(ds_dst);
	}

	// push object, then signal end-of-stream
	_read() {
		this.push(this._w_datum);
		this.push(null);
	}
}
308
/**
 * Wraps a stream's `pipe` so that max-listener warnings are not raised while
 * the pipe is being set up.
 *
 * The listener limits of both streams are lifted for the duration of the
 * original `pipe` call and restored afterwards through the public
 * `getMaxListeners`/`setMaxListeners` API, so an explicit limit of 0
 * (unlimited) is preserved. Any extra `pipe` arguments are forwarded.
 *
 * @param {object} ds_src - stream whose `pipe` is overridden in place
 * @returns {object} `ds_src`, for chaining
 */
function ignore_pipe_warnings(ds_src) {
	const f_pipe = ds_src.pipe;

	// override pipe
	ds_src.pipe = function pipe(ds_dst, ...a_args) {
		// pipe without warning because of worker threads
		const n_maxl_src = this.getMaxListeners();
		const n_maxl_dst = ds_dst.getMaxListeners();

		// set infinite max listeners
		this.setMaxListeners(Infinity);
		ds_dst.setMaxListeners(Infinity);

		try {
			// call pipe
			return f_pipe.call(this, ds_dst, ...a_args);
		}
		finally {
			// reset max listeners, even if pipe threw
			this.setMaxListeners(n_maxl_src);
			ds_dst.setMaxListeners(n_maxl_dst);
		}
	};

	// return self
	return ds_src;
}
336
// when false, `warn` drops the first stack frame and relabels the message
let b_show_stack_trace = false;

/**
 * Prints a warning to stderr via `console.warn`.
 *
 * The text is the `stack` of a freshly created Error. Unless
 * `b_show_stack_trace` is set, the first stack-frame line is removed and the
 * leading 'Error:' label becomes 'Warning:'.
 *
 * @param {string} s_message - warning text
 */
const warn = (s_message) => {
	let s_msg = (new Error(s_message)).stack;

	if(!b_show_stack_trace) {
		s_msg = s_msg.replace(/\n\s+at [^\n]*\n/, '\n')
			.replace(/^Error:/, 'Warning:');
	}

	console.warn(s_msg);
};
348
/**
 * Prints a message to stderr and terminates the process with exit code 1.
 *
 * @param {string} s_exit - message to print
 */
const exit = (s_exit) => {
	console.error(s_exit);
	process.exit(1);
};
353
354
// human-readable descriptions of each command's stream arity and in/out kinds
const S_TRANSFORM_TYPE_NNSQ = 'Transform Type:  N-to-N (map);  (...Strings) --> [...Quads]';
const S_TRANSFORM_TYPE_NNQS = 'Transform Type:  N-to-N (map);  (...Quads) --> [...Strings]';
const S_TRANSFORM_TYPE_NNQQ = 'Transform Type:  N-to-N (map);  (...Quads) --> [...Quads]';
const S_TRANSFORM_TYPE_NNQRB = 'Transform Type:  N-to-N (map);  (...Quads) --> [...ResultValues<Boolean>]';
const S_TRANSFORM_TYPE_NNQRN = 'Transform Type:  N-to-N (map);  (...Quads) --> [...ResultValues<Number>]';
const S_TRANSFORM_TYPE_21QQ = 'Transform Type:  2-to-1 (join);  (Quads, Quads) --> [Quads]';
const S_TRANSFORM_TYPE_N1QQ = 'Transform Type:  N-to-1 (reduce);  (...Quads) --> [Quads]';
const S_TRANSFORM_TYPE_N1AA = 'Transform Type:  N-to-1 (reduce);  (...Any) --> [Any]';
const S_TRANSFORM_TYPE_21QRB = 'Transform Type:  2-to-1 (join);  (Quads, Quads) --> [ResultValues<Boolean>]';
const S_TRANSFORM_TYPE_21QRN = 'Transform Type:  2-to-1 (join);  (Quads, Quads) --> [ResultValues<Number>]';

// category headings assigned to commands via their `category` property
const S_CATEGORY_IO = 'Input/Output Commands:';
const S_CATEGORY_DATA = 'Quad Manipulation Commands:';
const S_CATEGORY_STREAM = 'Stream Control Commands:';
const S_CATEGORY_SET = 'Dataset Commands:';
const S_CATEGORY_STATS = 'Statistics Commands:';

// caution appended to the description of every command that evals user code
const S_WARN_JAVASCRIPT = `WARNING: the '-j' / '--js' / '--javascript' option evals the given code. DO NOT allow user input into this option as it will grant them arbitrary code execution with whatever privileges the process is running under.`;
373
// options shared by the dataset (set operation) commands
const G_OPTIONS_DATASET = {
	strict: {
		type: 'boolean',
		describe: 'if true, forgoes canonicalization before the set operation',
	},
};
380
/**
 * Builds the per-format boolean flag options for a command.
 *
 * All flags are currently commented out, so this returns an empty object and
 * `f_verb` is not called.
 *
 * @param {function(string): string} f_verb - would produce the `describe`
 *   text for a given format name
 * @returns {object} option definitions to spread into a command's options
 */
const content_type_flags = f_verb => ({
	// nt: {
	// 	type: 'boolean',
	// 	alias: ['ntriples', 'n-triples'],
	// 	conflicts: ['ttl', 'nq', 'trig'],
	// 	describe: f_verb('N-Triples'),
	// },

	// nq: {
	// 	type: 'boolean',
	// 	alias: ['nquads', 'n-quads'],
	// 	conflicts: ['nt', 'ttl', 'trig'],
	// 	describe: f_verb('N-Quads'),
	// },

	// ttl: {
	// 	type: 'boolean',
	// 	alias: ['turtle'],
	// 	conflicts: ['nt', 'nq', 'trig'],
	// 	describe: f_verb(' Turtle'),
	// },

	// trig: {
	// 	type: 'boolean',
	// 	conflicts: ['nt', 'nq', 'ttl'],
	// 	describe: f_verb('TriG'),
	// },
});
409
410// commands
411let h_commands = {  // eslint-disable-next-line quote-props
/*
------ Input/Output --------
*/

read: {
type: S_TRANSFORM_TYPE_NNSQ,
category: S_CATEGORY_IO,
overview: 'Deserialize RDF content',
description: [
	'Read RDF content, i.e., deserialize it, from 1 or more inputs using a single thread',
],
options: {
	c: {
		type: 'string',
		alias: ['content-type'],
		default: 'trig',
		describe: 'either an RDF Content-Type or format selector',
		group: 'Content Selector Options:',
	},
	r: {
		type: 'boolean',
		alias: ['relax'],
		default: undefined,  // eslint-disable-line no-undefined
		describe: 'relax validation of tokens within the RDF document',
	},
	b: {
		type: 'string',
		alias: ['base', 'base-uri', 'base-iri'],
		describe: 'set a base URI on the document',
	},
442
	...content_type_flags(s => `read from ${s}`),
},
examples: [
	`read -c nt`,
	`read -c n-triples`,
	`read -c 'application/n-triples'`,
	`read -c ttl`,
	`read -c turtle`,
	`read -c 'text/turtle'`,
],
453
command(g_argv, a_inputs, fe_command) {
	// select reader
	let f_reader = graphy.content(g_argv['content-type']).read;
457
	let gc_read = {
		relax: g_argv.relax || false,
	};
461
	// 'base-uri' => 'baseUri'
	if(g_argv['base-uri']) {
		gc_read.baseUri = g_argv['base-uri'];
	}
466
	return map_streams(a_inputs, () => f_reader({
		...gc_read,
469
		error: e => fe_command(e),
	}));
},
},
474
scan: {
type: S_TRANSFORM_TYPE_NNSQ,
category: S_CATEGORY_IO,
overview: 'Deserialize RDF content using multiple threads',
description: [
	'Scan RDF content, i.e., deserialize it, from 1 or more inputs using multiple threads',
],
options: {
	c: {
		type: 'string',
		alias: ['content-type'],
		default: 'nt',
		describe: 'either an RDF Content-Type or format selector',
		group: 'Content Selector Options:',
	},
	r: {
		type: 'boolean',
		alias: ['relax'],
		default: undefined,  // eslint-disable-line no-undefined
		describe: 'relax validation of tokens within the RDF document',
		group: 'Read Options:',
	},
	// b: {
	// 	type: 'string',
	// 	alias: ['base', 'base-uri', 'base-iri'],
	// 	describe: 'set a base URI on the document',
	// },
	threads: {
		type: 'number',
		describe: 'manually set the total number of threads to use (including the main thread)',
		group: 'Scan Options:',
	},
507
	...content_type_flags(s => `scan from ${s}`),
},
examples: [
	`scan -c nt`,
	`scan -c n-triples`,
	`scan -c 'application/n-triples'`,
	`scan -c nq`,
	`scan -c nquads`,
	`scan -c 'application/n-quads'`,
],
518
command(g_argv, a_inputs, fe_command, a_rest) {
	// select scanner
	let f_scanner = graphy.content(g_argv['content-type']).scan;
522
	let gc_scan = {
		relax: g_argv.relax || false,
		threads: g_argv.threads || 0,
	};
527
	// next command
	let a_series = a_rest.shift();
	let si_next = a_series? a_series[0]: null;
531
	// command
	switch(si_next) {
		// count task
		case 'count': {
			return a_inputs.map(ds_input => new Promise((fk_resolve) => {
				ds_input.on('error', fe_command);
538
				f_scanner(ds_input, {
					...gc_scan,
541
					preset: 'count',
543
					error: fe_command,
545
					report(c_quads) {
						fk_resolve(ignore_pipe_warnings(new AnswerSource(c_quads)));
					},
				});
			}));
		}
552
		// scribe / ndjson
		case 'scribe':
		case null: {
			return a_inputs.map((ds_input) => {
				ds_input.on('error', fe_command);
558
				let ds_output = ignore_pipe_warnings(new stream.PassThrough());
560
				f_scanner(ds_input, {
					...gc_scan,
563
					preset: si_next || 'ndjson',
565
					error: fe_command,
567
					update(z_scribe, i_worker) {
						ds_output.write(i_worker? Buffer.from(z_scribe).toString(): z_scribe);
					},
571
					report() {
						ds_output.end();
					},
				});
576
				return ds_output;
			});
		}
580
		// other
		default: {
			fe_command(`The 'scan' command only supports a limited set of commands to follow it; '${si_next}' is not supported`);
		}
	}
},
},
588
scribe: {
type: S_TRANSFORM_TYPE_NNQS,
category: S_CATEGORY_IO,
overview: 'Serialize RDF content fast',
description: [
	'Scribe RDF content, i.e., serialize it, fast (and possibly ugly) using the given content-type.',
],
options: {
	c: {
		type: 'string',
		alias: ['content-type'],
		default: 'trig',
		describe: 'either an RDF Content-Type or format selector',
		group: 'Content Selector Options:',
	},
604
	...content_type_flags(s => `scribe to ${s}`),
},
examples: [
	`scribe -c nt`,
	`scribe -c n-triples`,
	`scribe -c 'application/n-triples'`,
	`scribe -c ttl`,
	`scribe -c turtle`,
	`scribe -c 'text/turtle'`,
	`scribe -c xml`,
],
616
command(g_argv, a_inputs, fe_command) {
	// select scriber
	let f_scriber = graphy.content(g_argv['content-type']).scribe;
620
	// map input(s) to writer(s)
	return a_inputs.map(ds_input => ds_input.pipe(f_scriber({
		error: e => fe_command(e),
	})));
},
},
627
write: {
type: S_TRANSFORM_TYPE_NNQS,
category: S_CATEGORY_IO,
overview: 'Serialize RDF content in style (pretty-printing)',
description: [
	'Write RDF content, i.e., serialize it, in style (pretty-print) using the given content-type.',
],
options() {
	let s_group_style = 'Style Options:';
	let s_group_list = 'List Structure Options:';
638
	return {
		c: {
			type: 'string',
			alias: ['content-type'],
			describe: `either an RDF Content-Type or format selector (defaults to 'trig')`,
			group: 'Content Selector Options:',
		},
		i: {
			type: 'string',
			alias: ['indent'],
			// default: '\\t',  // eslint-disable-line no-undefined
			describe: `sets the whitespace string to use for indentation. Writers use '\\t' by default`,
			group: s_group_style,
		},
		g: {
			// type: 'string',
			alias: ['graph-keyword'],
			describe: `sets the style to use when serializing the optional 'GRAPH' keyword in TriG. Writers omit this keyword by default.
				Passing 'true' or empty with this flag on is shorthand for the all-caps 'GRAPH' keyword`.replace(/\n\s*/g, ' '),
			group: s_group_style,
		},
		s: {
			type: 'boolean',
			alias: ['simplify-default-graph'],
			describe: 'if enabled, omits serializing the surrounding optional graph block for the default graph in TriG.',
			group: s_group_style,
		},
		f: {
			type: 'string',
			alias: ['first'],
			describe: `c1 string: sets the predicate to use for the 'first' relation when serializing list structures`,
			group: s_group_list,
		},
		r: {
			type: 'string',
			alias: ['rest'],
			describe: `c1 string: sets the predicate to use for the 'rest' relation when serializing list structures`,
			group: s_group_list,
		},
		n: {
			type: 'string',
			alias: ['nil'],
			describe: `c1 string: sets the predicate to use for the 'nil' relation when serializing list structures`,
			group: s_group_list,
		},
684
		...content_type_flags(s => `write to ${s}`),
	};
},
examples: [
	`write -c nt`,
	`write -c n-triples`,
	`write -c 'application/n-triples'`,
	`write -c ttl`,
	`write -c turtle`,
	`write -c 'text/turtle'`,
],
696
command(g_argv, a_inputs, fe_command) {
	// default write config
	let gc_write = {};
700
	// extend style options
	let g_style = gc_write.style || {};
703
	// content-type selector
	let s_selector = g_argv['content-type'];
706
	// no selector specified
	if(!s_selector) {
		// default to trig
		s_selector = 'trig';
711
		// set simplify default graph so that it might also turtle-compatible
		g_style.simplify_default_graph = true;
	}
715
	// select writer
	let f_writer = graphy.content(s_selector).write;
718
	// style options
	{
		// indent
		if(g_argv.indent) g_style.indent = g_argv.indent;
723
		// graph keyword
		if(g_argv['graph-keyword']) {
			let z_graph_keyword = g_argv['graph-keyword'];
			if('boolean' === typeof z_graph_keyword) {
				g_style.graph_keyword = z_graph_keyword;
			}
			else if(/^true$/i.test(z_graph_keyword)) {
				g_style.graph_keyword = true;
			}
			else if(/^false$/i.test(z_graph_keyword)) {
				g_style.graph_keyword = false;
			}
			else if(/^graph$/i.test(z_graph_keyword)) {
				g_style.graph_keyword = z_graph_keyword;
			}
			else {
				return fe_command(`The 'write' command reported an invalid value given to the 'graph-keyword' option: '${z_graph_keyword}'`);
			}
		}
743
		// simplify default graph
		if(g_argv['simplify-default-graph']) g_style.simplify_default_graph = g_argv['simplify-default-graph'];
	}
747
	// extend list options
	let g_lists = gc_write.lists || {};
	{
		// first
		if(g_argv.first) g_lists.first = g_argv.first;
753
		// rest
		if(g_argv.rest) g_lists.rest = g_argv.rest;
756
		// nil
		if(g_argv.nil) g_lists.nil = g_argv.nil;
	}
760
	// map input(s) to writer(s)
	return a_inputs.map(ds_input => ds_input.pipe(f_writer({
		...gc_write,
764
		style: g_style,
766
		lists: g_lists,
768
		error: e => fe_command(e),
	})));
},
},

/*
------ Quad-Level --------
*/

skip: {
type: S_TRANSFORM_TYPE_NNQQ,
category: S_CATEGORY_DATA,
overview: 'Skip over some amount of quads in the stream(s)',
description: [
	'Skip over some amount of data (quads by default) for each input stream before piping the remainder as usual.',
],
syntax: '[size=1]',
positionals: {
	size: {
		type: 'number',
		describe: 'the number of things to skip',
	},
},
options: {
	q: {
		type: 'boolean',
		alias: ['quads', 't', 'triples'],
		describe: 'skip the given number of quads',
		conflicts: ['s'],
	},
799
	s: {
		type: 'boolean',
		alias: ['subjects'],
		describe: 'skip quads until the given number of distinct subjects have been encountered',
		conflicts: ['q'],
	},
806
	// m: {
	// 	type: 'number',
	// 	alias: ['multiply'],
	// },
811
	// d: {
	// 	type: 'number',
	// 	alias: ['divisions'],
	// 	describe: 'rather than counting numbers, use equal divisions of the given size',
	// 	example: gobble(`
	// 		Skip the first third of data:  skip -d 3
	// 	`),
	// },
820
	// r: {
	// 	type: 'number',
	// 	alias: ['ratio'],
	// 	describe: 'rather than counting numbers, use equal divisions of the given size',
	// 	example: gobble(`
	// 		Skip the first twothird of data:  skip -r '2/3'
	// 	`),
	// },
},
830
command(g_argv, a_inputs, fe_command) {
	// size argument
	let [
		n_skip=1,
	] = g_argv._;
836
	// count subjects
	if(g_argv.subjects) {
		return map_streams(a_inputs, () => {
			let c_subjects = 0;
			let kt_prev = null;
842
			return new stream.Transform.QuadsToOther({
				error: e => fe_command(e),
845
				transform(g_quad, s_encoding, fke_transform) {
					// reached length
					if(!g_quad.subject.equals(kt_prev) && ++c_subjects > n_skip) {
						// start pushing
						this.push(g_quad);
					}
852
					// save subject
					kt_prev = g_quad.subject;
855
					// done
					fke_transform();
				},
			});
		});
	}
	// count quads
	else {
		return map_streams(a_inputs, () => {
			let c_quads = 0;
866
			return new stream.Transform.QuadsToOther({
				error: e => fe_command(e),
869
				transform(g_quad, s_encoding, fke_transform) {
					// reached length
					if(++c_quads > n_skip) {
						// start pushing
						this.push(g_quad);
					}
876
					// done
					fke_transform();
				},
			});
		});
	}
},
},
885
head: {
type: S_TRANSFORM_TYPE_NNQQ,
category: S_CATEGORY_DATA,
overview: 'Limit number of quads from top of stream(s)',
description: [
	'Limit the number of quads that pass through by counting from the top of the stream.',
],
syntax: '[size=1]',
positionals: {
	size: {
		type: 'number',
		describe: 'the number of things to emit',
	},
},
options: {
	q: {
		type: 'boolean',
		alias: ['quads', 't', 'triples'],
		describe: 'emit only the given number of quads from the top of a stream',
		conflicts: ['s'],
	},
907
	s: {
		type: 'boolean',
		alias: ['subjects'],
		describe: 'emit quads until the given number of distinct subjects have been encountered from the top of a stream',
		conflicts: ['q'],
	},
},
915
command(g_argv, a_inputs, fe_command) {
	// size argument
	let [
		n_head=1,
	] = g_argv._;
921
	// count subjects
	if(g_argv.subjects) {
		return map_streams(a_inputs, (ds_input) => {
			let c_subjects = 0;
			let kt_prev = null;
927
			return new stream.Transform.QuadsToOther({
				error: e => fe_command(e),
930
				transform(g_quad, s_encoding, fke_transform) {
					// under limit
					if(g_quad.subject.equals(kt_prev) || ++c_subjects <= n_head) {
						this.push(g_quad);
					}
					// hit limit
					else {
						// push eof
						this.push(null);
940
						// destroy source
						ds_input.destroy();
					}
944
					// save subject
					kt_prev = g_quad.subject;
947
					// done
					fke_transform();
				},
			});
		});
	}
	// count quads
	else {
		return map_streams(a_inputs, (ds_input) => {
			let c_quads = 0;
958
			return new stream.Transform.QuadsToOther({
				error: e => fe_command(e),
961
				transform(g_quad, s_encoding, fke_transform) {
					// under limit
					if(++c_quads <= n_head) {
						this.push(g_quad);
					}
					// hit limit
					else {
						// push eof
						this.push(null);
971
						// destroy source
						ds_input.destroy();
					}
975
					// done
					fke_transform();
				},
			});
		});
	}
},
},
984
tail: {
type: S_TRANSFORM_TYPE_NNQQ,
category: S_CATEGORY_DATA,
overview: 'Limit number of quads from bottom of stream(s)',
description: [
	'Limit the number of quads that pass through by counting from the bottom of the stream.',
	'WARNING: quads must be buffered in memory until the end of the stream is reached. Specifying a large number of quads or subjects might therefore incur lots of memory.',
],
syntax: '[size=1]',
positionals: {
	size: {
		type: 'number',
		describe: 'the number of things to emit',
	},
},
options: {
	q: {
		type: 'boolean',
		alias: ['quads', 't', 'triples'],
		describe: 'emit only the given number of quads from the bottom of a stream',
		conflicts: ['s'],
	},
1007
	s: {
		type: 'boolean',
		alias: ['subjects'],
		describe: 'emit quads contained by the given number of distinct subjects from the bottom of a stream',
		conflicts: ['q'],
	},
},
1015
command(g_argv, a_inputs, fe_command) {
	// size argument
	let [
		n_tail=1,
	] = g_argv._;
1021
	// count subjects
	if(g_argv.subjects) {
		return map_streams(a_inputs, () => {
			let c_subjects = 0;
			let kt_prev = null;
			let a_batch = null;
			let a_fifo = [];
1029
			return new stream.Transform.QuadsToOther({
				error: e => fe_command(e),
1032
				transform(g_quad, s_encoding, fke_transform) {
					// different subject
					if(!g_quad.subject.equals(kt_prev)) {
						// reset batch
						a_batch = [];
1038
						// push batch to fifo
						a_fifo.push(a_batch);
1041
						// hit limit
						if(++c_subjects > n_tail) {
							a_fifo.shift();
						}
					}
1047
					// save subject
					kt_prev = g_quad.subject;
1050
					// add quad to batch
					a_batch.push(g_quad);
1053
					// done
					fke_transform();
				},
1057
				flush(fk_flush) {
					// push queue
					for(let a_quads of a_fifo) {
						for(let g_quad of a_quads) {
							this.push(g_quad);
						}
					}
1065
					// free to GC
					a_fifo.length = 0;
					a_batch.length = 0;
1069
					// done
					fk_flush();
				},
			});
		});
	}
	// count quads
	else {
		return map_streams(a_inputs, () => {
			let c_quads = 0;
			let a_fifo = [];
1081
			return new stream.Transform.QuadsToOther({
				error: e => fe_command(e),
1084
				transform(g_quad, s_encoding, fke_transform) {
					// under limit
					if(++c_quads <= n_tail) {
						a_fifo.push(g_quad);
					}
					// hit limit
					else {
						// shift off bottom
						a_fifo.shift();
1094
						// push to top
						a_fifo.push(g_quad);
					}
1098
					// done
					fke_transform();
				},
1102
				flush(fk_flush) {
					// push queue
					for(let g_quad of a_fifo) {
						this.push(g_quad);
					}
1108
					// free to GC
					a_fifo.length = 0;
1111
					// done
					fk_flush();
				},
			});
		});
	}
},
},
1120
filter: {
type: S_TRANSFORM_TYPE_NNQQ,
category: S_CATEGORY_DATA,
overview: 'Filter quads in the stream(s) via expression',
description: [
	'Filter quads by using either a Quad Filter Expression or a bit of JavaScript.',
	'For documentation on the Quad Filter Expression syntax, see:  https://graphy.link/quad-filter-expressions',
	S_WARN_JAVASCRIPT,
],
options: {
	x: {
		type: 'string',
		alias: ['expression'],
		describe: 'filter quads using the given quad filter expression',
		conflicts: ['j'],
	},
1137
	j: {
		type: 'string',
		alias: ['js', 'javascript'],
		describe: 'filter quads using the given JavaScript expression which will be evaluated as a callback function passed the quad and current prefix map as arguments',
		conflicts: ['x'],
	},
1144
	v: {
		type: 'boolean',
		alias: ['verbose'],
		describe: 'prints the compiled quad filter expression to stderr',
	},
},
1151
examples: [
	[
		`Filter quads equivalent to the triple pattern: '?s rdf:type dbo:Plant'`,
		`filter -x '; a; dbo:Plant'`,
	],
	[
		`Filter quads equivalent to the SPARQL fragment: 'dbr:Banana ?p ?o. filter(!isLiteral(?o))'`,
		`filter -x 'dbr:Banana;; !{literal}'`,
	],
	[
		`Filter quads equivalent to the SPARQL fragment: '?s ?p ?o. filter(?o > 10e3)]`,
		`filter --js 'g => g.object.number > 10e3'`,
	],
	[
		`Filter quads equivalent to the SPARQL fragment: '?s ?p ?o. filter(strStarts(str(?s), str(?o)))'`,
		`filter --js 'g => g.object.value.startsWith(g.subject.value)'`,
	],
	// [
	// 	`Filter quads equivalent to the SPARQL fragment: '?s ?p ?o. filter(strStarts(str(?s), str(?o)))'`,
	// 	`filter --js '(g, h) => g.subject.concise(h).startsWith("db")'`,
	// ],
],
1174
command(g_argv, a_inputs, fe_command) {
	// quad filter expression
	if(g_argv.expression) {
		let g_parse = parse_filter(g_argv.expression);
1179
		let sj_eval = expression_handler.prepare(g_parse);
1181
		if(g_argv.verbose) {
			console.warn(`The compiled quad filter expression from 'transform' command: () => {\n${sj_eval.replace(/^|\n/g, '\n\t')}\n}\n`);
		}
1185
		let f_filter = new Function('factory', 'stream', sj_eval);  // eslint-disable-line no-new-func
1187
		return map_streams(a_inputs, () => f_filter(factory, stream));
	}
	// javascript expression
	else if(g_argv.javascript) {
		let f_build = new Function('factory', /* syntax: js */ `return (${g_argv.javascript}) || null;`);  // eslint-disable-line no-new-func
1193
		let f_filter = f_build(factory);
1195
		// filter exists
		if(f_filter) {
			// invalid type
			if('function' !== typeof f_filter) {
				exit(`The 'filter' command expects -j/--javascript expression to evaluate to a function, instead found '${typeof f_filter}'`);
			}
1202
			return map_streams(a_inputs, () => {
				let h_prefixes = {};
1205
				return new stream.Transform.QuadsToOther({
					error: e => fe_command(e),
1208
					prefix(si_prefix, p_iri) {
						h_prefixes[si_prefix] = p_iri;
					},
1212
					transform(g_quad, s_encoding, fke_transform) {
						if(f_filter(g_quad, h_prefixes)) {
							return fke_transform(null, g_quad);
						}
1217
						fke_transform();
					},
				});
			});
		}
	}
1224
	// neither used (bypass filter)
	warn(`The 'filter' command was not used and is being ignored.`);
	return bypass(a_inputs);
},
},
1230
// transform
transform: {
type: S_TRANSFORM_TYPE_NNQQ,
category: S_CATEGORY_DATA,
overview: 'Apply a custom transform function to each quad in the stream(s)',
description: [
	'$1',
	S_WARN_JAVASCRIPT,
],
options: {
	j: {
		type: 'string',
		alias: ['js', 'javascript'],
		describe: 'transform quads using the given JavaScript expression which will be evaluated as a callback function passed the quad and current prefix map as arguments',
		demandOption: true,
		example: [
			`transform -j 'g => [g.object, g.predicate, g.subject]'`,
			`transform -j 'g => ({
				[factory.blankNode()]: {
					a: 'rdf:Statement',
					'rdf:subject': g.subject,
					'rdf:predicate': g.predicate,
					'rdf:object': g.object,
				},
			})'`,
		].join('\n'),
	},
},
1259
command(g_argv, a_inputs, fe_command) {
	// javascript expression
	if(g_argv.javascript) {
		let f_build = new Function('factory', 'c3', 'c4', /* syntax: js */ `return (${g_argv.javascript}) || null;`);  // eslint-disable-line no-new-func
1264
		let f_transform = f_build(factory, factory.c3, factory.c4);
1266
		// transform exists
		if(f_transform) {
			// invalid type
			if('function' !== typeof f_transform) {
				exit(`The 'filter' command expects -j/--javascript expression to evaluate to a function, instead found '${typeof f_filter}'`);
			}
1273
			return map_streams(a_inputs, () => {
				let h_prefixes = {};
1276
				return new stream.Transform.QuadsToOther({
					error: e => fe_command(e),
1279
					prefix(si_prefix, p_iri) {
						h_prefixes[si_prefix] = p_iri;
					},
1283
					transform(g_quad, s_encoding, fke_transform) {
						// alias quad property access
						g_quad.s = g_quad.subject;
						g_quad.p = g_quad.predicate;
						g_quad.o = g_quad.object;
						g_quad.g = g_quad.graph;
1290
						// try to apply transform callback
						let z_item;
						try {
							z_item = f_transform(g_quad, h_prefixes);
						}
						catch(e_transform) {
							warn(`The 'transform' command threw an Error while applying the given callback function:\n${e_transform.stack}`);
							return fke_transform();
						}
1300
						// item was returned
						if(z_item) {
							return interpret_item(z_item, h_prefixes, this, fke_transform);
						}
1305
						// done
						fke_transform();
					},
				});
			});
		}
	}
1313
	// nothing used (bypass filter)
	warn(`The 'transform' command was not used and is being ignored.`);
	return bypass(a_inputs);
},
},

/*
------ Stream Control --------
*/

concat: {
type: S_TRANSFORM_TYPE_N1AA,
category: S_CATEGORY_STREAM,
overview: 'Join stream data in order via concatentation',
description: [
	'Concatenate quads from all input streams in order.',
],
options: {},
1332
command(g_argv, a_inputs, fe_command) {
	let nl_inputs = a_inputs.length;
1335
	// single input, bypass passthrough
	if(1 === nl_inputs) return a_inputs;
1338
	// input index
	let i_input = 0;
1341
	// single output stream
	let ds_out = new stream.PassThrough();
1344
	// stream consumer
	let f_next = () => {
		// done consuming inputs; end output stream
		if(i_input >= nl_inputs) return ds_out.end();
1349
		// next input
		let ds_input = a_inputs[i_input++];
1352
		// once it ends; consume next input
		ds_input.on('end', f_next);
1355
		// catch stream errors
		ds_input.on('error', fe_command);
1358
		// pipe to passthrough
		ds_input.pipe(ds_out, {end:false});
	};
1362
	// start concatenating
	f_next();
1365
	// return stream
	return [ds_out];
1368
	// return [new stream.Readable({
	// 	objectMode: true,
1371
	// 	read() {
	// 		// while there are inputs
	// 		for(; i_input<nl_inputs; i_input++) {
	// 			// ref input
1376// 			let ds_input = a_inputs[i_input];
1377
	// 			// read chunk from input and push to output
	// 			let w_chunk;
	// 			while((w_chunk = ds_input.read()) && this.push(w_chunk)) {
	// 				; // eslint-disable-line no-empty
1382// 			}
1383
	// 			// input not fully consumed; try again next read
	// 			if(!w_chunk.readableEnded) break;
	// 		}
	// 	},
// })];
},
},
1391
merge: {
type: S_TRANSFORM_TYPE_N1AA,
category: S_CATEGORY_STREAM,
overview: `Join stream data on a 'first come, first serve' basis`,
description: [
	'Merge quads from all input streams without order.',
],
options: {},
1400
command(g_argv, a_inputs, fe_command) {
	let nl_inputs = a_inputs.length;
1403
	// single input, bypass passthrough
	if(1 === nl_inputs) return a_inputs;
1406
	// input index
	let i_input = 0;
1409
	// single output stream
	let ds_out = new stream.PassThrough();
1412
	// stream consumer
	let f_next = () => {
		// done consuming inputs; end output stream
		if(i_input >= nl_inputs) return ds_out.end();
1417
		// next input
		let ds_input = a_inputs[i_input++];
1420
		// once it ends; consume next input
		ds_input.on('end', f_next);
1423
		// catch stream errors
		ds_input.on('error', fe_command);
1426
		// pipe to passthrough
		ds_input.pipe(ds_out, {end:false});
	};
1430
	// start concatenating
	f_next();
1433
	// return stream
	return [ds_out];
},
},
1438
/*
------ Dataset --------
*/
1442
tree: {
type: S_TRANSFORM_TYPE_NNQQ,
category: S_CATEGORY_SET,
overview: 'Put all quads into a tree data structure to remove duplicates',
description: [
	'$1',
],
options: {},
1451
command(g_argv, a_inputs, fe_command) {
	return a_inputs.map(ds_input => ds_input.pipe(dataset_tree()));
},
},
1456
canonical: {
alias: 'canonicalize',
type: S_TRANSFORM_TYPE_NNQQ,
category: S_CATEGORY_SET,
overview: 'Canonicalize a set of quads using RDF Dataset Normalization Algorithm (URDNA2015)',
description: [
	'$1',
],
options: {},
1466
command(g_argv, a_inputs, fe_command) {
	return a_inputs.map(ds_input => ds_input.pipe(dataset_tree({canonicalize:true})));
},
},
1471
union: {
type: S_TRANSFORM_TYPE_N1QQ,
category: S_CATEGORY_SET,
overview: 'Compute the set union of 1 or more inputs',
description: [
	'$1',
],
options: {
	...G_OPTIONS_DATASET,
},
1482
command(g_argv, a_inputs, fe_command) {
	return dataset_N1QQ(g_argv, a_inputs, fe_command, 'union');
},
},
1487
intersect: {
alias: 'intersection',
type: S_TRANSFORM_TYPE_N1QQ,
category: S_CATEGORY_SET,
overview: 'Compute the set intersection of 1 or more inputs',
description: [
	'$1',
],
options: {
	...G_OPTIONS_DATASET,
},
1499
command(g_argv, a_inputs, fe_command) {
	return dataset_N1QQ(g_argv, a_inputs, fe_command, 'intersection');
},
},
1504
diff: {
alias: 'difference',
type: S_TRANSFORM_TYPE_21QQ,
category: S_CATEGORY_SET,
overview: 'Compute the set difference between 2 inputs',
description: [
	'$1',
],
options: {
	...G_OPTIONS_DATASET,
},
1516
command(g_argv, a_inputs, fe_command) {
	return dataset_21QQ(g_argv, a_inputs, fe_command, 'difference');
},
},
1521
minus: {
alias: ['subtract', 'subtraction'],
type: S_TRANSFORM_TYPE_21QQ,
category: S_CATEGORY_SET,
overview: 'Subtract the second input from the first: A - B',
description: [
	'$1',
],
options: {
	...G_OPTIONS_DATASET,
},
1533
command(g_argv, a_inputs, fe_command) {
	return dataset_21QQ(g_argv, a_inputs, fe_command, 'minus');
},
},
1538
equals: {
alias: 'equal',
type: S_TRANSFORM_TYPE_21QRB,
category: S_CATEGORY_SET,
overview: 'Test if 2 inputs are equivalent',
description: [
	'$1',
],
options: {
	...G_OPTIONS_DATASET,
},
1550
command(g_argv, a_inputs, fe_command) {
	return dataset_21QR(g_argv, a_inputs, fe_command, 'equals');
},
},
1555
disjoint: {
type: S_TRANSFORM_TYPE_21QRB,
category: S_CATEGORY_SET,
overview: 'Test if 2 inputs are completely disjoint from one another',
description: [
	'$1',
],
options: {
	...G_OPTIONS_DATASET,
},
1566
command(g_argv, a_inputs, fe_command) {
	return dataset_21QR(g_argv, a_inputs, fe_command, 'disjoint');
},
},
1571
contains: {
alias: 'contain',
type: S_TRANSFORM_TYPE_21QRB,
category: S_CATEGORY_SET,
overview: 'Test if the first input completely contains the second',
description: [
	'$1',
],
options: {
	...G_OPTIONS_DATASET,
},
1583
command(g_argv, a_inputs, fe_command) {
	return dataset_21QR(g_argv, a_inputs, fe_command, 'contains');
},
},
1588
1589
/*
------ Statistics --------
*/
1593
count: {
type: S_TRANSFORM_TYPE_NNQRN,
category: S_CATEGORY_STATS,
overview: 'Count the number of events',
description: [
	'Count the number of events in each steam',
],
1601
command(g_argv, a_inputs, fe_command) {
	return a_inputs.map(ds_input => new Promise((fk_resolve) => {
		let c_items = 0;
1605
		ds_input.on('data', () => {
			c_items += 1;
		});
1609
		ds_input.on('error', fe_command);
1611
		ds_input.on('end', () => {
			fk_resolve(new AnswerSource(c_items));
		});
	}));
},
},
1618
distinct: {
type: S_TRANSFORM_TYPE_NNQRN,
category: S_CATEGORY_STATS,
overview: 'Count the number of distinct things',
description: [
	'Count the number of distinct things, such as quads, triples, subjects, etc.',
],
options() {
	let h_options = {
		q: {
			alias: ['quads'],
			type: 'boolean',
			describe: 'count the number of distinct quads',
		},
		t: {
			alias: ['triples'],
			type: 'boolean',
			describe: 'count the number of distinct triples by ignoring the graph component',
		},
		s: {
			alias: ['subjects'],
			type: 'boolean',
			describe: 'count the number of distinct subjects',
		},
		p: {
			alias: ['predicates'],
			type: 'boolean',
			describe: 'count the number of distinct predicates',
		},
		o: {
			alias: ['objects'],
			type: 'boolean',
			describe: 'count the number of distinct objects',
		},
		g: {
			alias: ['graphs'],
			type: 'boolean',
			describe: 'count the number of distinct graphs',
		},
		// l: {
		// 	alias: ['literals'],
		// 	type: 'boolean',
		// 	describe: 'count the number of distinct literals',
	// },
	};
1664
	let a_others = Object.keys(h_options);
	for(let [si_option, g_option] of Object.entries(h_options)) {
		let as_conflicts = new Set(a_others);
		as_conflicts.delete(si_option);
		g_option.conflicts = [...as_conflicts];
	}
1671
	return h_options;
},
1674
command(g_argv, a_inputs, fe_command) {
	// quad component
	let s_component = null;
	{
		if(g_argv.subjects) s_component = 'subject';
		if(g_argv.predicates) s_component = 'predicate';
		if(g_argv.objects) s_component = 'object';
		if(g_argv.graphs) s_component = 'graph';
	}
1684
	// distinct number of a certain component
	if(s_component) {
		return a_inputs.map(ds_input => new Promise((fk_resolve) => {
			// term set
			let as_terms = new Set();
1690
			// simply count
			ds_input.on('data', (g_quad) => {
				// concise term
				let sc1_term = g_quad[s_component].concise();
1695
				// add to set
				as_terms.add(sc1_term);
			});
1699
			// error handling
			ds_input.on('error', fe_command);
1702
			// once it ends
			ds_input.on('end', () => {
				fk_resolve(new AnswerSource(as_terms.size));
			});
		}));
	}
	// distinct number of triples
	else if(g_argv.triples) {
		return a_inputs.map(async(ds_input) => {
			// remove graph component
			let ds_explode = new stream.Transform.QuadsToOther({
				transform(g_quad, s_encoding, fke_transform) {
					// push quad
					this.push(factory.quad(g_quad.subject, g_quad.predicate, g_quad.object));
1717
					// done
					fke_transform();
				},
			});
1722
			// create dataset
			let k_dataset = dataset_tree();
1725
			// create pipeline
			ds_input.pipe(ds_explode)
				.pipe(k_dataset);
1729
			// await dataset finish
			await k_dataset.until('finish');
1732
			// return size
			return new AnswerSource(k_dataset.size);
		});
	}
	// distinct number of quads
	else {
		return a_inputs.map(async(ds_input) => {
			let k_dataset = dataset_tree();
1741
			ds_input.pipe(k_dataset);
1743
			await k_dataset.until('finish');
1745
			return new AnswerSource(k_dataset.size);
		});
	}
},
},
1751
// boilerplate: {
// 	type: S_TRANSFORM_TYPE_N1QQ,
// 	overview: '',
// 	description: [
// 		'Some decsription',
// 	],
1758// 	options: {},
1759
// 	command(g_argv, a_inputs, fe_command) {
// 		return map_streams(a_inputs, () => new Transform({
// 			error: e => fe_command(e),
// 		}));
// 	},
// },
1766
1767};
1768
// lookup from each alias to the name of the command it stands for
let h_aliases = {};

// length of the longest command name; pads the overview column
let n_width_column = Math.max(0, ...Object.keys(h_commands).map(s => s.length));

// group commands by category, collecting one overview line per command
let h_categories = {};
for(let si_command of Object.keys(h_commands)) {
	let g_command = h_commands[si_command];
	let s_category = g_command.category;

	// first command seen for this category creates its bucket
	if(!h_categories[s_category]) {
		h_categories[s_category] = {
			commands: [],
			overview: [],
		};
	}

	let g_category = h_categories[s_category];
	g_category.commands.push(g_command);

	// normalize `alias` (absent, a string, or an array) into an `aliases` array
	let z_aliases = g_command.alias;
	let a_aliases = [];
	let s_aliases = '';
	if(z_aliases) {
		if(Array.isArray(z_aliases)) {
			a_aliases = z_aliases;
			s_aliases = ` [aliases: ${z_aliases.join(', ')}]`;
		}
		else {
			a_aliases = [z_aliases];
			s_aliases = ` [alias: ${z_aliases}]`;
		}

		// register every alias
		for(let s_alias of a_aliases) {
			h_aliases[s_alias] = si_command;
		}
	}

	g_command.aliases = a_aliases;

	g_category.overview.push(`  ${si_command.padEnd(n_width_column, ' ')}  ${g_command.overview}${s_aliases}`);
}
1814
// terminal width used to wrap help output; never narrower than 80 columns
let n_width_terminal = Math.max(80, yargs.terminalWidth()-10);

// command-line args, without the first two entries of process.argv
let a_argv = process.argv.slice(2);
let n_args = a_argv.length;

// no arguments
if(!n_args) {
	exit('no arguments given');
}

// explicit input streams; filled only when --inputs is given
let a_inputs = [];

// pipeline: one array of args (a "series") per command
let a_pipeline = [];
{
	// args collected for the command currently being read
	let a_series = [];

	for(let i_argv=0; i_argv<n_args; i_argv++) {
		let s_arg = a_argv[i_argv];

		// after first arg
		if(i_argv) {
			// internal pipe
			if('--pipe' === s_arg) {
				a_pipeline.push(a_series);

				// a separator in last position has no command after it
				if(i_argv === n_args-1) {
					exit(`was expecting pipe destination after --pipe: ${a_argv}`);
				}

				a_series = [];
				continue;
			}
			// shorthand internal pipe
			else if('/' === s_arg) {
				a_pipeline.push(a_series);

				// a separator in last position has no command after it
				if(i_argv === n_args-1) {
					exit(`was expecting pipe destination after internal pipe character '/': ${a_argv}`);
				}

				a_series = [];
				continue;
			}
			// inputs follow
			else if('--inputs' === s_arg) {
				// every remaining arg is a file path; convert to readable streams
				a_inputs.push(...a_argv.slice(i_argv+1).map(p => fs.createReadStream(p)));
				break;
			}
		}
		// first arg, main option
		else if('-h' === s_arg || '--help' === s_arg || 'help' === s_arg) {
			// command overview
			let s_overview = '';
			for(let [s_category, g_category] of Object.entries(h_categories)) {
				s_overview += `${s_category}\n${g_category.overview.join('\n')}\n\n`;
			}

			// eslint-disable-next-line no-console
			console.log(`\nUsage:  graphy [OPTIONS] COMMAND [ / COMMAND]* [--inputs FILES...]\n\n`
				+`Tip: Use the internal pipe operator ' / ' to string together a series of commands.\n\n`
				+s_overview
				+gobble(`
					Graphy Commands:
					  examples        Alias for '--examples'
					  help            Alias for '--help'
					  version         Alias for '--version'

					Options:
					  -e, --examples  Print some examples and exit
					  -h, --help      Print this help message and exit
					  -v, --version   Print the version info and exit

					More Options:
					  --show-stack-trace  Show the stack trace when printing error messages
				`)+'\n\n'
				+`\nRun 'graphy COMMAND --help' for more information on a command.\n`
				+`\nRun 'graphy --examples' to see some examples.\n`,
			);

			process.exit(0);
		}
		// version
		else if('-v' === s_arg || '--version' === s_arg || 'version' === s_arg) {
			// eslint-disable-next-line no-console
			console.log(require(path.join(__dirname, './package.json')).version);

			process.exit(0);
		}
		// examples
		else if('-e' === s_arg || '--examples' === s_arg || 'examples' === s_arg) {
			console.log(gobble(`
				Examples:
				  1) Count the number of distinct triples in a Turtle file:

				     graphy read -c ttl / distinct --triples   < input.ttl

				  2) Count the distinct number of subjects that are of type dbo:Place in an N-Quads file:

				     graphy read -c nq / filter -x '; a; dbo:Place' / distinct --subjects   < input.nq

				  3) Compute the difference between two RDF datasets 'a.ttl' and 'b.ttl':

				     graphy read / diff / write  --inputs a.ttl b.ttl   > diff.trig

				  4) Compute the canonicalized union of a bunch of RDF datasets in the 'data/' directory:

				     graphy read / union / write   --inputs data/*.{nt,nq,ttl,trig}   > output.trig

				  5) Extract the first 2 million quads of a Turtle file:

				     graphy read -c ttl / head 2e6 / write -c ttl  < in.ttl  > view-2M.ttl

				  6) Find all owl:sameAs triples where the object is a node and different from
				     the subject, then swap the subject and object:
				  
				     graphy read / filter -x '!$object; owl:sameAs; {node}' / transform -j  \\
				         't => [t.o, t.p, t.s]' / write -c ttl   < input.ttl   > output.ttl

			`)+'\n');

			process.exit(0);
		}
		// print stack trace in error messages
		else if('--show-stack-trace' === s_arg) {
			b_show_stack_trace = true;

			// consume arg
			continue;
		}

		a_series.push(s_arg);
	}

	// flush the final series, unless it is empty
	if(a_series.length) {
		a_pipeline.push(a_series);
	}
}

// empty command list
if(!a_pipeline.length) {
	exit('no commands given');
}
1959
// run the pipeline: feed each command the outputs of the one before it
(async() => {
	// failure handler; accepts either an Error or a plain message string
	let fe_command = (z_error) => {
		let e_command = 'string' === typeof z_error? new Error(z_error): z_error;

		// only print the stack when --show-stack-trace was given, same as the catch below
		exit(b_show_stack_trace? e_command.stack: e_command.message);
	};

	// starting inputs default to stdin if no explicit inputs given
	let a_prev = a_inputs.length? a_inputs: [process.stdin];

	// each series in pipeline; the shrinking array is also handed to every
	// command as its 4th argument
	while(a_pipeline.length) {
		let a_series = a_pipeline.shift();

		// start with command string
		let s_command = a_series[0];

		// command not found
		if(!(s_command in h_commands)) {
			// command alias
			if(s_command in h_aliases) {
				s_command = h_aliases[s_command];
			}
			// no such command
			else {
				exit(`no such command '${s_command}'`);
			}
		}

		try {
			// ref command
			let g_command = h_commands[s_command];

			// options may be a static table or a function that builds one
			let g_options = 'function' === typeof g_command.options
				? g_command.options()
				: (g_command.options || {});

			// description section; '$1' alone on a line expands to the overview
			let a_describes = g_command.description;
			let s_describe = '';
			if(a_describes.length) {
				s_describe = '\nDescription:'+a_describes
					.map(s => '  '+s.replace(/^\$1$/, g_command.overview+'.'))
					.join('\n\n');
			}

			// one usage line for the command name and one per alias
			let s_usage = [s_command, ...g_command.aliases]
				.reduce((s_out, s, i) => `${s_out}\n${i? 'Or': 'Usage'}:  $0${S_TRANSFORM_TYPE_NNSQ === g_command.type? '': ' [...]'} ${s}${g_command.syntax? ' '+g_command.syntax: ''} [OPTIONS] [ / COMMAND]*`, '');

			// transform type, followed by any positional arguments
			let s_positionals = '\n'+g_command.type+'\n';
			if(g_command.positionals) {
				let n_width_positionals = Object.entries(g_command.positionals)
					.reduce((n, [s]) => Math.max(n, s.length), 10);

				s_positionals += '\nArguments:';
				for(let [si_pos, g_pos] of Object.entries(g_command.positionals)) {
					s_positionals += `\n  ${si_pos.padEnd(n_width_positionals, ' ')}  [${g_pos.type}] ${g_pos.describe}`;
				}
			}

			// numbered examples; each is a string or a [title, command] pair
			let s_examples = '';
			if(g_command.examples && g_command.examples.length) {
				s_examples = `Examples:\n`;

				let a_egs = g_command.examples;
				for(let i_eg=0, nl_egs=a_egs.length; i_eg<nl_egs; i_eg++) {
					let z_eg = a_egs[i_eg];

					s_examples += `  ${i_eg+1}) `;
					if('string' === typeof z_eg) {
						s_examples += z_eg+'\n';
					}
					else {
						s_examples += z_eg[0]+'\n     '+z_eg[1]+'\n';
					}
				}
			}

			// build yargs and parse everything after the command name
			let g_argv = mk_yargs()
				.strict()
				.usage(s_usage+'\n'+s_describe+'\n'+s_positionals)
				.options(g_options)
				.help()
				.epilog(s_examples)
				.version(false)
				.wrap(n_width_terminal)
				.parse(a_series.slice(1));

			// no inputs
			if(!a_prev.length) {
				return fe_command(`The '${s_command}' command requires at least 1 input stream but 0 were piped in.`);
			}

			// check input cardinality
			switch(g_command.type) {
				case S_TRANSFORM_TYPE_21QRB:
				case S_TRANSFORM_TYPE_21QRN:
				case S_TRANSFORM_TYPE_21QQ: {
					if(2 !== a_prev.length) {
						// report the streams actually piped into this command
						let nl_inputs = a_prev.length;
						return fe_command(`The '${s_command}' command expects exactly 2 input streams but ${1 === nl_inputs? 'only 1 was': nl_inputs+' were'} piped in.`);
					}

					break;
				}

				default: {
					break;
				}
			}

			// eval command with its args
			let a_curr = await g_command.command(g_argv, a_prev, fe_command, a_pipeline);

			// advance inputs; entries may be promises, so settle them all first
			a_prev = await Promise.all(a_curr);
		}
		catch(e_command) {
			if(b_show_stack_trace) {
				exit(e_command.stack);
			}
			else {
				exit(e_command.message);
			}
		}
	}

	// expect single output
	if(1 !== a_prev.length) {
		exit(`expected a single output stream but last command produces ${a_prev.length} streams`);
	}

	// pipe output to stdout
	a_prev[0].pipe(process.stdout);
})();
1	`#!/usr/bin/env node`
2
3
4	`/* eslint-disable global-require */`
5	`/* eslint-disable no-console */`
6
7	`const gobble = (s_text, s_indent='') => {`
8	`let m_pad = /^(\s+)/.exec(s_text.replace(/^([ \t]*\n)/, ''));`
9	`if(m_pad) {`
10	return s_indent+s_text.replace(new RegExp(`\\n${m_pad[1]}`, 'g'), '\n'+s_indent.trim()).trim();
11	`}`
12	`else {`
13	`return s_indent+s_text.trim();`
14	`}`
15	`};`
16
17	`const fs =require('fs');`
18	`const path = require('path');`
19	`const yargs = require('yargs');`
20	`const mk_yargs = require('yargs/yargs');`
21	`const graphy = require('./api.js');`
22	`const factory = require('@graphy/core.data.factory');`
23	`const stream = require('@graphy/core.iso.stream');`
24	`const dataset_tree = require('@graphy/memory.dataset.fast');`
25
26	`const parse_filter = require('./quad-expression.js').parse;`
27	`const expression_handler = require('./expression-handler.js');`
28
29	`const F_ADAPT_STREAM = function(ds_out) {`
30	`let ds_dst = ds_out;`
31
32	`// non-object mode`
33	`if(!ds_dst._writableState.objectMode) {`
34	`// transform to JSON`
35	`ds_out = stream.quads_to_json();`
36	`}`
37	`// yes object mode and graphy writable`
38	`else if(ds_out.isGraphyWritable) {`
39	`// transform to writable data events`
40	`ds_out = stream.quads_to_writable();`