json lines reader, writer

This commit is contained in:
Jan Prochazka
2020-06-11 20:52:57 +02:00
parent 41ee6e9b91
commit b520501d1f
7 changed files with 105 additions and 29 deletions

View File

@@ -0,0 +1,32 @@
const fs = require('fs');
const stream = require('stream');
const byline = require('byline');
class ParseStream extends stream.Transform {
constructor({ header }) {
super({ objectMode: true });
this.header = header;
this.wasHeader = false;
}
_transform(chunk, encoding, done) {
const obj = JSON.parse(chunk);
if (!this.wasHeader) {
if (!this.header) this.push({ columns: Object.keys(obj).map((columnName) => ({ columnName })) });
this.wasHeader = true;
}
this.push(obj);
done();
}
}
async function jsonLinesReader({ fileName, encoding = 'utf-8', header = true }) {
console.log(`Reading file ${fileName}`);
const fileStream = fs.createReadStream(fileName, encoding);
const liner = byline(fileStream);
const parser = new ParseStream({ header });
liner.pipe(parser);
return parser;
}
module.exports = jsonLinesReader;