// WME/aufgabe5/node_modules/csvtojson/test/testCSVConverter.ts
//
// 451 lines
// 14 KiB
// TypeScript

import {Converter} from "../src/Converter";
import csv from "../src";
var assert = require("assert");
var fs = require("fs");
var sandbox = require("sinon").sandbox.create();
// Path of the shared CSV fixture that the stream-based tests below pipe into a Converter.
var file = __dirname + "/data/testData";
// Path of the fixture read by the trailing-comma test.
var trailCommaData = __dirname + "/data/trailingComma";
describe("CSV Converter", function () {
// Restore the shared sinon sandbox after every test.
afterEach(() => {
  sandbox.restore();
});
// Smoke test: a Converter built without options is a truthy value.
it("should create new instance of csv", () => {
  const converter = new Converter();
  assert(converter);
});
// Pipes the shared fixture into a Converter and checks the number of rows handed to then().
it("should read from a stream", (done) => {
  const converter = new Converter();
  converter.then((rows) => {
    assert.equal(rows.length, 2);
    done();
  });
  fs.createReadStream(file).pipe(converter);
});
// Checks that the subscribe() callback has been invoked with a truthy row
// by the time the "done" event fires.
it("should call onNext once a row is parsed.", (done) => {
  const converter = new Converter();
  let sawRow = false;
  converter.subscribe((row) => {
    assert(row);
    sawRow = true;
  });
  converter.on("done", () => {
    assert(sawRow);
    done();
  });
  fs.createReadStream(file).pipe(converter);
});
// Checks the shape of the result passed to then(): two rows, and on the first row a date,
// nested employee fields, and key/address values of length 2.
it("should emit end_parsed message once it is finished.", (done) => {
  const converter = new Converter();
  converter.then((rows) => {
    assert(rows);
    assert(rows.length === 2);
    const first = rows[0];
    assert(first.date);
    assert(first.employee);
    assert(first.employee.name);
    assert(first.employee.age);
    assert(first.employee.number);
    assert(first.employee.key.length === 2);
    assert(first.address.length === 2);
    done();
  });
  fs.createReadStream(file).pipe(converter);
});
// Parses the trailing-comma fixture and only requires that at least one row comes back.
it("should handle traling comma gracefully", (done) => {
  const converter = new Converter();
  converter.then((rows) => {
    assert(rows);
    assert(rows.length > 0);
    done();
  });
  fs.createReadStream(trailCommaData).pipe(converter);
});
// Uses "#" as the quote character and checks that a comma inside a quoted column is kept
// as part of the value, while a literal double quote stays in the data.
it("should handle comma in column which is surrounded by qoutes", (done) => {
  const fixturePath = __dirname + "/data/dataWithComma";
  const converter = new Converter({ quote: "#" });
  converter.then((rows) => {
    assert(rows[0].col1 === "\"Mini. Sectt");
    assert.equal(rows[3].col2, "125001,fenvkdsf");
    done();
  });
  fs.createReadStream(fixturePath).pipe(converter);
});
// Transposes the parsed rows into per-column arrays inside the subscribe() callback and
// checks that the TIMESTAMP column ends up with 5 entries.
it("should be able to convert a csv to column array data", (done) => {
  const fixturePath = __dirname + "/data/columnArray";
  const columns: any = {};
  const converter = new Converter();
  // Runs once the whole input has been parsed.
  converter.then(() => {
    assert(columns.TIMESTAMP.length === 5);
    done();
  });
  // Runs for every parsed row: store each own field under its column name at the row's index.
  converter.subscribe((row, rowIndex) => {
    Object.keys(row).forEach((key) => {
      if (!(columns[key] instanceof Array)) {
        columns[key] = [];
      }
      columns[key][rowIndex] = row[key];
    });
  });
  fs.createReadStream(fixturePath).pipe(converter);
});
// Feeds the fixture content to fromString() and checks that two rows are produced.
// NOTE(review): then() is called twice on the same converter (once before and once after
// fromString()); whether both handlers run depends on Converter.then — confirm.
it("should be able to convert csv string directly", (done) => {
  const csvText = fs.readFileSync(__dirname + "/data/testData").toString();
  const converter = new Converter();
  converter.then((rows) => {
    assert.equal(rows.length, 2);
  });
  converter.fromString(csvText).then((rows) => {
    assert(rows.length === 2);
    done();
  });
});
// Parses input with an unclosed quote and expects the rejection handler to receive an
// error whose `err` field is "unclosed_quote". No fulfilment handler is registered.
it("should be able to convert csv string with error", (done) => {
  const csvText = fs.readFileSync(__dirname + "/data/dataWithUnclosedQuotes").toString();
  const converter = new Converter();
  converter.fromString(csvText).then(undefined, (error) => {
    assert(error);
    assert.equal(error.err, "unclosed_quote");
    done();
  });
});
// Registers then() on the converter first, then calls fromString() without using its
// return value; the earlier handler must still receive the two parsed rows.
it("should be able to convert csv string without callback provided", (done) => {
  const csvText = fs.readFileSync(__dirname + "/data/testData").toString();
  const converter = new Converter();
  converter.then((rows) => {
    assert(rows.length === 2);
    done();
  });
  converter.fromString(csvText);
});
// Checks TIMESTAMP values that contain a double quote or commas; on failure the actual
// value is reported as the assertion message.
it("should be able to handle columns with double quotes", (done) => {
  const csvText = fs.readFileSync(__dirname + "/data/dataWithQoutes").toString();
  const converter = new Converter();
  converter.fromString(csvText).then((rows) => {
    const firstStamp = rows[0].TIMESTAMP;
    assert(firstStamp === '13954264"22', JSON.stringify(firstStamp));
    const secondStamp = rows[1].TIMESTAMP;
    assert(secondStamp === 'abc, def, ccc', JSON.stringify(secondStamp));
    done();
  });
});
// Checks the first row's fields against expected values that contain literal double quotes.
it("should be able to handle columns with two double quotes", (done) => {
  const csvText = fs.readFileSync(__dirname + "/data/twodoublequotes").toString();
  const converter = new Converter();
  converter.fromString(csvText).then((rows) => {
    const first = rows[0];
    assert.equal(first.title, "\"");
    assert.equal(first.data, "xyabcde");
    assert.equal(first.uuid, "fejal\"eifa");
    assert.equal(first.fieldA, "bnej\"\"falkfe");
    assert.equal(first.fieldB, "\"eisjfes\"");
    done();
  });
});
// An empty input file must produce an empty result array.
it("should handle empty csv file", (done) => {
  const fixturePath = __dirname + "/data/emptyFile";
  const converter = new Converter();
  converter.then((rows) => {
    assert(rows.length === 0);
    done();
  });
  fs.createReadStream(fixturePath).pipe(converter);
});
// Counts subscribe() invocations over the large sample file and expects exactly 5290.
it("should parse large csv file", (done) => {
  const fixturePath = __dirname + "/data/large-csv-sample.csv";
  const converter = new Converter();
  let rowCount = 0;
  converter.subscribe(() => {
    rowCount++;
  });
  converter.then(() => {
    assert(rowCount === 5290);
    done();
  });
  fs.createReadStream(fixturePath).pipe(converter);
});
// With checkType enabled, every parsed row must carry values converted to the expected
// types, except column6 and column7, which colParser forces to stay strings.
//
// The per-row assertions run inside the subscribe() callback. The "done" event receives
// an error argument when parsing (including a subscriber) failed, so that argument is
// forwarded to mocha; calling done() unconditionally would let a failed row assertion
// pass unnoticed.
it("should parse data and covert to specific types", function (done) {
  var testData = __dirname + "/data/dataWithType";
  var rs = fs.createReadStream(testData);
  var csvConverter = new Converter({
    checkType: true,
    colParser: {
      "column6": "string",
      "column7": "string"
    }
  });
  csvConverter.subscribe(function (d) {
    assert(typeof d.column1 === "number");
    assert(typeof d.column2 === "string");
    assert.equal(d["colume4"], "someinvaliddate");
    assert(d.column5.hello === "world");
    assert(d.column6 === '{"hello":"world"}');
    assert(d.column7 === "1234");
    assert(d.column8 === "abcd");
    assert(d.column9 === true);
    assert(d.column10[0] === 23);
    assert(d.column10[1] === 31);
    assert(d.column11[0].hello === "world");
    assert(d["name#!"] === false);
  });
  // On success the event carries no argument, so done(undefined) reports a pass.
  csvConverter.on("done", function (err) {
    done(err);
  });
  rs.pipe(csvConverter);
});
// With checkType disabled, every field of every parsed row must stay a string
// (column10 entries included).
//
// The per-row assertions run inside the subscribe() callback. then() is given `done` as
// its rejection handler so that a parsing or subscriber error is reported to mocha as the
// test failure; without it such an error would never reach mocha.
it("should turn off field type check", function (done) {
  var testData = __dirname + "/data/dataWithType";
  var rs = fs.createReadStream(testData);
  var csvConverter = new Converter({
    checkType: false
  });
  csvConverter.subscribe(function (d) {
    assert(typeof d.column1 === "string");
    assert(typeof d.column2 === "string");
    assert(d["column3"] === "2012-01-01");
    assert(d["colume4"] === "someinvaliddate");
    assert(d.column5 === '{"hello":"world"}');
    assert.equal(d["column6"], '{"hello":"world"}');
    assert(d["column7"] === "1234");
    assert(d["column8"] === "abcd");
    assert(d.column9 === "true");
    assert(d.column10[0] === "23");
    assert(d.column10[1] === "31");
    assert(d["name#!"] === 'false');
  });
  csvConverter.then(function () {
    done();
  }, done);
  rs.pipe(csvConverter);
});
// Counts "data" events over the large sample file and expects 5290 of them by "end".
it("should emit data event correctly", (done) => {
  const fixturePath = __dirname + "/data/large-csv-sample.csv";
  const converter = new Converter({});
  let dataEvents = 0;
  converter.on("data", () => {
    dataEvents++;
  });
  converter.on("end", () => {
    assert.equal(dataEvents, 5290);
    done();
  });
  fs.createReadStream(fixturePath).pipe(converter);
});
// Parses the line-break fixture with checkType on and checks the Period and
// "Apparent age" fields of the row delivered to subscribe().
// NOTE(review): done() is called from the per-row callback, so this presumably relies on
// the fixture yielding a single row — confirm against the data file.
it("should process column with linebreaks", (done) => {
  const fixturePath = __dirname + "/data/lineBreak";
  const converter = new Converter({ checkType: true });
  converter.subscribe((row) => {
    assert(row.Period === 13);
    assert(row["Apparent age"] === "Unknown");
    done();
  });
  fs.createReadStream(fixturePath).pipe(converter);
});
// With ignoreEmpty enabled, checks the row count and the fields of the parsed rows,
// including that col4.col3 is absent on the first row.
it("be able to ignore empty columns", (done) => {
  const fixturePath = __dirname + "/data/dataIgnoreEmpty";
  const converter = fs.createReadStream(fixturePath).pipe(csv({ ignoreEmpty: true }));
  converter.then((rows) => {
    const first = rows[0];
    assert(rows.length === 3);
    assert(first.col2.length === 2);
    assert(first.col2[1] === "d3");
    assert(first.col4.col3 === undefined);
    assert(first.col4.col5 === "world");
    assert(rows[1].col1 === "d2");
    assert(rows[2].col1 === "d4");
    done();
  });
});
// With noheader set, the first line is data and columns are exposed as field1, field2, ...
it("should allow no header", (done) => {
  const fixturePath = __dirname + "/data/noheadercsv";
  const converter = fs.createReadStream(fixturePath).pipe(new Converter({ noheader: true }));
  converter.then((rows) => {
    const first = rows[0];
    assert(rows.length === 5);
    assert(first.field1 === "CC102-PDMI-001");
    assert(first.field2 === "eClass_5.1.3");
    done();
  });
});
// Supplies names for the first two columns of a headerless file; the third column is
// expected under the generated name field3.
it("should allow customised header", (done) => {
  const fixturePath = __dirname + "/data/noheadercsv";
  const options = {
    noheader: true,
    headers: ["a", "b"]
  };
  const converter = fs.createReadStream(fixturePath).pipe(new Converter(options));
  converter.then((rows) => {
    const first = rows[0];
    assert(rows.length === 5);
    assert(first.a === "CC102-PDMI-001");
    assert(first.b === "eClass_5.1.3");
    assert(first.field3 === "10/3/2014");
    done();
  });
});
// Passes an empty headers array for a file that has its own header row and expects the
// columns to be exposed as field1, field2, ...
it("should allow customised header to override existing header", (done) => {
  const fixturePath = __dirname + "/data/complexJSONCSV";
  const converter = fs.createReadStream(fixturePath).pipe(new Converter({ headers: [] }));
  converter.then((rows) => {
    const first = rows[0];
    assert(rows.length === 2);
    assert(first.field1 === "Food Factory");
    assert(first.field2 === "Oscar");
    done();
  });
});
// With custom headers and checkType on, checks the first row's three fields; the third
// is compared loosely against the empty string. The row count is not asserted here.
it("should handle when there is an empty string", (done) => {
  const fixturePath = __dirname + "/data/dataWithEmptyString";
  const options = {
    noheader: true,
    headers: ["a", "b", "c"],
    checkType: true
  };
  const converter = fs.createReadStream(fixturePath).pipe(new Converter(options));
  converter.then((rows) => {
    const first = rows[0];
    assert(first.a === "green");
    assert(first.b === 40);
    assert.equal(first.c, "");
    done();
  });
});
// Reads the CRLF fixture with a highWaterMark of 3 on the read stream and checks that
// both rows are still parsed correctly with trim disabled.
it("should detect eol correctly when first chunk is smaller than header row length", (done) => {
  const fixturePath = __dirname + "/data/dataNoTrimCRLF";
  const source = fs.createReadStream(fixturePath, { highWaterMark: 3 });
  const converter = source.pipe(new Converter({ trim: false }));
  converter.then((rows) => {
    const first = rows[0];
    assert(rows.length === 2);
    assert(first.name === "joe");
    assert(first.age === "20");
    const second = rows[1];
    assert.equal(second.name, "sam");
    assert.equal(second.age, "30");
    done();
  });
});
// Reads the CRLF fixture with a highWaterMark of 9 on the read stream and checks that
// both rows are still parsed correctly with trim disabled.
it("should detect eol correctly when first chunk ends in middle of CRLF line break", (done) => {
  const fixturePath = __dirname + "/data/dataNoTrimCRLF";
  const source = fs.createReadStream(fixturePath, { highWaterMark: 9 });
  const converter = source.pipe(new Converter({ trim: false }));
  converter.then((rows) => {
    const first = rows[0];
    assert(rows.length === 2);
    assert(first.name === "joe");
    assert(first.age === "20");
    const second = rows[1];
    assert.equal(second.name, "sam");
    assert.equal(second.age, "30");
    done();
  });
});
// Attaches a sandbox spy to the "eol" event; it must be called exactly once, with "\r\n".
it("should emit eol event when line ending is detected as CRLF", (done) => {
  const fixturePath = __dirname + "/data/dataNoTrimCRLF";
  const converter = fs.createReadStream(fixturePath).pipe(new Converter());
  const onEol = sandbox.spy((eol) => {
    assert.equal(eol, "\r\n");
  });
  converter.on("eol", onEol);
  converter.then(() => {
    assert.equal(onEol.callCount, 1, 'should emit eol event once');
    done();
  });
});
// Attaches a sandbox spy to the "eol" event; it must be called exactly once, with "\n".
it("should emit eol event when line ending is detected as LF", (done) => {
  const fixturePath = __dirname + "/data/columnArray";
  const converter = fs.createReadStream(fixturePath).pipe(new Converter());
  const onEol = sandbox.spy((eol) => {
    assert.equal(eol, "\n");
  });
  converter.on("eol", onEol);
  converter.then(() => {
    assert.equal(onEol.callCount, 1, 'should emit eol event once');
    done();
  });
});
// Parses the BOM fixture with trim disabled; the first row must be reachable under the
// plain header names "name" and "age".
it("should remove the Byte Order Mark (BOM) from input", (done) => {
  const fixturePath = __dirname + "/data/dataNoTrimBOM";
  const converter = fs.createReadStream(fixturePath).pipe(new Converter({ trim: false }));
  converter.then((rows) => {
    const first = rows[0];
    assert(rows.length === 2);
    assert(first.name === "joe");
    assert(first.age === "20");
    done();
  });
});
});