budibase/packages/server/src/utilities/csvParser.js

83 lines
1.9 KiB
JavaScript
Raw Normal View History

2020-10-02 17:16:06 +02:00
const csv = require("csvtojson")
const VALIDATORS = {
string: () => true,
number: attribute => !isNaN(Number(attribute)),
datetime: attribute => !isNaN(new Date(attribute).getTime()),
}
const PARSERS = {
datetime: attribute => new Date(attribute).toISOString(),
}
function parse(path, parsers) {
2020-10-05 11:51:58 +02:00
const result = csv({ parsers }).fromFile(path)
2020-10-02 17:16:06 +02:00
const schema = {}
return new Promise((resolve, reject) => {
result.on("header", headers => {
for (let header of headers) {
schema[header] = {
type: parsers[header] ? parsers[header].type : "string",
success: true,
}
}
})
result.fromFile(path).subscribe(row => {
// For each CSV row
// parse all the columns that need parsed
for (let key in parsers) {
2020-10-05 11:51:58 +02:00
// if the parsing has already failed for a column
// skip that column
if (
!schema[key] ||
!schema[key].success ||
schema[key].type === "omit"
) {
continue
}
2020-10-02 17:16:06 +02:00
2020-10-05 11:51:58 +02:00
// get the validator for the column type
2020-10-02 17:16:06 +02:00
const validator = VALIDATORS[parsers[key].type]
try {
2020-10-05 15:07:39 +02:00
// allow null/undefined values
schema[key].success = !row[key] || !!validator(row[key])
2020-10-02 17:16:06 +02:00
} catch (err) {
schema[key].success = false
}
}
})
result.on("done", error => {
if (error) {
console.error(error)
reject(error)
}
resolve(schema)
})
})
}
async function transform({ schema, path }) {
const colParser = {}
for (let key in schema) {
2020-10-05 11:51:58 +02:00
colParser[key] = PARSERS[schema[key].type] || schema[key].type
2020-10-02 17:16:06 +02:00
}
try {
const json = await csv({ colParser }).fromFile(path)
return json
} catch (err) {
console.error(`Error transforming CSV to JSON for data import`, err)
2020-10-05 12:48:13 +02:00
throw err
2020-10-02 17:16:06 +02:00
}
}
module.exports = {
parse,
transform,
}