budibase/packages/server/src/utilities/csvParser.js

75 lines
1.7 KiB
JavaScript
Raw Normal View History

2020-10-02 17:16:06 +02:00
const csv = require("csvtojson")
const VALIDATORS = {
string: () => true,
number: attribute => !isNaN(Number(attribute)),
datetime: attribute => !isNaN(new Date(attribute).getTime()),
}
const PARSERS = {
2020-10-14 14:09:03 +02:00
number: attribute => Number(attribute),
2020-10-02 17:16:06 +02:00
datetime: attribute => new Date(attribute).toISOString(),
}
function parse(path, parsers) {
2020-10-05 15:43:34 +02:00
const result = csv().fromFile(path)
2020-10-02 17:16:06 +02:00
const schema = {}
return new Promise((resolve, reject) => {
result.on("header", headers => {
for (let header of headers) {
schema[header] = {
type: parsers[header] ? parsers[header].type : "string",
success: true,
}
}
})
2020-10-14 14:09:03 +02:00
result.subscribe((row, lineNumber) => {
2020-10-05 20:21:51 +02:00
// For each CSV row parse all the columns that need parsed
2020-10-02 17:16:06 +02:00
for (let key in parsers) {
2020-10-05 20:21:51 +02:00
if (!schema[key] || schema[key].success) {
// get the validator for the column type
const validator = VALIDATORS[parsers[key].type]
2020-10-02 17:16:06 +02:00
2020-10-05 20:21:51 +02:00
try {
// allow null/undefined values
schema[key].success = !row[key] || validator(row[key])
} catch (err) {
schema[key].success = false
}
2020-10-02 17:16:06 +02:00
}
}
})
result.on("done", error => {
if (error) {
console.error(error)
reject(error)
}
resolve(schema)
})
})
}
async function transform({ schema, path }) {
const colParser = {}
for (let key in schema) {
2020-10-05 11:51:58 +02:00
colParser[key] = PARSERS[schema[key].type] || schema[key].type
2020-10-02 17:16:06 +02:00
}
try {
const json = await csv({ colParser }).fromFile(path)
return json
} catch (err) {
console.error(`Error transforming CSV to JSON for data import`, err)
2020-10-05 12:48:13 +02:00
throw err
2020-10-02 17:16:06 +02:00
}
}
module.exports = {
parse,
transform,
}