iptv-database/scripts/db/validate.js

146 lines
3.9 KiB
JavaScript
Raw Normal View History

2022-02-11 21:55:50 -05:00
const { logger, file, csv } = require('../core')
const { program } = require('commander')
const schemes = require('./schemes')
const chalk = require('chalk')
const Joi = require('joi')
program.argument('[filepath]', 'Path to file to validate').parse(process.argv)
async function main() {
let errors = []
const files = program.args.length
? program.args
: [
2022-02-13 22:11:47 -05:00
'data/blocklist.csv',
2022-02-11 21:55:50 -05:00
'data/categories.csv',
'data/channels.csv',
'data/countries.csv',
'data/languages.csv',
'data/regions.csv',
'data/subdivisions.csv'
]
for (const filepath of files) {
if (!filepath.endsWith('.csv')) continue
2022-02-17 09:33:35 -05:00
const eol = await file.eol(filepath)
if (eol !== 'CRLF') {
logger.error(chalk.red(`\nError: file must have line endings with CRLF (${filepath})`))
process.exit(1)
}
const csvString = await file.read(filepath)
if (/\s+$/.test(csvString)) {
logger.error(chalk.red(`\nError: empty lines at the end of file not allowed (${filepath})`))
process.exit(1)
}
2022-02-11 21:55:50 -05:00
const filename = file.getFilename(filepath)
if (!schemes[filename]) {
2022-02-13 22:06:08 -05:00
logger.error(chalk.red(`\nError: "${filename}" scheme is missing`))
2022-02-11 21:55:50 -05:00
process.exit(1)
}
2022-02-21 06:07:37 -05:00
const data = await csv.fromString(csvString).catch(err => {
logger.error(chalk.red(`\n${err.message} (${filepath})`))
process.exit(1)
})
2022-02-11 21:55:50 -05:00
let fileErrors = []
if (filename === 'channels') {
2022-02-21 06:07:37 -05:00
if (/\"/.test(csvString)) {
logger.error(chalk.red(`\nError: \" character is not allowed (${filepath})`))
process.exit(1)
}
2022-02-11 21:55:50 -05:00
fileErrors = fileErrors.concat(findDuplicatesById(data))
2022-04-08 21:02:02 -04:00
let categories = await csv.fromFile('data/categories.csv').catch(err => {
logger.error(chalk.red(`\nError: ${err.message}`))
process.exit(1)
})
categories = categories.map(c => c.id)
data.forEach((row, i) => {
if (
categories.length &&
row.categories.length &&
intersection(categories, row.categories).length !== row.categories.length
) {
fileErrors.push({
line: i + 2,
message: `"${row.id}" has the wrong categories "${row.categories.join(';')}"`
})
}
})
2022-04-08 20:44:51 -04:00
} else if (filename === 'blocklist') {
let channels = await csv.fromFile('data/channels.csv').catch(err => {
logger.error(chalk.red(`\nError: ${err.message}`))
process.exit(1)
})
channels = channels.map(c => c.id)
data.forEach((row, i) => {
if (channels.length && !channels.includes(row.channel)) {
fileErrors.push({
line: i + 2,
message: `"${row.channel}" is missing in the channels.csv`
})
}
})
2022-02-11 21:55:50 -05:00
}
const schema = Joi.object(schemes[filename])
data.forEach((row, i) => {
const { error } = schema.validate(row, { abortEarly: false })
if (error) {
error.details.forEach(detail => {
fileErrors.push({ line: i + 2, message: detail.message })
})
}
})
if (fileErrors.length) {
logger.info(`\n${chalk.underline(filepath)}`)
fileErrors.forEach(err => {
const position = err.line.toString().padEnd(6, ' ')
logger.error(` ${chalk.gray(position)} ${err.message}`)
})
errors = errors.concat(fileErrors)
}
}
if (errors.length) {
logger.error(chalk.red(`\n${errors.length} error(s)`))
process.exit(1)
}
}
main()
function findDuplicatesById(data) {
data = data.map(i => {
i.id = i.id.toLowerCase()
return i
})
const errors = []
const schema = Joi.array().unique((a, b) => a.id === b.id)
const { error } = schema.validate(data, { abortEarly: false })
if (error) {
error.details.forEach(detail => {
errors.push({
line: detail.context.pos + 2,
message: `Entry with the id "${detail.context.value.id}" already exists`
})
})
}
return errors
}
2022-04-08 21:02:02 -04:00
function intersection(array1, array2) {
return array1.filter(function (n) {
return array2.indexOf(n) !== -1
})
}