trilium/src/services/consistency_checks.js

403 lines
12 KiB
JavaScript
Raw Normal View History

2017-12-15 11:16:26 +08:00
"use strict";
const sql = require('./sql');
const sqlInit = require('./sql_init');
2017-12-15 11:16:26 +08:00
const log = require('./log');
const messagingService = require('./messaging');
const syncMutexService = require('./sync_mutex');
const repository = require('./repository');
const cls = require('./cls');
const Branch = require('../entities/branch');
2017-12-15 11:16:26 +08:00
let outstandingConsistencyErrors = false;
2017-12-15 11:16:26 +08:00
/**
 * Executes a consistency query and logs every row it returns as an error.
 *
 * @param {boolean} recoverable - when false, a non-empty result sets the
 *        module-level outstandingConsistencyErrors flag
 * @param {string} query - SQL to run; each returned row's `value` column is
 *        included in the logged message
 * @param {string} errorText - prefix of the logged error message
 * @returns {Promise<Array<Object>>} the rows returned by the query (empty when nothing was found)
 */
async function runCheck(recoverable, query, errorText) {
    const rows = await sql.getRows(query);

    // nothing found - nothing to log or flag
    if (rows.length === 0) {
        return rows;
    }

    const quotedValues = rows.map(({value}) => `'${value}'`);

    log.error(`${errorText}: ${quotedValues.join(', ')}`);

    if (!recoverable) {
        outstandingConsistencyErrors = true;
    }

    return rows;
}
/**
 * Verifies the shape of the note tree built from all undeleted branches.
 *
 * Starting from every note that has at least one undeleted branch, the parent
 * links are followed upwards until 'root' is reached. The following problems
 * are logged and set the module-level outstandingConsistencyErrors flag:
 *  - a parent which already appears on the walked path (a cycle),
 *  - a note on the way up which has no undeleted branch at all,
 *  - 'root' not having exactly one parent equal to 'none'.
 *
 * @returns {Promise<void>}
 */
async function checkTreeCycles() {
    // Map (instead of a plain object) so note IDs can never clash with Object.prototype keys
    const childToParents = new Map();
    const rows = await sql.getRows("SELECT noteId, parentNoteId FROM branches WHERE isDeleted = 0");

    for (const {noteId, parentNoteId} of rows) {
        if (!childToParents.has(noteId)) {
            childToParents.set(noteId, []);
        }

        childToParents.get(noteId).push(parentNoteId);
    }

    /**
     * Recursively follows the parents of noteId.
     * `path` holds the notes already visited on the way up (children first).
     */
    function checkTreeCycle(noteId, path) {
        if (noteId === 'root') {
            return;
        }

        const parentNoteIds = childToParents.get(noteId);

        if (!parentNoteIds || parentNoteIds.length === 0) {
            // previously this pushed into an undeclared `errorList` and threw a ReferenceError
            log.error(`No parents found for noteId=${noteId}`);
            outstandingConsistencyErrors = true;
            return;
        }

        for (const parentNoteId of parentNoteIds) {
            if (path.includes(parentNoteId)) {
                log.error(`Tree cycle detected at parent-child relationship: ${parentNoteId} - ${noteId}, whole path: ${path}`);
                outstandingConsistencyErrors = true;
            }
            else {
                checkTreeCycle(parentNoteId, [...path, noteId]);
            }
        }
    }

    for (const noteId of childToParents.keys()) {
        checkTreeCycle(noteId, []);
    }

    // root may be missing entirely (e.g. its branch is deleted), which must be reported, not crash
    const rootParents = childToParents.get('root');

    if (!rootParents || rootParents.length !== 1 || rootParents[0] !== 'none') {
        log.error('Incorrect root parent: ' + JSON.stringify(rootParents));
        outstandingConsistencyErrors = true;
    }
}
/**
 * Cross-checks one table against the `sync` table in both directions: rows of
 * the table without a sync record, and sync records without a row in the table.
 * Both checks are run as non-recoverable.
 *
 * @param {string} table - table name, interpolated directly into the SQL
 * @param {string} key - key column of the table, interpolated directly into the SQL
 * @returns {Promise<void>}
 */
async function runSyncRowChecks(table, key) {
    // for 'options' only rows with isSynced = 1 are checked; other tables get a no-op condition
    const syncedCondition = table === 'options' ? 'isSynced = 1' : '1';

    const missingSyncQuery = `
        SELECT
            ${key} AS value
        FROM
            ${table}
            LEFT JOIN sync ON sync.entityName = '${table}' AND entityId = ${key}
        WHERE
            sync.id IS NULL AND ${syncedCondition}`;

    await runCheck(false, missingSyncQuery, `Missing sync records for ${key} in table ${table}`);

    const missingEntityQuery = `
        SELECT
            entityId AS value
        FROM
            sync
            LEFT JOIN ${table} ON entityId = ${key}
        WHERE
            sync.entityName = '${table}'
            AND ${key} IS NULL`;

    await runCheck(false, missingEntityQuery, `Missing ${table} records for existing sync rows`);
}
/**
 * Marks every undeleted relation attribute with an empty value (no target) as
 * deleted, saves it and logs the automatic fix.
 *
 * @returns {Promise<void>}
 */
async function fixEmptyRelationTargets() {
    const emptyRelations = await repository.getEntities("SELECT * FROM attributes WHERE isDeleted = 0 AND type = 'relation' AND value = ''");

    for (const relation of emptyRelations) {
        relation.isDeleted = true;
        await relation.save();

        // the closing quote after the relation name was missing in the original message
        log.error(`Relation ${relation.attributeId} of name "${relation.name}" has empty target. Autofixed.`);
    }
}
/**
 * Finds notes (other than 'root') which have no branch row at all and gives
 * each of them a new branch under 'root' with the prefix 'recovered'.
 *
 * @returns {Promise<void>}
 */
async function checkMissingBranches() {
    const orphanRows = await runCheck(true, `
        SELECT
            noteId AS value
        FROM
            notes
            LEFT JOIN branches USING(noteId)
        WHERE
            noteId != 'root'
            AND branches.branchId IS NULL`,
        "Missing branches for following note IDs");

    for (const row of orphanRows) {
        const noteId = row.value;

        const recoveredBranch = new Branch({
            parentNoteId: 'root',
            noteId,
            prefix: 'recovered'
        });

        const branch = await recoveredBranch.save();

        log.info(`Created missing branch ${branch.branchId} for note ${noteId}`);
    }
}
/**
 * Finds branches whose noteId has no matching row in `notes` and marks each
 * such branch as deleted.
 *
 * @returns {Promise<void>}
 */
async function checkMissingNotes() {
    const danglingRows = await runCheck(true, `
        SELECT
            branchId || ' > ' || branches.noteId AS value, branchId, branches.noteId
        FROM
            branches
            LEFT JOIN notes USING(noteId)
        WHERE
            notes.noteId IS NULL`,
        "Missing notes records for following branch ID > note ID");

    for (const row of danglingRows) {
        const branchId = row.branchId;
        const noteId = row.noteId;

        const danglingBranch = await repository.getBranch(branchId);
        danglingBranch.isDeleted = true;
        await danglingBranch.save();

        log.info(`Removed ${branchId} because it pointed to the missing ${noteId}`);
    }
}
2017-12-15 11:16:26 +08:00
/**
 * Finds undeleted branches which belong to a deleted note and marks each of
 * them as deleted too.
 *
 * @returns {Promise<void>}
 */
async function checkAllDeletedNotesBranchesAreDeleted() {
    const staleRows = await runCheck(true, `
        SELECT
            branchId AS value, branchId, noteId
        FROM
            branches
            JOIN notes USING(noteId)
        WHERE
            notes.isDeleted = 1
            AND branches.isDeleted = 0`,
        "Branch is not deleted even though main note is deleted for following branch IDs");

    for (const row of staleRows) {
        const branchId = row.branchId;
        const noteId = row.noteId;

        const staleBranch = await repository.getBranch(branchId);
        staleBranch.isDeleted = true;
        await staleBranch.save();

        log.info(`Branch ${branchId} has been deleted since associated note ${noteId} is deleted.`);
    }
}
/**
 * Finds undeleted notes whose branches are all deleted and gives each of them
 * a new branch under 'root' with the prefix 'recovered'.
 *
 * @returns {Promise<void>}
 */
async function checkAllNotesShouldHaveUndeletedBranch() {
    // the extra JOIN leaves out orphan notes with no branches at all - those are reported separately
    const noteRows = await runCheck(true, `
        SELECT
            DISTINCT noteId AS value
        FROM
            notes
            JOIN branches USING(noteId)
        WHERE
            (SELECT COUNT(*) FROM branches WHERE notes.noteId = branches.noteId AND branches.isDeleted = 0) = 0
            AND notes.isDeleted = 0
    `, 'No undeleted branches for note IDs');

    for (const row of noteRows) {
        const noteId = row.value;

        const recoveredBranch = new Branch({
            parentNoteId: 'root',
            noteId,
            prefix: 'recovered'
        });

        const branch = await recoveredBranch.save();

        log.info(`Created missing branch ${branch.branchId} for note ${noteId}`);
    }
}
/**
 * Runs the whole consistency check suite in a fixed order.
 *
 * The module-level outstandingConsistencyErrors flag is reset first; the
 * auto-fixing checks and the plain SQL checks then run one after another.
 * The tree cycle check runs last and only when none of the previous checks
 * raised the flag, because it assumes the basic data is consistent.
 *
 * @returns {Promise<boolean>} true when no outstanding (non-recoverable) error was found
 */
async function runAllChecks() {
    outstandingConsistencyErrors = false;

    await checkMissingBranches();

    await checkMissingNotes();

    await checkAllDeletedNotesBranchesAreDeleted();

    // FIXME - does this make sense? Specifically branch - branch comparison seems strange
    await runCheck(false, `
        SELECT
            child.branchId AS value
        FROM
            branches AS child
        WHERE
            child.isDeleted = 0
            AND child.parentNoteId != 'none'
            AND (SELECT COUNT(*) FROM branches AS parent WHERE parent.noteId = child.parentNoteId
            AND parent.isDeleted = 0) = 0`,
        "All parent branches are deleted but child branch is not for these child branch IDs");

    await checkAllNotesShouldHaveUndeletedBranch();

    await runCheck(false, `
        SELECT
            child.parentNoteId || ' > ' || child.noteId AS value
        FROM branches
            AS child
            LEFT JOIN branches AS parent ON parent.noteId = child.parentNoteId
        WHERE
            parent.noteId IS NULL
            AND child.parentNoteId != 'none'`,
        "Not existing parent in the following parent > child relations");

    await runCheck(false, `
        SELECT
            noteRevisionId || ' > ' || note_revisions.noteId AS value
        FROM
            note_revisions LEFT JOIN notes USING(noteId)
        WHERE
            notes.noteId IS NULL`,
        "Missing notes records for following note revision ID > note ID");

    await runCheck(false, `
        SELECT
            branches.parentNoteId || ' > ' || branches.noteId AS value
        FROM
            branches
        WHERE
            branches.isDeleted = 0
        GROUP BY
            branches.parentNoteId,
            branches.noteId
        HAVING
            COUNT(*) > 1`,
        "Duplicate undeleted parent note <-> note relationship - parent note ID > note ID");

    await runCheck(false, `
        SELECT
            noteId AS value
        FROM
            notes
        WHERE
            type != 'text'
            AND type != 'code'
            AND type != 'render'
            AND type != 'file'
            AND type != 'image'
            AND type != 'search'
            AND type != 'relation-map'`,
        "Note has invalid type");

    await runCheck(false, `
        SELECT
            noteId AS value
        FROM
            notes
        WHERE
            isDeleted = 0
            AND content IS NULL`,
        "Note content is null even though it is not deleted");

    await runCheck(false, `
        SELECT
            parentNoteId AS value
        FROM
            branches
            JOIN notes ON notes.noteId = branches.parentNoteId
        WHERE
            type == 'search'`,
        "Search note has children");

    await fixEmptyRelationTargets();

    await runCheck(false, `
        SELECT
            attributeId AS value
        FROM
            attributes
        WHERE
            type != 'label'
            AND type != 'label-definition'
            AND type != 'relation'
            AND type != 'relation-definition'`,
        "Attribute has invalid type");

    await runCheck(false, `
        SELECT
            attributeId AS value
        FROM
            attributes
            LEFT JOIN notes ON attributes.noteId = notes.noteId AND notes.isDeleted = 0
        WHERE
            attributes.isDeleted = 0
            AND notes.noteId IS NULL`,
        "Attribute reference to the owning note is broken");

    await runCheck(false, `
        SELECT
            attributeId AS value
        FROM
            attributes
            LEFT JOIN notes AS targetNote ON attributes.value = targetNote.noteId AND targetNote.isDeleted = 0
        WHERE
            attributes.type = 'relation'
            AND attributes.isDeleted = 0
            AND targetNote.noteId IS NULL`,
        "Relation reference to the target note is broken");

    await runCheck(false, `
        SELECT
            linkId AS value
        FROM
            links
        WHERE
            type != 'image'
            AND type != 'hyper'
            AND type != 'relation-map'`,
        "Link type is invalid");

    // The target side must be joined on links.targetNoteId; joining both aliases on
    // links.noteId (as before) made the target check a duplicate of the source check.
    // NOTE(review): assumes the links table has a targetNoteId column - confirm against the schema.
    await runCheck(false, `
        SELECT
            linkId AS value
        FROM
            links
            LEFT JOIN notes AS sourceNote ON sourceNote.noteId = links.noteId AND sourceNote.isDeleted = 0
            LEFT JOIN notes AS targetNote ON targetNote.noteId = links.targetNoteId AND targetNote.isDeleted = 0
        WHERE
            links.isDeleted = 0
            AND (sourceNote.noteId IS NULL
                 OR targetNote.noteId IS NULL)`,
        "Link to source/target note link is broken");

    await runSyncRowChecks("notes", "noteId");
    await runSyncRowChecks("note_revisions", "noteRevisionId");
    await runSyncRowChecks("branches", "branchId");
    await runSyncRowChecks("recent_notes", "branchId");
    await runSyncRowChecks("attributes", "attributeId");
    await runSyncRowChecks("api_tokens", "apiTokenId");
    await runSyncRowChecks("options", "name");

    if (!outstandingConsistencyErrors) {
        // we run this only if basic checks passed since this assumes basic data consistency
        // (the condition used to be inverted, running the tree check only after failures)
        await checkTreeCycles();
    }

    return !outstandingConsistencyErrors;
}
/**
 * Runs all consistency checks inside syncMutexService.doExclusively, logs
 * the outcome together with the elapsed time and, on failure, sends a
 * 'consistency-checks-failed' message to all clients.
 *
 * @returns {Promise<void>}
 */
async function runChecks() {
    let dbConsistent;
    let elapsedTimeMs;

    await syncMutexService.doExclusively(async () => {
        const startedAt = Date.now();

        dbConsistent = await runAllChecks();

        elapsedTimeMs = Date.now() - startedAt;
    });

    if (dbConsistent) {
        log.info(`All consistency checks passed (took ${elapsedTimeMs}ms)`);
    }
    else {
        log.info(`Consistency checks failed (took ${elapsedTimeMs}ms)`);

        messagingService.sendMessageToAllClients({type: 'consistency-checks-failed'});
    }
}
sqlInit.dbReady.then(() => {
setInterval(cls.wrap(runChecks), 60 * 60 * 1000);
2017-12-15 11:16:26 +08:00
// kickoff backup immediately
setTimeout(cls.wrap(runChecks), 10000);
2017-12-15 11:16:26 +08:00
});
module.exports = {
runChecks
};