Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Deinflection cycle testing #477

Merged
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
165 changes: 165 additions & 0 deletions test/deinflection-cycles.test.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,165 @@
/*
* Copyright (C) 2024 Yomitan Authors
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <https://www.gnu.org/licenses/>.
*/

import {readFileSync} from 'fs';
import {join, dirname as pathDirname} from 'path';
import {fileURLToPath} from 'url';
import {describe, test} from 'vitest';
import {parseJson} from '../dev/json.js';
import {Deinflector} from '../ext/js/language/deinflector.js';

class DeinflectionNode {
/**
* @param {string} text
* @param {import('deinflector').ReasonTypeRaw[]} ruleNames
* @param {?RuleNode} ruleNode
* @param {?DeinflectionNode} previous
*/
constructor(text, ruleNames, ruleNode, previous) {
/** @type {string} */
this.text = text;
/** @type {import('deinflector').ReasonTypeRaw[]} */
this.ruleNames = ruleNames;
/** @type {?RuleNode} */
this.ruleNode = ruleNode;
/** @type {?DeinflectionNode} */
this.previous = previous;
}

/**
* @param {DeinflectionNode} other
* @returns {boolean}
*/
historyIncludes(other) {
/** @type {?DeinflectionNode} */
// eslint-disable-next-line @typescript-eslint/no-this-alias
let node = this;
for (; node !== null; node = node.previous) {
if (
node.ruleNode === other.ruleNode &&
node.text === other.text &&
arraysAreEqual(node.ruleNames, other.ruleNames)
) {
return true;
}
}
return false;
}

/**
* @returns {DeinflectionNode[]}
*/
getHistory() {
/** @type {DeinflectionNode[]} */
const results = [];
/** @type {?DeinflectionNode} */
// eslint-disable-next-line @typescript-eslint/no-this-alias
let node = this;
for (; node !== null; node = node.previous) {
results.unshift(node);
}
return results;
}
}

class RuleNode {
/**
* @param {string} groupName
* @param {import('deinflector').ReasonRaw} rule
*/
constructor(groupName, rule) {
/** @type {string} */
this.groupName = groupName;
/** @type {import('deinflector').ReasonRaw} */
this.rule = rule;
}
}

/**
* @template [T=unknown]
* @param {T[]} rules1
* @param {T[]} rules2
* @returns {boolean}
*/
function arraysAreEqual(rules1, rules2) {
if (rules1.length !== rules2.length) { return false; }
for (const rule1 of rules1) {
if (!rules2.includes(rule1)) { return false; }
}
return true;
}

describe('Deinflection data', () => {
test('Check for cycles', ({expect}) => {
const dirname = pathDirname(fileURLToPath(import.meta.url));

/** @type {import('deinflector').ReasonsRaw} */
const deinflectionReasons = parseJson(readFileSync(join(dirname, '../ext/data/deinflect.json'), {encoding: 'utf8'}));

/** @type {RuleNode[]} */
const ruleNodes = [];
for (const [groupName, reasonInfo] of Object.entries(deinflectionReasons)) {
for (const rule of reasonInfo) {
ruleNodes.push(new RuleNode(groupName, rule));
}
}

/** @type {DeinflectionNode[]} */
const deinflectionNodes = [];
for (const ruleNode of ruleNodes) {
deinflectionNodes.push(new DeinflectionNode(`?${ruleNode.rule.kanaIn}`, [], null, null));
}
for (let i = 0; i < deinflectionNodes.length; ++i) {
const deinflectionNode = deinflectionNodes[i];
const {text, ruleNames} = deinflectionNode;
for (const ruleNode of ruleNodes) {
const {kanaIn, kanaOut, rulesIn, rulesOut} = ruleNode.rule;
if (
!Deinflector.rulesMatch(Deinflector.rulesToRuleFlags(ruleNames), Deinflector.rulesToRuleFlags(rulesIn)) ||
!text.endsWith(kanaIn) ||
(text.length - kanaIn.length + kanaOut.length) <= 0
) {
continue;
}

const newDeinflectionNode = new DeinflectionNode(
text.substring(0, text.length - kanaIn.length) + kanaOut,
rulesOut,
ruleNode,
deinflectionNode
);

// Cycle check
if (deinflectionNode.historyIncludes(newDeinflectionNode)) {
const stack = [];
for (const item of newDeinflectionNode.getHistory()) {
stack.push(
item.ruleNode === null ?
`${item.text} (start)` :
`${item.text} (${item.ruleNode.groupName}, ${item.ruleNode.rule.rulesIn.join(',')}=>${item.ruleNode.rule.rulesOut.join(',')}, ${item.ruleNode.rule.kanaIn}=>${item.ruleNode.rule.kanaOut})`
);
}
const message = `Cycle detected:\n ${stack.join('\n ')}`;
expect.soft(true, message).toEqual(false);
continue;
}

deinflectionNodes.push(newDeinflectionNode);
}
}
});
});
2 changes: 1 addition & 1 deletion test/deinflector.test.js
Original file line number Diff line number Diff line change
Expand Up @@ -38,7 +38,7 @@ function hasTermReasons(deinflector, source, expectedTerm, expectedRule, expecte
if (term !== expectedTerm) { continue; }
if (typeof expectedRule !== 'undefined') {
const expectedFlags = Deinflector.rulesToRuleFlags([expectedRule]);
if (rules !== 0 && (rules & expectedFlags) !== expectedFlags) { continue; }
if (!Deinflector.rulesMatch(rules, expectedFlags)) { continue; }
}
let okay = true;
if (typeof expectedReasons !== 'undefined') {
Expand Down
14 changes: 8 additions & 6 deletions types/ext/deinflector.d.ts
Original file line number Diff line number Diff line change
Expand Up @@ -20,12 +20,14 @@ import type * as TranslationInternal from './translation-internal';
export type ReasonTypeRaw = 'v1' | 'v1d' | 'v1p' | 'v5' | 'vs' | 'vk' | 'vz' | 'adj-i' | 'iru';

export type ReasonsRaw = {
[reason: string]: {
kanaIn: string;
kanaOut: string;
rulesIn: ReasonTypeRaw[];
rulesOut: ReasonTypeRaw[];
}[];
[reason: string]: ReasonRaw[];
};

export type ReasonRaw = {
kanaIn: string;
kanaOut: string;
rulesIn: ReasonTypeRaw[];
rulesOut: ReasonTypeRaw[];
};

export type ReasonVariant = [
Expand Down
Loading