mirror of
https://github.com/ksyasuda/SubMiner.git
synced 2026-02-28 06:22:45 -08:00
177 lines
6.1 KiB
JavaScript
177 lines
6.1 KiB
JavaScript
/*
|
|
* Copyright (C) 2024-2025 Yomitan Authors
|
|
*
|
|
* This program is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
import {prefixInflection, suffixInflection} from '../language-transforms.js';
|
|
|
|
/** @typedef {keyof typeof conditions} Condition */
|
|
|
|
// https://www.dartmouth.edu/~deutsch/Grammatik/Wortbildung/Separables.html
|
|
const separablePrefixes = ['ab', 'an', 'auf', 'aus', 'auseinander', 'bei', 'da', 'dabei', 'dar', 'daran', 'dazwischen', 'durch', 'ein', 'empor', 'entgegen', 'entlang', 'entzwei', 'fehl', 'fern', 'fest', 'fort', 'frei', 'gegenüber', 'gleich', 'heim', 'her', 'herab', 'heran', 'herauf', 'heraus', 'herbei', 'herein', 'herüber', 'herum', 'herunter', 'hervor', 'hin', 'hinab', 'hinauf', 'hinaus', 'hinein', 'hinterher', 'hinunter', 'hinweg', 'hinzu', 'hoch', 'los', 'mit', 'nach', 'nebenher', 'nieder', 'statt', 'um', 'vor', 'voran', 'voraus', 'vorbei', 'vorüber', 'vorweg', 'weg', 'weiter', 'wieder', 'zu', 'zurecht', 'zurück', 'zusammen'];
|
|
const germanLetters = 'a-zA-ZäöüßÄÖÜẞ';
|
|
|
|
/**
|
|
* @param {string} prefix
|
|
* @param {Condition[]} conditionsIn
|
|
* @param {Condition[]} conditionsOut
|
|
* @returns {import('language-transformer').Rule<Condition>}
|
|
*/
|
|
function separatedPrefix(prefix, conditionsIn, conditionsOut) {
|
|
const regex = new RegExp(`^([${germanLetters}]+) .+ ${prefix}$`);
|
|
return {
|
|
type: 'other',
|
|
isInflected: regex,
|
|
deinflect: (term) => {
|
|
return term.replace(regex, '$1 ' + prefix);
|
|
},
|
|
conditionsIn,
|
|
conditionsOut,
|
|
};
|
|
}
|
|
|
|
const separatedPrefixInflections = separablePrefixes.map((prefix) => {
|
|
return separatedPrefix(prefix, [], []);
|
|
});
|
|
|
|
const zuInfinitiveInflections = separablePrefixes.map((prefix) => {
|
|
return prefixInflection(prefix + 'zu', prefix, [], ['v']);
|
|
});
|
|
|
|
/**
|
|
* @returns {import('language-transformer').Rule<Condition>[]}
|
|
*/
|
|
function getBasicPastParticiples() {
|
|
const regularPastParticiple = new RegExp(`^ge([${germanLetters}]+)t$`);
|
|
const suffixes = ['n', 'en'];
|
|
return suffixes.map((suffix) => ({
|
|
type: 'other',
|
|
isInflected: regularPastParticiple,
|
|
deinflect: (term) => {
|
|
return term.replace(regularPastParticiple, `$1${suffix}`);
|
|
},
|
|
conditionsIn: [],
|
|
conditionsOut: ['vw'],
|
|
}));
|
|
}
|
|
|
|
/**
|
|
* @returns {import('language-transformer').Rule<Condition>[]}
|
|
*/
|
|
function getSeparablePastParticiples() {
|
|
const prefixDisjunction = separablePrefixes.join('|');
|
|
const separablePastParticiple = new RegExp(`^(${prefixDisjunction})ge([${germanLetters}]+)t$`);
|
|
const suffixes = ['n', 'en'];
|
|
return suffixes.map((suffix) => ({
|
|
type: 'other',
|
|
isInflected: separablePastParticiple,
|
|
deinflect: (term) => {
|
|
return term.replace(separablePastParticiple, `$1$2${suffix}`);
|
|
},
|
|
conditionsIn: [],
|
|
conditionsOut: ['vw'],
|
|
}));
|
|
}
|
|
|
|
const conditions = {
|
|
v: {
|
|
name: 'Verb',
|
|
isDictionaryForm: true,
|
|
subConditions: ['vw', 'vs'],
|
|
},
|
|
vw: {
|
|
name: 'Weak verb',
|
|
isDictionaryForm: true,
|
|
},
|
|
vs: {
|
|
name: 'Strong verb',
|
|
isDictionaryForm: true,
|
|
},
|
|
n: {
|
|
name: 'Noun',
|
|
isDictionaryForm: true,
|
|
},
|
|
adj: {
|
|
name: 'Adjective',
|
|
isDictionaryForm: true,
|
|
},
|
|
};
|
|
|
|
export const germanTransforms = {
|
|
language: 'de',
|
|
conditions,
|
|
transforms: {
|
|
'nominalization': {
|
|
name: 'nominalization',
|
|
description: 'Noun formed from a verb',
|
|
rules: [
|
|
suffixInflection('ung', 'en', [], ['v']),
|
|
suffixInflection('lung', 'eln', [], ['v']),
|
|
suffixInflection('rung', 'rn', [], ['v']),
|
|
],
|
|
},
|
|
'-bar': {
|
|
name: '-bar',
|
|
description: '-able adjective from a verb',
|
|
rules: [
|
|
suffixInflection('bar', 'en', ['adj'], ['v']),
|
|
suffixInflection('bar', 'n', ['adj'], ['v']),
|
|
],
|
|
},
|
|
'negative': {
|
|
name: 'negative',
|
|
description: 'Negation',
|
|
rules: [
|
|
prefixInflection('un', '', [], ['adj']),
|
|
],
|
|
},
|
|
'past participle': {
|
|
name: 'past participle',
|
|
rules: [
|
|
...getBasicPastParticiples(),
|
|
...getSeparablePastParticiples(),
|
|
],
|
|
},
|
|
'separated prefix': {
|
|
name: 'separated prefix',
|
|
rules: [
|
|
...separatedPrefixInflections,
|
|
],
|
|
},
|
|
'zu-infinitive': {
|
|
name: 'zu-infinitive',
|
|
rules: [
|
|
...zuInfinitiveInflections,
|
|
],
|
|
},
|
|
'-heit': {
|
|
name: '-heit',
|
|
description:
|
|
'1. Converts an adjective into a noun and usually denotes an abstract quality of the adjectival root. ' +
|
|
'It is often equivalent to the English suffixes -ness, -th, -ty, -dom:\n' +
|
|
'\t schön (“beautiful”) + -heit → Schönheit (“beauty”)\n' +
|
|
'\t neu (“new”) + -heit → Neuheit (“novelty”)\n' +
|
|
'2. Converts concrete nouns into abstract nouns:\n' +
|
|
'\t Kind (“child”) + -heit → Kindheit (“childhood”)\n' +
|
|
'\t Christ (“Christian”) + -heit → Christenheit (“Christendom”)\n',
|
|
rules: [
|
|
suffixInflection('heit', '', ['n'], ['adj', 'n']),
|
|
suffixInflection('keit', '', ['n'], ['adj', 'n']),
|
|
],
|
|
},
|
|
|
|
},
|
|
};
|