2017-10-19 11:51:54 +02:00
|
|
|
#!/usr/bin/env node
|
|
|
|
|
2017-10-18 14:39:04 +02:00
|
|
|
/*
|
|
|
|
Copyright 2017 New Vector Ltd
|
|
|
|
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
you may not use this file except in compliance with the License.
|
|
|
|
You may obtain a copy of the License at
|
|
|
|
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
See the License for the specific language governing permissions and
|
|
|
|
limitations under the License.
|
|
|
|
*/
|
|
|
|
|
2017-10-17 20:19:01 +02:00
|
|
|
/**
|
2017-10-18 15:45:04 +02:00
|
|
|
* Regenerates the translations en_EN file by walking the source tree and
|
2020-07-31 21:33:25 +02:00
|
|
|
* parsing each file with the appropriate parser. Emits a JSON file with the
|
2017-10-17 20:19:01 +02:00
|
|
|
* translatable strings mapped to themselves in the order they appeared
|
|
|
|
* in the files and grouped by the file they appeared in.
|
|
|
|
*
|
|
|
|
* Usage: node scripts/gen-i18n.js
|
|
|
|
*/
|
|
|
|
const fs = require('fs');
|
|
|
|
const path = require('path');
|
|
|
|
|
|
|
|
const walk = require('walk');
|
|
|
|
|
2020-07-31 21:33:25 +02:00
|
|
|
const parser = require("@babel/parser");
|
|
|
|
const traverse = require("@babel/traverse");
|
2017-10-17 20:19:01 +02:00
|
|
|
|
2017-11-13 20:20:14 +01:00
|
|
|
// Names of the functions whose first argument is a translatable string.
const TRANSLATIONS_FUNCS = ['_t', '_td'];

// The existing translations are read from, and the regenerated set is
// written back to, the same en_EN file.
const INPUT_TRANSLATIONS_FILE = 'src/i18n/strings/en_EN.json';
const OUTPUT_FILE = 'src/i18n/strings/en_EN.json';

// NB. The sync version of walk is broken for single files, so we walk
// all of res rather than just res/home.html.
// https://git.daplie.com/Daplie/node-walk/merge_requests/1 fixes it,
// or if we get bored waiting for it to be merged, we could switch
// to a project that's actively maintained.
const SEARCH_PATHS = ['src', 'res'];
|
|
|
|
|
2017-10-17 20:19:01 +02:00
|
|
|
/**
 * Looks up the value node of a named property on an object-literal AST node.
 *
 * Only properties whose key is a bare identifier are considered.
 *
 * @param {object} obj AST node, normally an ObjectExpression. A node without
 *     a `properties` list (e.g. a variable reference) is treated as having
 *     no properties at all.
 * @param {string} key The property name to search for.
 * @returns {object|null} The value node of the first matching property, or
 *     null if no property matches.
 */
function getObjectValue(obj, key) {
    // Same defensive default as the tag-map loop elsewhere in this file:
    // non-object-literal arguments simply have nothing to look up.
    const properties = (obj && obj.properties) || [];
    for (const prop of properties) {
        // Spread elements (`{...rest}`) carry no `key`; skip them instead of
        // crashing on `prop.key.type`.
        if (!prop.key) continue;
        if (prop.key.type === 'Identifier' && prop.key.name === key) {
            return prop.value;
        }
    }
    return null;
}
|
|
|
|
|
|
|
|
/**
 * Statically evaluates the first argument of a translation call to the
 * translation key it denotes.
 *
 * Handles string literals, `+` concatenations of resolvable operands and
 * template literals (whose raw quasi text is joined; interpolated
 * expressions are not evaluated).
 *
 * @param {object} arg AST node of the argument.
 * @returns {string|null} The key, or null if it cannot be determined
 *     statically.
 */
function getTKey(arg) {
    if (arg.type === 'Literal' || arg.type === "StringLiteral") {
        return arg.value;
    }

    if (arg.type === 'BinaryExpression' && arg.operator === '+') {
        const left = getTKey(arg.left);
        const right = getTKey(arg.right);
        // If either side is not statically known, the whole key is unknown.
        // Concatenating would otherwise coerce null into the text "null".
        if (left === null || right === null) return null;
        return left + right;
    }

    if (arg.type === 'TemplateLiteral') {
        return arg.quasis.map((q) => q.value.raw).join('');
    }

    return null;
}
|
|
|
|
|
2017-10-20 19:38:22 +02:00
|
|
|
/**
 * Extracts the names of all `%(name)s` placeholders from a translation
 * string, validating each one along the way.
 *
 * @param {string} str The translation string to scan.
 * @returns {Set<string>} The placeholder names found, in order of first
 *     appearance.
 * @throws {Error} If a `%` is followed by anything other than `%` or a
 *     `(name)` group, or if the format character after the group is not 's'.
 */
function getFormatStrings(str) {
    // Match anything that starts with %
    // We could make a regex that matched the full placeholder, but this
    // would just not match invalid placeholders and so wouldn't help us
    // detect the invalid ones.
    // Also note that for simplicity, this just matches a % character and then
    // anything up to the next % character (or a single %, or end of string).
    const formatStringRe = /%([^%]+|%|$)/g;
    const formatStrings = new Set();

    let match;
    while ((match = formatStringRe.exec(str)) !== null) {
        const placeholder = match[1]; // Minus the leading '%'
        if (placeholder === '%') continue; // Literal % is %%

        const placeholderMatch = placeholder.match(/^\((.*?)\)(.)/);
        if (placeholderMatch === null) {
            throw new Error(`Invalid format specifier: '${match[0]}'`);
        }

        // A successful match on a regex with two capture groups always has
        // exactly three entries, so no further length check is needed.
        const [, placeholderName, placeholderFormat] = placeholderMatch;

        if (placeholderFormat !== 's') {
            throw new Error(`'${placeholderFormat}' used as format character: you probably meant 's'`);
        }

        formatStrings.add(placeholderName);
    }

    return formatStrings;
}
|
|
|
|
|
2017-10-18 20:36:07 +02:00
|
|
|
/**
 * Collects the translatable strings used in a JavaScript/TypeScript file.
 *
 * The file is parsed with Babel and every call to one of the
 * TRANSLATIONS_FUNCS is inspected. For `_t` calls the placeholders in the
 * string are checked against the substitutions object (second argument) and
 * quoted tag names in the tag map (third argument) are checked against the
 * string. Calls that pass a `count` substitution are recorded as plural keys
 * (`key|other` plus any plural forms already known in enPlurals).
 *
 * Any parse or validation failure is logged and terminates the process with
 * exit code 1.
 *
 * @param {string} file Path of the source file to scan.
 * @returns {Set<string>} The translation keys found in the file.
 */
function getTranslationsJs(file) {
    const contents = fs.readFileSync(file, { encoding: 'utf8' });

    const trs = new Set();

    try {
        const plugins = [
            // https://babeljs.io/docs/en/babel-parser#plugins
            "classProperties",
            "objectRestSpread",
            "throwExpressions",
            "exportDefaultFrom",
            "decorators-legacy",
        ];

        if (file.endsWith(".js") || file.endsWith(".jsx")) {
            // all JS is assumed to be flow or react
            plugins.push("flow", "jsx");
        } else if (file.endsWith(".ts")) {
            // TS can't use JSX unless it's a TSX file (otherwise angle casts fail)
            plugins.push("typescript");
        } else if (file.endsWith(".tsx")) {
            // When the file is a TSX file though, enable JSX parsing
            plugins.push("typescript", "jsx");
        }

        const babelParsed = parser.parse(contents, {
            allowImportExportEverywhere: true,
            errorRecovery: true,
            sourceFilename: file,
            tokens: true,
            plugins,
        });

        traverse.default(babelParsed, {
            enter: (p) => {
                const node = p.node;
                const isTranslationCall = p.isCallExpression() &&
                    node.callee &&
                    TRANSLATIONS_FUNCS.includes(node.callee.name);
                if (!isTranslationCall) return;

                const tKey = getTKey(node.arguments[0]);

                // This happens whenever we call _t with non-literals (ie. whenever we've
                // had to use a _td to compensate) so is expected.
                if (tKey === null) return;

                // check the format string against the args
                // We only check _t: _td has no args
                if (node.callee.name === '_t') {
                    try {
                        const placeholders = getFormatStrings(tKey);
                        for (const placeholder of placeholders) {
                            if (node.arguments.length < 2) {
                                throw new Error(`Placeholder found ('${placeholder}') but no substitutions given`);
                            }
                            const value = getObjectValue(node.arguments[1], placeholder);
                            if (value === null) {
                                throw new Error(`No value found for placeholder '${placeholder}'`);
                            }
                        }

                        // Validate tag replacements
                        if (node.arguments.length > 2) {
                            const tagMap = node.arguments[2];
                            for (const prop of tagMap.properties || []) {
                                // Spread elements have no key to validate.
                                if (!prop.key) continue;
                                // Quoted keys are 'StringLiteral' nodes under @babel/parser
                                // ('Literal' only appears in ESTree-style ASTs), so accept
                                // both, exactly as getTKey does for string arguments.
                                if (prop.key.type === 'Literal' || prop.key.type === 'StringLiteral') {
                                    const tag = prop.key.value;
                                    // RegExp same as in src/languageHandler.js
                                    const regexp = new RegExp(`(<${tag}>(.*?)<\\/${tag}>|<${tag}>|<${tag}\\s*\\/>)`);
                                    if (!tKey.match(regexp)) {
                                        throw new Error(`No match for ${regexp} in ${tKey}`);
                                    }
                                }
                            }
                        }
                    } catch (e) {
                        console.log();
                        console.error(`ERROR: ${file}:${node.loc.start.line} ${tKey}`);
                        console.error(e);
                        process.exit(1);
                    }
                }

                // A `count` substitution marks the string as pluralised.
                let isPlural = false;
                if (node.arguments.length > 1 && node.arguments[1].type === 'ObjectExpression') {
                    const countVal = getObjectValue(node.arguments[1], 'count');
                    if (countVal) {
                        isPlural = true;
                    }
                }

                if (isPlural) {
                    trs.add(tKey + "|other");
                    // Keep every plural form that already exists in the input file.
                    const plurals = enPlurals[tKey];
                    if (plurals) {
                        for (const pluralType of Object.keys(plurals)) {
                            trs.add(tKey + "|" + pluralType);
                        }
                    }
                } else {
                    trs.add(tKey);
                }
            },
        });
    } catch (e) {
        console.error(e);
        process.exit(1);
    }

    return trs;
}
|
|
|
|
|
2017-10-18 20:36:07 +02:00
|
|
|
/**
 * Collects translatable strings from a non-JavaScript file (e.g. HTML) by
 * scanning its text for `_t('...')` / `_t("...")` occurrences.
 *
 * @param {string} file Path of the file to scan.
 * @returns {Set<string>} The strings found, in order of first appearance.
 */
function getTranslationsOther(file) {
    const text = fs.readFileSync(file, { encoding: 'utf8' });
    const found = new Set();

    // Taken from riot-web src/components/structures/HomePage.js
    const translationsRegex = /_t\(['"]([\s\S]*?)['"]\)/mg;

    for (
        let hit = translationsRegex.exec(text);
        hit !== null;
        hit = translationsRegex.exec(text)
    ) {
        found.add(hit[1]);
    }

    return found;
}
|
|
|
|
|
2017-10-18 15:30:55 +02:00
|
|
|
// Gather the en_EN plural strings from the input translations file.
// Every en_EN string lives in the source code except for the pluralised
// variants, so those have to be carried over from the existing file.
const inputTranslationsRaw = JSON.parse(fs.readFileSync(INPUT_TRANSLATIONS_FILE, { encoding: 'utf8' }));

// Maps a base key to an object of { pluralType: translation }.
const enPlurals = {};

for (const [rawKey, translation] of Object.entries(inputTranslationsRaw)) {
    const [baseKey, pluralType] = rawKey.split("|");
    // Keys without a "|" are not plural variants.
    if (pluralType === undefined) continue;

    const pluralForms = enPlurals[baseKey] || {};
    pluralForms[pluralType] = translation;
    enPlurals[baseKey] = pluralForms;
}
|
|
|
|
|
2017-10-17 20:19:01 +02:00
|
|
|
// Every translatable string found so far, in discovery order.
const translatables = new Set();

// Options for walk.walkSync: sort directory entries deterministically and
// harvest translatable strings from each supported file.
const walkOpts = {
    listeners: {
        names: function(root, nodeNamesArray) {
            // Sort the names case insensitively and alphabetically to
            // maintain some sense of order between the different strings.
            nodeNamesArray.sort((a, b) => {
                const lowerA = a.toLowerCase();
                const lowerB = b.toLowerCase();
                if (lowerA > lowerB) return 1;
                if (lowerA < lowerB) return -1;
                return 0;
            });
        },
        file: function(root, fileStats, next) {
            const fullPath = path.join(root, fileStats.name);

            // Keep this list in step with the extensions getTranslationsJs
            // configures the parser for (.jsx was previously never dispatched).
            const isScript = ['.js', '.jsx', '.ts', '.tsx'].some((ext) => fileStats.name.endsWith(ext));

            let trs;
            if (isScript) {
                trs = getTranslationsJs(fullPath);
            } else if (fileStats.name.endsWith('.html')) {
                trs = getTranslationsOther(fullPath);
            } else {
                // Not a file type we know how to scan.
                return;
            }

            console.log(`${fullPath} (${trs.size} strings)`);
            for (const tr of trs.values()) {
                // Convert DOS line endings to unix
                translatables.add(tr.replace(/\r\n/g, "\n"));
            }
        },
    }
};
|
|
|
|
|
|
|
|
// Walk each configured search root that exists on disk. The loop variable is
// deliberately not called `path`, so it does not shadow the `path` module.
for (const searchRoot of SEARCH_PATHS) {
    if (!fs.existsSync(searchRoot)) continue;
    walk.walkSync(searchRoot, walkOpts);
}
|
2017-10-17 20:19:01 +02:00
|
|
|
|
|
|
|
// Build the output mapping. Plain strings map to themselves; plural keys
// ("key|form") keep their existing translation if the input file has one and
// otherwise fall back to the base key.
const trObj = {};
for (const tr of translatables) {
    if (!tr.includes("|")) {
        trObj[tr] = tr;
        continue;
    }

    const existing = inputTranslationsRaw[tr];
    trObj[tr] = existing ? existing : tr.split("|")[0];
}
|
|
|
|
|
|
|
|
// Write the regenerated translations. The replacer must be a function or an
// array: a Set iterator is silently ignored by JSON.stringify, so pass the
// keys as an array to make the output follow the discovery order of the
// strings.
fs.writeFileSync(
    OUTPUT_FILE,
    JSON.stringify(trObj, Array.from(translatables), 4) + "\n"
);

console.log();
console.log(`Wrote ${translatables.size} strings to ${OUTPUT_FILE}`);
|