dify/web/i18n-config/auto-gen-i18n.js

337 lines
10 KiB
JavaScript
Raw Permalink Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

import fs from 'node:fs'
import path from 'node:path'
import { fileURLToPath } from 'node:url'
import { translate } from 'bing-translate-api'
import data from './languages'
const __filename = fileURLToPath(import.meta.url)
const __dirname = path.dirname(__filename)
const targetLanguage = 'en-US'
const i18nFolder = '../i18n' // Path to i18n folder relative to this script
// https://github.com/plainheart/bing-translate-api/blob/master/src/met/lang.json
const languageKeyMap = data.languages.reduce((map, language) => {
if (language.supported) {
if (language.value === 'zh-Hans' || language.value === 'zh-Hant')
map[language.value] = language.value
else
map[language.value] = language.value.split('-')[0]
}
return map
}, {})
const supportedLanguages = Object.keys(languageKeyMap)
function parseArgs(argv) {
const args = {
files: [],
languages: [],
isDryRun: false,
help: false,
errors: [],
}
const collectValues = (startIndex) => {
const values = []
let cursor = startIndex + 1
while (cursor < argv.length && !argv[cursor].startsWith('--')) {
const value = argv[cursor].trim()
if (value)
values.push(value)
cursor++
}
return { values, nextIndex: cursor - 1 }
}
const validateList = (values, flag) => {
if (!values.length) {
args.errors.push(`${flag} requires at least one value. Example: ${flag} app billing`)
return false
}
const invalid = values.find(value => value.includes(','))
if (invalid) {
args.errors.push(`${flag} expects space-separated values. Example: ${flag} app billing`)
return false
}
return true
}
for (let index = 2; index < argv.length; index++) {
const arg = argv[index]
if (arg === '--dry-run') {
args.isDryRun = true
continue
}
if (arg === '--help' || arg === '-h') {
args.help = true
break
}
if (arg.startsWith('--file=')) {
args.errors.push('--file expects space-separated values. Example: --file app billing')
continue
}
if (arg === '--file') {
const { values, nextIndex } = collectValues(index)
if (validateList(values, '--file'))
args.files.push(...values)
index = nextIndex
continue
}
if (arg.startsWith('--lang=')) {
args.errors.push('--lang expects space-separated values. Example: --lang zh-Hans ja-JP')
continue
}
if (arg === '--lang') {
const { values, nextIndex } = collectValues(index)
if (validateList(values, '--lang'))
args.languages.push(...values)
index = nextIndex
continue
}
}
return args
}
function printHelp() {
console.log(`Usage: pnpm run auto-gen-i18n [options]
Options:
--file <name...> Process only specific files; provide space-separated names and repeat --file if needed
--lang <locale> Process only specific locales; provide space-separated locales and repeat --lang if needed (default: all supported except en-US)
--dry-run Preview changes without writing files
-h, --help Show help
Examples:
pnpm run auto-gen-i18n --file app common --lang zh-Hans ja-JP
pnpm run auto-gen-i18n --dry-run
`)
}
function protectPlaceholders(text) {
const placeholders = []
let safeText = text
const patterns = [
/\{\{[^{}]+\}\}/g, // mustache
/\$\{[^{}]+\}/g, // template expressions
/<[^>]+>/g, // html-like tags
]
patterns.forEach((pattern) => {
safeText = safeText.replace(pattern, (match) => {
const token = `__PH_${placeholders.length}__`
placeholders.push({ token, value: match })
return token
})
})
return {
safeText,
restore(translated) {
return placeholders.reduce((result, { token, value }) => result.replace(new RegExp(token, 'g'), value), translated)
},
}
}
async function translateText(source, toLanguage) {
if (typeof source !== 'string')
return { value: source, skipped: false }
const trimmed = source.trim()
if (!trimmed)
return { value: source, skipped: false }
const { safeText, restore } = protectPlaceholders(source)
try {
const { translation } = await translate(safeText, null, languageKeyMap[toLanguage])
return { value: restore(translation), skipped: false }
}
catch (error) {
console.error(`❌ Error translating to ${toLanguage}:`, error.message)
return { value: source, skipped: true, error: error.message }
}
}
async function translateMissingKeys(sourceObj, targetObject, toLanguage) {
const skippedKeys = []
const translatedKeys = []
for (const key of Object.keys(sourceObj)) {
const sourceValue = sourceObj[key]
const targetValue = targetObject[key]
// Skip if target already has this key
if (targetValue !== undefined)
continue
const translationResult = await translateText(sourceValue, toLanguage)
targetObject[key] = translationResult.value ?? ''
if (translationResult.skipped)
skippedKeys.push(`${key}: ${sourceValue}`)
else
translatedKeys.push(key)
}
return { skipped: skippedKeys, translated: translatedKeys }
}
async function autoGenTrans(fileName, toGenLanguage, isDryRun = false) {
const fullKeyFilePath = path.resolve(__dirname, i18nFolder, targetLanguage, `${fileName}.json`)
const toGenLanguageFilePath = path.resolve(__dirname, i18nFolder, toGenLanguage, `${fileName}.json`)
try {
const content = fs.readFileSync(fullKeyFilePath, 'utf8')
const fullKeyContent = JSON.parse(content)
if (!fullKeyContent || typeof fullKeyContent !== 'object')
throw new Error(`Failed to extract translation object from ${fullKeyFilePath}`)
// if toGenLanguageFilePath does not exist, create it with empty object
let toGenOutPut = {}
if (fs.existsSync(toGenLanguageFilePath)) {
const existingContent = fs.readFileSync(toGenLanguageFilePath, 'utf8')
toGenOutPut = JSON.parse(existingContent)
}
console.log(`\n🌍 Processing ${fileName} for ${toGenLanguage}...`)
const result = await translateMissingKeys(fullKeyContent, toGenOutPut, toGenLanguage)
// Generate summary report
console.log(`\n📊 Translation Summary for ${fileName} -> ${toGenLanguage}:`)
console.log(` ✅ Translated: ${result.translated.length} keys`)
console.log(` ⏭️ Skipped: ${result.skipped.length} keys`)
if (result.skipped.length > 0) {
console.log(`\n⚠️ Skipped keys in ${fileName} (${toGenLanguage}):`)
result.skipped.slice(0, 5).forEach(item => console.log(` - ${item}`))
if (result.skipped.length > 5)
console.log(` ... and ${result.skipped.length - 5} more`)
}
const res = `${JSON.stringify(toGenOutPut, null, 2)}\n`
if (!isDryRun) {
fs.writeFileSync(toGenLanguageFilePath, res)
console.log(`💾 Saved translations to ${toGenLanguageFilePath}`)
}
else {
console.log(`🔍 [DRY RUN] Would save translations to ${toGenLanguageFilePath}`)
}
return result
}
catch (error) {
console.error(`Error processing file ${fullKeyFilePath}:`, error.message)
throw error
}
}
// Add command line argument support
const args = parseArgs(process.argv)
const isDryRun = args.isDryRun
const targetFiles = args.files
const targetLangs = args.languages
// Rate limiting helper
function delay(ms) {
return new Promise(resolve => setTimeout(resolve, ms))
}
async function main() {
if (args.help) {
printHelp()
return
}
if (args.errors.length) {
args.errors.forEach(message => console.error(`${message}`))
printHelp()
process.exit(1)
return
}
console.log('🚀 Starting auto-gen-i18n script...')
console.log(`📋 Mode: ${isDryRun ? 'DRY RUN (no files will be modified)' : 'LIVE MODE'}`)
const filesInEn = fs
.readdirSync(path.resolve(__dirname, i18nFolder, targetLanguage))
.filter(file => /\.json$/.test(file)) // Only process .json files
.map(file => file.replace(/\.json$/, ''))
// Filter by target files if specified
const filesToProcess = targetFiles.length > 0 ? filesInEn.filter(f => targetFiles.includes(f)) : filesInEn
const languagesToProcess = Array.from(new Set((targetLangs.length > 0 ? targetLangs : supportedLanguages)
.filter(lang => lang !== targetLanguage)))
const unknownLangs = languagesToProcess.filter(lang => !languageKeyMap[lang])
if (unknownLangs.length) {
console.error(`❌ Unsupported languages: ${unknownLangs.join(', ')}`)
process.exit(1)
}
if (!filesToProcess.length) {
console.log(' No files to process based on provided arguments')
return
}
if (!languagesToProcess.length) {
console.log(' No languages to process (did you only specify en-US?)')
return
}
console.log(`📁 Files to process: ${filesToProcess.join(', ')}`)
console.log(`🌍 Languages to process: ${languagesToProcess.join(', ')}`)
let totalTranslated = 0
let totalSkipped = 0
let totalErrors = 0
// Process files sequentially to avoid API rate limits
for (const file of filesToProcess) {
console.log(`\n📄 Processing file: ${file}`)
// Process languages with rate limiting
for (const language of languagesToProcess) {
try {
const result = await autoGenTrans(file, language, isDryRun)
totalTranslated += result.translated.length
totalSkipped += result.skipped.length
// Rate limiting: wait 500ms between language processing
await delay(500)
}
catch (e) {
console.error(`❌ Error translating ${file} to ${language}:`, e.message)
totalErrors++
}
}
}
// Final summary
console.log('\n🎉 Auto-translation completed!')
console.log('📊 Final Summary:')
console.log(` ✅ Total keys translated: ${totalTranslated}`)
console.log(` ⏭️ Total keys skipped: ${totalSkipped}`)
console.log(` ❌ Total errors: ${totalErrors}`)
if (isDryRun)
console.log('\n💡 This was a dry run. To actually translate, run without --dry-run flag.')
if (totalErrors > 0)
process.exitCode = 1
}
main().catch((error) => {
console.error('❌ Unexpected error:', error.message)
process.exit(1)
})