From 552a368482f5d1347e6f07acb621ebe59cae46f1 Mon Sep 17 00:00:00 2001 From: Charles Zhao Date: Tue, 25 Mar 2025 11:32:54 +0800 Subject: [PATCH] refactor(translate): improve prompts to better support i18n suffixes (#7167) * refactor(translate): improve prompts to better support i18n suffixes * chore: add changeset --- .changeset/hungry-terms-smash.md | 5 ++++ packages/translate/src/prompts.ts | 38 ++++++++++++++++++++++++++++--- 2 files changed, 40 insertions(+), 3 deletions(-) create mode 100644 .changeset/hungry-terms-smash.md diff --git a/.changeset/hungry-terms-smash.md b/.changeset/hungry-terms-smash.md new file mode 100644 index 000000000..4ac10487f --- /dev/null +++ b/.changeset/hungry-terms-smash.md @@ -0,0 +1,5 @@ +--- +"@logto/translate": patch +--- + +improve openai prompt to better support i18n plural form suffixes diff --git a/packages/translate/src/prompts.ts b/packages/translate/src/prompts.ts index 5b928b8aa..75fe680ae 100644 --- a/packages/translate/src/prompts.ts +++ b/packages/translate/src/prompts.ts @@ -22,9 +22,41 @@ export const getTranslationPromptMessages = ({ }: GetTranslationPromptProperties) => [ { role: 'assistant', - content: `You are a assistant translator and will receive a TypeScript object. Traverse and find object values with "${untranslatedMark}" annotation on the top, then translate these values to target locale "${targetLanguage}". Remove the "${untranslatedMark}" annotations from output. Escape the single quotes (if any) in translated results by prepending a backslash. Keep the interpolation double curly brackets and their inner values intact. Make sure there is a space between the CJK and non-CJK characters. Prefer using "你" instead of "您" in Chinese. Do not include sample code snippet below in the final output. ${conditionalString( - extraPrompt - )} + content: ` +You are a assistant translator and will receive a TypeScript object. +Traverse and find object values with "${untranslatedMark}" annotation on the top, +then translate these values to target locale "${targetLanguage}". +Remove the "${untranslatedMark}" annotations from output. +Escape the single quotes (if any) in translated results by prepending a backslash. +Keep the interpolation double curly brackets and their inner values intact. +Make sure there is a space between the CJK and non-CJK characters. +Prefer using "你" instead of "您" in Chinese. +Do not include sample code snippet below in the final output. +When translating phrases whose keys have plural suffixes, pay attention to the plural rules of the target language. +For example, the plural suffixes in English are "_one" and "_other". But other languages may have additional suffixes like "_two", "_few" and "_many". +These suffixed phrases always have a "{{count}}" variable. When translating these phrases, you need to imagine the variable is replaced with the number indicated by the suffix, and use proper plural forms in the final translation. +For example, you may meet these phrases in English: +\`\`\`ts +const password_requirement = { + length_one: 'requires a minimum of {{count}} character', + length_two: 'requires a minimum of {{count}} characters', + length_few: 'requires a minimum of {{count}} characters', + length_many: 'requires a minimum of {{count}} characters', + length_other: 'requires a minimum of {{count}} characters', +}; +\`\`\` +And the proper translation in Russian would be: +\`\`\`ts +const password_requirement = { + length_one: 'Требуется минимум {{count}} символ', + length_two: 'Требуется минимум {{count}} символа', + length_few: 'Требуется минимум {{count}} символа', + length_many: 'Требуется минимум {{count}} символов', + length_other: 'Требуется минимум {{count}} символов', +}; +\`\`\` + +${conditionalString(extraPrompt)} Take translating to zh-CN as an example, if the input is: \`\`\`ts