# Copyright (c) 2021, Frappe Technologies Pvt. Ltd. and Contributors # License: MIT. See LICENSE """ frappe.translate ~~~~~~~~~~~~~~~~ Translation tools for frappe """ import functools import io import itertools import json import operator import os import re from csv import reader from babel.messages.extract import extract_python from babel.messages.jslexer import Token, tokenize, unquote_string from pypika.terms import PseudoColumn import frappe from frappe.model.utils import InvalidIncludePath, render_include from frappe.query_builder import DocType, Field from frappe.utils import cstr, get_bench_path, is_html, strip, strip_html_tags, unique TRANSLATE_PATTERN = re.compile( r"_\(\s*" # starts with literal `_(`, ignore following whitespace/newlines # BEGIN: message search r"([\"']{,3})" # start of message string identifier - allows: ', ", """, '''; 1st capture group r"(?P((?!\1).)*)" # Keep matching until string closing identifier is met which is same as 1st capture group r"\1" # match exact string closing identifier # END: message search # BEGIN: python context search r"(\s*,\s*context\s*=\s*" # capture `context=` with ignoring whitespace r"([\"'])" # start of context string identifier; 5th capture group r"(?P((?!\5).)*)" # capture context string till closing id is found r"\5" # match context string closure r")?" # match 0 or 1 context strings # END: python context search # BEGIN: JS context search r"(\s*,\s*(.)*?\s*(,\s*" # skip message format replacements: ["format", ...] | null | [] r"([\"'])" # start of context string; 11th capture group r"(?P((?!\11).)*)" # capture context string till closing id is found r"\11" # match context string closure r")*" r")*" # match one or more context string # END: JS context search r"\s*\)" # Closing function call ignore leading whitespace/newlines ) REPORT_TRANSLATE_PATTERN = re.compile('"([^:,^"]*):') CSV_STRIP_WHITESPACE_PATTERN = re.compile(r"{\s?([0-9]+)\s?}") # Cache keys MERGED_TRANSLATION_KEY = "merged_translations" APP_TRANSLATION_KEY = "translations_from_apps" USER_TRANSLATION_KEY = "lang_user_translations" def get_language(lang_list: list = None) -> str: """Set `frappe.local.lang` from HTTP headers at beginning of request Order of priority for setting language: 1. Form Dict => _lang 2. Cookie => preferred_language (Non authorized user) 3. Request Header => Accept-Language (Non authorized user) 4. User document => language 5. System Settings => language """ is_logged_in = frappe.session.user != "Guest" # fetch language from form_dict if frappe.form_dict._lang: language = get_lang_code(frappe.form_dict._lang or get_parent_language(frappe.form_dict._lang)) if language: return language # use language set in User or System Settings if user is logged in if is_logged_in: return frappe.local.lang lang_set = set(lang_list or get_all_languages() or []) # fetch language from cookie preferred_language_cookie = get_preferred_language_cookie() if preferred_language_cookie: if preferred_language_cookie in lang_set: return preferred_language_cookie parent_language = get_parent_language(language) if parent_language in lang_set: return parent_language # fetch language from request headers accept_language = list(frappe.request.accept_languages.values()) for language in accept_language: if language in lang_set: return language parent_language = get_parent_language(language) if parent_language in lang_set: return parent_language # fallback to language set in System Settings or "en" return frappe.db.get_default("lang") or "en" @functools.lru_cache def get_parent_language(lang: str) -> str: """If the passed language is a variant, return its parent Eg: 1. zh-TW -> zh 2. sr-BA -> sr """ is_language_variant = "-" in lang if is_language_variant: return lang[: lang.index("-")] def get_user_lang(user: str = None) -> str: """Set frappe.local.lang from user preferences on session beginning or resumption""" user = user or frappe.session.user lang = frappe.cache().hget("lang", user) if not lang: # User.language => Session Defaults => frappe.local.lang => 'en' lang = ( frappe.db.get_value("User", user, "language") or frappe.db.get_default("lang") or frappe.local.lang or "en" ) frappe.cache().hset("lang", user, lang) return lang def get_lang_code(lang: str) -> str | None: return frappe.db.get_value("Language", {"name": lang}) or frappe.db.get_value( "Language", {"language_name": lang} ) def set_default_language(lang): """Set Global default language""" if frappe.db.get_default("lang") != lang: frappe.db.set_default("lang", lang) frappe.local.lang = lang def get_lang_dict(): """Returns all languages in dict format, full name is the key e.g. `{"english":"en"}`""" return dict( frappe.get_all("Language", fields=["language_name", "name"], order_by="modified", as_list=True) ) def get_dict(fortype: str, name: str | None = None) -> dict[str, str]: """Returns translation dict for a type of object. :param fortype: must be one of `doctype`, `page`, `report`, `include`, `jsfile`, `boot` :param name: name of the document for which assets are to be returned. """ fortype = fortype.lower() cache = frappe.cache() asset_key = fortype + ":" + (name or "-") translation_assets = cache.hget("translation_assets", frappe.local.lang, shared=True) or {} if asset_key not in translation_assets: messages = [] if fortype == "doctype": messages = get_messages_from_doctype(name) elif fortype == "page": messages = get_messages_from_page(name) elif fortype == "report": messages = get_messages_from_report(name) elif fortype == "include": messages = get_messages_from_include_files() elif fortype == "jsfile": messages = get_messages_from_file(name) elif fortype == "boot": apps = frappe.get_all_apps(True) for app in apps: messages.extend(get_server_messages(app)) messages += get_messages_from_navbar() messages += get_messages_from_include_files() messages += ( frappe.qb.from_("Print Format").select(PseudoColumn("'Print Format:'"), "name") ).run() messages += (frappe.qb.from_("DocType").select(PseudoColumn("'DocType:'"), "name")).run() messages += frappe.qb.from_("Role").select(PseudoColumn("'Role:'"), "name").run() messages += (frappe.qb.from_("Module Def").select(PseudoColumn("'Module:'"), "name")).run() messages += ( frappe.qb.from_("Workspace Shortcut") .where(Field("format").isnotnull()) .select(PseudoColumn("''"), "format") ).run() messages += (frappe.qb.from_("Onboarding Step").select(PseudoColumn("''"), "title")).run() messages = deduplicate_messages(messages) message_dict = make_dict_from_messages(messages, load_user_translation=False) message_dict.update(get_dict_from_hooks(fortype, name)) # remove untranslated message_dict = {k: v for k, v in message_dict.items() if k != v} translation_assets[asset_key] = message_dict cache.hset("translation_assets", frappe.local.lang, translation_assets, shared=True) translation_map: dict = translation_assets[asset_key] translation_map.update(get_user_translations(frappe.local.lang)) return translation_map def get_messages_for_boot(): """Return all message translations that are required on boot.""" messages = get_all_translations(frappe.local.lang) messages.update(get_dict_from_hooks("boot", None)) return messages def get_dict_from_hooks(fortype, name): translated_dict = {} hooks = frappe.get_hooks("get_translated_dict") for (hook_fortype, fortype_name) in hooks: if hook_fortype == fortype and fortype_name == name: for method in hooks[(hook_fortype, fortype_name)]: translated_dict.update(frappe.get_attr(method)()) return translated_dict def make_dict_from_messages(messages, full_dict=None, load_user_translation=True): """Returns translated messages as a dict in Language specified in `frappe.local.lang` :param messages: List of untranslated messages """ out = {} if full_dict is None: if load_user_translation: full_dict = get_all_translations(frappe.local.lang) else: full_dict = get_translations_from_apps(frappe.local.lang) for m in messages: if m[1] in full_dict: out[m[1]] = full_dict[m[1]] # check if msg with context as key exist eg. msg:context if len(m) > 2 and m[2]: key = m[1] + ":" + m[2] if full_dict.get(key): out[key] = full_dict[key] return out def get_lang_js(fortype: str, name: str) -> str: """Returns code snippet to be appended at the end of a JS script. :param fortype: Type of object, e.g. `DocType` :param name: Document name """ return f"\n\n$.extend(frappe._messages, {json.dumps(get_dict(fortype, name))})" def get_all_translations(lang: str) -> dict[str, str]: """Load and return the entire translations dictionary for a language from apps + user translations. :param lang: Language Code, e.g. `hi` """ if not lang: return {} def _merge_translations(): all_translations = get_translations_from_apps(lang).copy() try: # get user specific translation data user_translations = get_user_translations(lang) all_translations.update(user_translations) except Exception: pass return all_translations try: return frappe.cache().hget(MERGED_TRANSLATION_KEY, lang, generator=_merge_translations) except Exception: # People mistakenly call translation function on global variables # where locals are not initalized, translations dont make much sense there return {} def get_translations_from_apps(lang, apps=None): """Combine all translations from `.csv` files in all `apps`. For derivative languages (es-GT), take translations from the base language (es) and then update translations from the child (es-GT)""" if lang == "en": return {} def _get_from_disk(): translations = {} for app in apps or frappe.get_all_apps(True): path = os.path.join(frappe.get_pymodule_path(app), "translations", lang + ".csv") translations.update(get_translation_dict_from_file(path, lang, app) or {}) if "-" in lang: parent = lang.split("-")[0] parent_translations = get_translations_from_apps(parent) parent_translations.update(translations) return parent_translations return translations return frappe.cache().hget(APP_TRANSLATION_KEY, lang, shared=True, generator=_get_from_disk) def get_translation_dict_from_file(path, lang, app, throw=False) -> dict[str, str]: """load translation dict from given path""" translation_map = {} if os.path.exists(path): csv_content = read_csv_file(path) for item in csv_content: if len(item) == 3 and item[2]: key = item[0] + ":" + item[2] translation_map[key] = strip(item[1]) elif len(item) in [2, 3]: translation_map[item[0]] = strip(item[1]) elif item: msg = "Bad translation in '{app}' for language '{lang}': {values}".format( app=app, lang=lang, values=cstr(item) ) frappe.log_error(message=msg, title="Error in translation file") if throw: frappe.throw(msg, title="Error in translation file") return translation_map def get_user_translations(lang): if not frappe.db: frappe.connect() def _read_from_db(): user_translations = {} translations = frappe.get_all( "Translation", fields=["source_text", "translated_text", "context"], filters={"language": lang} ) for t in translations: key = t.source_text value = t.translated_text if t.context: key += ":" + t.context user_translations[key] = value return user_translations return frappe.cache().hget(USER_TRANSLATION_KEY, lang, generator=_read_from_db) def clear_cache(): """Clear all translation assets from :meth:`frappe.cache`""" cache = frappe.cache() cache.delete_key("langinfo") # clear translations saved in boot cache cache.delete_key("bootinfo") cache.delete_key("translation_assets", shared=True) cache.delete_key(APP_TRANSLATION_KEY, shared=True) cache.delete_key(USER_TRANSLATION_KEY) cache.delete_key(MERGED_TRANSLATION_KEY) def get_messages_for_app(app, deduplicate=True): """Returns all messages (list) for a specified `app`""" messages = [] modules = [frappe.unscrub(m) for m in frappe.local.app_modules[app]] # doctypes if modules: if isinstance(modules, str): modules = [modules] filtered_doctypes = ( frappe.qb.from_("DocType").where(Field("module").isin(modules)).select("name").run(pluck=True) ) for name in filtered_doctypes: messages.extend(get_messages_from_doctype(name)) # pages filtered_pages = ( frappe.qb.from_("Page").where(Field("module").isin(modules)).select("name", "title").run() ) for name, title in filtered_pages: messages.append((None, title or name)) messages.extend(get_messages_from_page(name)) # reports report = DocType("Report") doctype = DocType("DocType") names = ( frappe.qb.from_(doctype) .from_(report) .where((report.ref_doctype == doctype.name) & doctype.module.isin(modules)) .select(report.name) .run(pluck=True) ) for name in names: messages.append((None, name)) messages.extend(get_messages_from_report(name)) for i in messages: if not isinstance(i, tuple): raise Exception # workflow based on app.hooks.fixtures messages.extend(get_messages_from_workflow(app_name=app)) # custom fields based on app.hooks.fixtures messages.extend(get_messages_from_custom_fields(app_name=app)) # app_include_files messages.extend(get_all_messages_from_js_files(app)) # server_messages messages.extend(get_server_messages(app)) # messages from navbar settings messages.extend(get_messages_from_navbar()) if deduplicate: messages = deduplicate_messages(messages) return messages def get_messages_from_navbar(): """Return all labels from Navbar Items, as specified in Navbar Settings.""" labels = frappe.get_all("Navbar Item", filters={"item_label": ("is", "set")}, pluck="item_label") return [("Navbar:", label, "Label of a Navbar Item") for label in labels] def get_messages_from_doctype(name): """Extract all translatable messages for a doctype. Includes labels, Python code, Javascript code, html templates""" messages = [] meta = frappe.get_meta(name) messages = [meta.name, meta.module] if meta.description: messages.append(meta.description) # translations of field labels, description and options for d in meta.get("fields"): messages.extend([d.label, d.description]) if d.fieldtype == "Select" and d.options: options = d.options.split("\n") if not "icon" in options[0]: messages.extend(options) if d.fieldtype == "HTML" and d.options: messages.append(d.options) # translations of roles for d in meta.get("permissions"): if d.role: messages.append(d.role) messages = [message for message in messages if message] messages = [("DocType: " + name, message) for message in messages if is_translatable(message)] # extract from js, py files if not meta.custom: doctype_file_path = frappe.get_module_path(meta.module, "doctype", meta.name, meta.name) messages.extend(get_messages_from_file(doctype_file_path + ".js")) messages.extend(get_messages_from_file(doctype_file_path + "_list.js")) messages.extend(get_messages_from_file(doctype_file_path + "_list.html")) messages.extend(get_messages_from_file(doctype_file_path + "_calendar.js")) messages.extend(get_messages_from_file(doctype_file_path + "_dashboard.html")) # workflow based on doctype messages.extend(get_messages_from_workflow(doctype=name)) return messages def get_messages_from_workflow(doctype=None, app_name=None): assert doctype or app_name, "doctype or app_name should be provided" # translations for Workflows workflows = [] if doctype: workflows = frappe.get_all("Workflow", filters={"document_type": doctype}) else: fixtures = frappe.get_hooks("fixtures", app_name=app_name) or [] for fixture in fixtures: if isinstance(fixture, str) and fixture == "Worflow": workflows = frappe.get_all("Workflow") break elif isinstance(fixture, dict) and fixture.get("dt", fixture.get("doctype")) == "Workflow": workflows.extend(frappe.get_all("Workflow", filters=fixture.get("filters"))) messages = [] document_state = DocType("Workflow Document State") for w in workflows: states = frappe.db.get_values( document_state, filters=document_state.parent == w["name"], fieldname="state", distinct=True, as_dict=True, order_by=None, ) messages.extend( [ ("Workflow: " + w["name"], state["state"]) for state in states if is_translatable(state["state"]) ] ) states = frappe.db.get_values( document_state, filters=(document_state.parent == w["name"]) & (document_state.message.isnotnull()), fieldname="message", distinct=True, order_by=None, as_dict=True, ) messages.extend( [ ("Workflow: " + w["name"], state["message"]) for state in states if is_translatable(state["message"]) ] ) actions = frappe.db.get_values( "Workflow Transition", filters={"parent": w["name"]}, fieldname="action", as_dict=True, distinct=True, order_by=None, ) messages.extend( [ ("Workflow: " + w["name"], action["action"]) for action in actions if is_translatable(action["action"]) ] ) return messages def get_messages_from_custom_fields(app_name): fixtures = frappe.get_hooks("fixtures", app_name=app_name) or [] custom_fields = [] for fixture in fixtures: if isinstance(fixture, str) and fixture == "Custom Field": custom_fields = frappe.get_all( "Custom Field", fields=["name", "label", "description", "fieldtype", "options"] ) break elif isinstance(fixture, dict) and fixture.get("dt", fixture.get("doctype")) == "Custom Field": custom_fields.extend( frappe.get_all( "Custom Field", filters=fixture.get("filters"), fields=["name", "label", "description", "fieldtype", "options"], ) ) messages = [] for cf in custom_fields: for prop in ("label", "description"): if not cf.get(prop) or not is_translatable(cf[prop]): continue messages.append(("Custom Field - {}: {}".format(prop, cf["name"]), cf[prop])) if cf["fieldtype"] == "Selection" and cf.get("options"): for option in cf["options"].split("\n"): if option and "icon" not in option and is_translatable(option): messages.append(("Custom Field - Description: " + cf["name"], option)) return messages def get_messages_from_page(name): """Returns all translatable strings from a :class:`frappe.core.doctype.Page`""" return _get_messages_from_page_or_report("Page", name) def get_messages_from_report(name): """Returns all translatable strings from a :class:`frappe.core.doctype.Report`""" report = frappe.get_doc("Report", name) messages = _get_messages_from_page_or_report( "Report", name, frappe.db.get_value("DocType", report.ref_doctype, "module") ) if report.columns: context = ( "Column of report '%s'" % report.name ) # context has to match context in `prepare_columns` in query_report.js messages.extend([(None, report_column.label, context) for report_column in report.columns]) if report.filters: messages.extend([(None, report_filter.label) for report_filter in report.filters]) if report.query: messages.extend( [ (None, message) for message in REPORT_TRANSLATE_PATTERN.findall(report.query) if is_translatable(message) ] ) messages.append((None, report.report_name)) return messages def _get_messages_from_page_or_report(doctype, name, module=None): if not module: module = frappe.db.get_value(doctype, name, "module") doc_path = frappe.get_module_path(module, doctype, name) messages = get_messages_from_file(os.path.join(doc_path, frappe.scrub(name) + ".py")) if os.path.exists(doc_path): for filename in os.listdir(doc_path): if filename.endswith(".js") or filename.endswith(".html"): messages += get_messages_from_file(os.path.join(doc_path, filename)) return messages def get_server_messages(app): """Extracts all translatable strings (tagged with :func:`frappe._`) from Python modules inside an app""" messages = [] file_extensions = (".py", ".html", ".js", ".vue") app_walk = os.walk(frappe.get_pymodule_path(app)) for basepath, folders, files in app_walk: folders[:] = [folder for folder in folders if folder not in {".git", "__pycache__"}] if "public/dist" in basepath: continue for f in files: f = frappe.as_unicode(f) if f.endswith(file_extensions): messages.extend(get_messages_from_file(os.path.join(basepath, f))) return messages def get_messages_from_include_files(app_name=None): """Returns messages from js files included at time of boot like desk.min.js for desk and web""" from frappe.utils.jinja_globals import bundled_asset messages = [] app_include_js = frappe.get_hooks("app_include_js", app_name=app_name) or [] web_include_js = frappe.get_hooks("web_include_js", app_name=app_name) or [] include_js = app_include_js + web_include_js for js_path in include_js: file_path = bundled_asset(js_path) relative_path = os.path.join(frappe.local.sites_path, file_path.lstrip("/")) messages_from_file = get_messages_from_file(relative_path) messages.extend(messages_from_file) return messages def get_all_messages_from_js_files(app_name=None): """Extracts all translatable strings from app `.js` files""" messages = [] for app in [app_name] if app_name else frappe.get_installed_apps(): if os.path.exists(frappe.get_app_path(app, "public")): for basepath, folders, files in os.walk(frappe.get_app_path(app, "public")): if "frappe/public/js/lib" in basepath: continue for fname in files: if fname.endswith(".js") or fname.endswith(".html") or fname.endswith(".vue"): messages.extend(get_messages_from_file(os.path.join(basepath, fname))) return messages def get_messages_from_file(path: str) -> list[tuple[str, str, str | None, int]]: """Returns a list of transatable strings from a code file :param path: path of the code file """ frappe.flags.setdefault("scanned_files", set()) # TODO: Find better alternative # To avoid duplicate scan if path in frappe.flags.scanned_files: return [] frappe.flags.scanned_files.add(path) bench_path = get_bench_path() if not os.path.exists(path): return [] with open(path) as sourcefile: try: file_contents = sourcefile.read() except Exception: print(f"Could not scan file for translation: {path}") return [] messages = [] if path.lower().endswith(".py"): messages += extract_messages_from_python_code(file_contents) else: messages += extract_messages_from_code(file_contents) if path.lower().endswith(".js"): # For JS also use JS parser to extract strings possibly missed out # by regex based extractor. messages += extract_messages_from_javascript_code(file_contents) return [ (os.path.relpath(path, bench_path), message, context, line) for (line, message, context) in messages ] def extract_messages_from_python_code(code: str) -> list[tuple[int, str, str | None]]: """Extracts translatable strings from Python code using babel.""" messages = [] for message in extract_python( io.BytesIO(code.encode()), keywords=["_"], comment_tags=(), options={}, ): lineno, _func, args, _comments = message if not args or not args[0]: continue source_text = args[0] if isinstance(args, tuple) else args context = args[1] if len(args) == 2 else None messages.append((lineno, source_text, context)) return messages def extract_messages_from_javascript_code(code: str) -> list[tuple[int, str, str | None]]: """Extracts translatable strings from JavaScript code using babel.""" messages = [] for message in extract_javascript( code, keywords=["__"], options={}, ): lineno, _func, args = message if not args or not args[0]: continue source_text = args[0] if isinstance(args, tuple) else args context = None if isinstance(args, tuple) and len(args) == 3 and isinstance(args[2], str): context = args[2] messages.append((lineno, source_text, context)) return messages def extract_javascript(code, keywords=("__",), options=None): """Extract messages from JavaScript source code. This is a modified version of babel's JS parser. Reused under BSD license. License: https://github.com/python-babel/babel/blob/master/LICENSE Changes from upstream: - Preserve arguments, babel's parser flattened all values in args, we need order because we use different syntax for translation which can contain 2nd arg which is array of many values. If argument is non-primitive type then value is NOT returned in args. E.g. __("0", ["1", "2"], "3") -> ("0", None, "3") - remove comments support - changed signature to accept string directly. :param code: code as string :param keywords: a list of keywords (i.e. function names) that should be recognized as translation functions :param options: a dictionary of additional options (optional) Supported options are: * `template_string` -- set to false to disable ES6 template string support. """ if options is None: options = {} funcname = message_lineno = None messages = [] last_argument = None concatenate_next = False last_token = None call_stack = -1 # Tree level = depth inside function call tree # Example: __("0", ["1", "2"], "3") # Depth __() # / | \ # 0 "0" [...] "3" <- only 0th level strings matter # / \ # 1 "1" "2" tree_level = 0 opening_operators = {"[", "{"} closing_operators = {"]", "}"} all_container_operators = opening_operators.union(closing_operators) dotted = any("." in kw for kw in keywords) for token in tokenize( code, jsx=True, template_string=options.get("template_string", True), dotted=dotted, ): if ( # Turn keyword`foo` expressions into keyword("foo") calls: funcname and (last_token and last_token.type == "name") # have a keyword... and token.type # we've seen nothing after the keyword... == "template_string" # this is a template string ): message_lineno = token.lineno messages = [unquote_string(token.value)] call_stack = 0 tree_level = 0 token = Token("operator", ")", token.lineno) if token.type == "operator" and token.value == "(": if funcname: message_lineno = token.lineno call_stack += 1 elif call_stack >= 0 and token.type == "operator" and token.value in all_container_operators: if token.value in opening_operators: tree_level += 1 if token.value in closing_operators: tree_level -= 1 elif call_stack == -1 and token.type == "linecomment" or token.type == "multilinecomment": pass # ignore comments elif funcname and call_stack == 0: if token.type == "operator" and token.value == ")": if last_argument is not None: messages.append(last_argument) if len(messages) > 1: messages = tuple(messages) elif messages: messages = messages[0] else: messages = None if messages is not None: yield (message_lineno, funcname, messages) funcname = message_lineno = last_argument = None concatenate_next = False messages = [] call_stack = -1 tree_level = 0 elif token.type in ("string", "template_string"): new_value = unquote_string(token.value) if tree_level > 0: pass elif concatenate_next: last_argument = (last_argument or "") + new_value concatenate_next = False else: last_argument = new_value elif token.type == "operator": if token.value == ",": if last_argument is not None: messages.append(last_argument) last_argument = None else: if tree_level == 0: messages.append(None) concatenate_next = False elif token.value == "+": concatenate_next = True elif call_stack > 0 and token.type == "operator" and token.value == ")": call_stack -= 1 tree_level = 0 elif funcname and call_stack == -1: funcname = None elif ( call_stack == -1 and token.type == "name" and token.value in keywords and (last_token is None or last_token.type != "name" or last_token.value != "function") ): funcname = token.value last_token = token def extract_messages_from_code(code): """ Extracts translatable strings from a code file :param code: code from which translatable files are to be extracted """ from jinja2 import TemplateError try: code = frappe.as_unicode(render_include(code)) # Exception will occur when it encounters John Resig's microtemplating code except (TemplateError, ImportError, InvalidIncludePath, OSError) as e: if isinstance(e, InvalidIncludePath): frappe.clear_last_message() messages = [] for m in TRANSLATE_PATTERN.finditer(code): message = m.group("message") context = m.group("py_context") or m.group("js_context") pos = m.start() if is_translatable(message): messages.append([pos, message, context]) return add_line_number(messages, code) def is_translatable(m): if ( re.search("[a-zA-Z]", m) and not m.startswith("fa fa-") and not m.endswith("px") and not m.startswith("eval:") ): return True return False def add_line_number(messages, code): ret = [] messages = sorted(messages, key=lambda x: x[0]) newlines = [m.start() for m in re.compile(r"\n").finditer(code)] line = 1 newline_i = 0 for pos, message, context in messages: while newline_i < len(newlines) and pos > newlines[newline_i]: line += 1 newline_i += 1 ret.append([line, message, context]) return ret def read_csv_file(path): """Read CSV file and return as list of list :param path: File path""" with open(path, encoding="utf-8", newline="") as msgfile: data = reader(msgfile) newdata = [[val for val in row] for row in data] return newdata def write_csv_file(path, app_messages, lang_dict): """Write translation CSV file. :param path: File path, usually `[app]/translations`. :param app_messages: Translatable strings for this app. :param lang_dict: Full translated dict. """ app_messages.sort(key=lambda x: x[1]) from csv import writer with open(path, "w", newline="") as msgfile: w = writer(msgfile, lineterminator="\n") for app_message in app_messages: context = None if len(app_message) == 2: path, message = app_message elif len(app_message) == 3: path, message, lineno = app_message elif len(app_message) == 4: path, message, context, lineno = app_message else: continue t = lang_dict.get(message, "") # strip whitespaces translated_string = CSV_STRIP_WHITESPACE_PATTERN.sub(r"{\g<1>}", t) if translated_string: w.writerow([message, translated_string, context]) def get_untranslated(lang, untranslated_file, get_all=False, app="_ALL_APPS"): """Returns all untranslated strings for a language and writes in a file :param lang: Language code. :param untranslated_file: Output file path. :param get_all: Return all strings, translated or not.""" clear_cache() apps = frappe.get_all_apps(True) if app != "_ALL_APPS": if app not in apps: print(f"Application {app} not found!") return apps = [app] messages = [] untranslated = [] for app_name in apps: messages.extend(get_messages_for_app(app_name)) messages = deduplicate_messages(messages) def escape_newlines(s): return s.replace("\\\n", "|||||").replace("\\n", "||||").replace("\n", "|||") if get_all: print(str(len(messages)) + " messages") with open(untranslated_file, "wb") as f: for m in messages: # replace \n with ||| so that internal linebreaks don't get split f.write((escape_newlines(m[1]) + os.linesep).encode("utf-8")) else: full_dict = get_all_translations(lang) for m in messages: if not full_dict.get(m[1]): untranslated.append(m[1]) if untranslated: print(str(len(untranslated)) + " missing translations of " + str(len(messages))) with open(untranslated_file, "wb") as f: for m in untranslated: # replace \n with ||| so that internal linebreaks don't get split f.write((escape_newlines(m) + os.linesep).encode("utf-8")) else: print("all translated!") def update_translations(lang, untranslated_file, translated_file, app="_ALL_APPS"): """Update translations from a source and target file for a given language. :param lang: Language code (e.g. `en`). :param untranslated_file: File path with the messages in English. :param translated_file: File path with messages in language to be updated.""" clear_cache() full_dict = get_all_translations(lang) def restore_newlines(s): return ( s.replace("|||||", "\\\n") .replace("| | | | |", "\\\n") .replace("||||", "\\n") .replace("| | | |", "\\n") .replace("|||", "\n") .replace("| | |", "\n") ) translation_dict = {} for key, value in zip( frappe.get_file_items(untranslated_file, ignore_empty_lines=False), frappe.get_file_items(translated_file, ignore_empty_lines=False), ): # undo hack in get_untranslated translation_dict[restore_newlines(key)] = restore_newlines(value) full_dict.update(translation_dict) apps = frappe.get_all_apps(True) if app != "_ALL_APPS": if app not in apps: print(f"Application {app} not found!") return apps = [app] for app_name in apps: write_translations_file(app_name, lang, full_dict) def import_translations(lang, path): """Import translations from file in standard format""" clear_cache() full_dict = get_all_translations(lang) full_dict.update(get_translation_dict_from_file(path, lang, "import")) for app in frappe.get_all_apps(True): write_translations_file(app, lang, full_dict) def rebuild_all_translation_files(): """Rebuild all translation files: `[app]/translations/[lang].csv`.""" for lang in get_all_languages(): for app in frappe.get_all_apps(): write_translations_file(app, lang) def write_translations_file(app, lang, full_dict=None, app_messages=None): """Write a translation file for a given language. :param app: `app` for which translations are to be written. :param lang: Language code. :param full_dict: Full translated language dict (optional). :param app_messages: Source strings (optional). """ if not app_messages: app_messages = get_messages_for_app(app) if not app_messages: return tpath = frappe.get_pymodule_path(app, "translations") frappe.create_folder(tpath) write_csv_file( os.path.join(tpath, lang + ".csv"), app_messages, full_dict or get_all_translations(lang) ) def send_translations(translation_dict): """Append translated dict in `frappe.local.response`""" if "__messages" not in frappe.local.response: frappe.local.response["__messages"] = {} frappe.local.response["__messages"].update(translation_dict) def deduplicate_messages(messages): ret = [] op = operator.itemgetter(1) messages = sorted(messages, key=op) for k, g in itertools.groupby(messages, op): ret.append(next(g)) return ret def rename_language(old_name, new_name): if not frappe.db.exists("Language", new_name): return language_in_system_settings = frappe.db.get_single_value("System Settings", "language") if language_in_system_settings == old_name: frappe.db.set_value("System Settings", "System Settings", "language", new_name) frappe.db.sql( """update `tabUser` set language=%(new_name)s where language=%(old_name)s""", {"old_name": old_name, "new_name": new_name}, ) @frappe.whitelist() def update_translations_for_source(source=None, translation_dict=None): if not (source and translation_dict): return translation_dict = json.loads(translation_dict) if is_html(source): source = strip_html_tags(source) # for existing records translation_records = frappe.db.get_values( "Translation", {"source_text": source}, ["name", "language"], as_dict=1 ) for d in translation_records: if translation_dict.get(d.language, None): doc = frappe.get_doc("Translation", d.name) doc.translated_text = translation_dict.get(d.language) doc.save() # done with this lang value translation_dict.pop(d.language) else: frappe.delete_doc("Translation", d.name) # remaining values are to be inserted for lang, translated_text in translation_dict.items(): doc = frappe.new_doc("Translation") doc.language = lang doc.source_text = source doc.translated_text = translated_text doc.save() return translation_records @frappe.whitelist() def get_translations(source_text): if is_html(source_text): source_text = strip_html_tags(source_text) return frappe.db.get_list( "Translation", fields=["name", "language", "translated_text as translation"], filters={"source_text": source_text}, ) @frappe.whitelist() def get_messages(language, start=0, page_length=100, search_text=""): from frappe.frappeclient import FrappeClient translator = FrappeClient(get_translator_url()) translated_dict = translator.post_api( "translator.api.get_strings_for_translation", params=locals() ) return translated_dict @frappe.whitelist() def get_source_additional_info(source, language=""): from frappe.frappeclient import FrappeClient translator = FrappeClient(get_translator_url()) return translator.post_api("translator.api.get_source_additional_info", params=locals()) @frappe.whitelist() def get_contributions(language): return frappe.get_all( "Translation", fields=["*"], filters={ "contributed": 1, }, ) @frappe.whitelist() def get_contribution_status(message_id): from frappe.frappeclient import FrappeClient doc = frappe.get_doc("Translation", message_id) translator = FrappeClient(get_translator_url()) contributed_translation = translator.get_api( "translator.api.get_contribution_status", params={"translation_id": doc.contribution_docname} ) return contributed_translation def get_translator_url(): return frappe.get_hooks()["translator_url"][0] @frappe.whitelist(allow_guest=True) def get_all_languages(with_language_name=False): """Returns all enabled language codes ar, ch etc""" def get_language_codes(): return frappe.get_all("Language", filters={"enabled": 1}, pluck="name") def get_all_language_with_name(): return frappe.get_all("Language", ["language_code", "language_name"], {"enabled": 1}) if not frappe.db: frappe.connect() if with_language_name: return frappe.cache().get_value("languages_with_name", get_all_language_with_name) else: return frappe.cache().get_value("languages", get_language_codes) @frappe.whitelist(allow_guest=True) def set_preferred_language_cookie(preferred_language): frappe.local.cookie_manager.set_cookie("preferred_language", preferred_language) def get_preferred_language_cookie(): return frappe.request.cookies.get("preferred_language") def get_translated_doctypes(): dts = frappe.get_all("DocType", {"translated_doctype": 1}, pluck="name") custom_dts = frappe.get_all( "Property Setter", {"property": "translated_doctype", "value": "1"}, pluck="doc_type" ) return unique(dts + custom_dts) # Backward compatibility get_full_dict = get_all_translations load_lang = get_translations_from_apps