Allow different quotes in f-string translations

janezd · Dec 28, 2024 · 1982a71 · 1982a71
1 parent ad3f04d
commit 1982a71
Show file tree

Hide file tree

Showing 2 changed files with 100 additions and 104 deletions.
diff --git a/trubar/actions.py b/trubar/actions.py
@@ -1,15 +1,15 @@
+import ast
 import dataclasses
 import os
 import re
 import shutil
 import json
-from itertools import islice
 from typing import Union, List, Optional, NamedTuple, Tuple, Dict
 
 import libcst as cst
 from libcst.metadata import ParentNodeProvider
 
-from trubar.utils import walk_files, make_list
+from trubar.utils import walk_files
 from trubar.messages import MsgNode, MsgDict
 from trubar.config import config
 
@@ -350,82 +350,99 @@ def push_context(self, node: NamespaceNode) -> None:
     @classmethod
     def _f_string_languages(cls,
                             node: SomeString,
-                            messages: List[str]) -> List[str]:
-        # Don't prefix if auto_prefix is off, or we already have it,
-        # or the original already has braces (although without the f-prefix)
-        if not config.auto_prefix \
-                or "f" in node.prefix \
-                or re_braced.search(messages[0]):
-            return []
-
-        quotes = (node.quote, ) + (all_quotes if config.smart_quotes else ())
+                            messages: List[str]) -> set[int]:
+        """
+        For the given messages, return a set of indices of languages that
+        requires an f-prefix. This includes the original language, 0.
+
+        This is determined by checking that the string includes braces and,
+        if so, that it compiles to something that includes an f-string after
+        trying all quote types.
+
+        Empty set if
+         - the original string is not an f-stirng and auto_prefix is disabled
+         - the original string already has braces but no f-prefix.
+        """
+        add_f = set()
+        prefix = node.prefix
+        if "f" not in prefix:
+            if not config.auto_prefix or re_braced.search(messages[0]):
+                return add_f
+            prefix += "f"
+        else:
+            add_f.add(0)
 
-        add_f = []
-        for translation, langdef in zip(messages[1:],
-                                        islice(config.languages.values(), 1, None)):
+        for i, translation in enumerate(messages[1:], start=1):
             if not re_braced.search(translation):
                 continue
-            for quote in quotes:
+            for quote in all_quotes:
                 try:
                     new_node = cst.parse_expression(
-                        f'f{node.prefix}{quote}{translation}{quote}')
+                        f'{prefix}{quote}{translation}{quote}')
                     assert isinstance(new_node, cst.FormattedString)
                 except cst.ParserSyntaxError:
                     continue
                 if any(isinstance(part, cst.FormattedStringExpression)
                        for part in new_node.parts):
-                    add_f.append(f"{langdef.international_name} ({translation})")
+                    add_f.add(i)
                     break
         return add_f
 
-    @staticmethod
-    def _get_quote(node: SomeString,
+    @classmethod
+    def _get_quote(cls,
+                   node: SomeString,
                    orig_str: str,
-                   messages: List[str],
-                   prefix: str, need_f: List[str]) -> str:
+                   translation: str,
+                   language_index: int,
+                   prefix: str) -> str:
+        """
+        Return a suitable quote for the given translation.
+
+        The method tries all quote types (starting with the original) and
+        returns the first one that compiles. If none compiles, raises a
+        TranslationError.
+
+        The method is used for f-strings.
+        """
         quotes = (node.quote, ) + (all_quotes if config.smart_quotes else ())
-
-        for fquote in quotes:
-            for translation in messages:
-                try:
-                    compile(f"{prefix}{fquote}{translation}{fquote}",
-                            '<string>', 'eval')
-                except SyntaxError:
-                    break
+        for quote in quotes:
+            try:
+                compiled = ast.parse(
+                    f"{prefix}{quote}{translation}{quote}",
+                    mode="eval")
+            except SyntaxError:
+                pass
             else:
-                return fquote
+                compiled = compiled.body
+                if isinstance(compiled, ast.JoinedStr) \
+                        or isinstance(compiled, ast.Constant) \
+                        and isinstance(compiled.value, str):
+                    return quote
 
         # No suitable quotes, raise an exception
         hints = ""
         if "f" in node.prefix:
             hints += f"\n- String {orig_str} is an f-string"
         else:
             hints += (
-                f"\n- Original string, {orig_str}, is not an f-string, "
-                f"but {make_list(need_f, 'seem')} to require f-strings "
-                "and auto-prefix option is set.")
+                "\n- Original string is not an f-string, but the translation \n"
+                "seems to be an f-string and auto-prefix option is set.")
         if config.smart_quotes:
             hints += \
                 "\n- I tried all quote types, even triple-quotes"
         else:
             hints += \
                 "\n- Try enabling smart quotes to allow changing the quote type"
-        if any(map(re_single_quote.search, messages)) \
-                and any(map(re_double_quote.search, messages)):
-            hints += \
-                "\n- Some translations use single quotes and some use double"
-        if len(fquote) != 3 and "\n" in "".join(messages[1:]):
+        if len(quote) != 3 and "\n" in translation:
             hints += \
                 "\n- Check for any unescaped \\n's"
 
-        languages = iter(config.languages.values())
-        original = f"{orig_str} ({next(languages).international_name})"
-        trans = "\n".join(f"  - {msg} ({langdef.international_name})"
-                          for msg, langdef in zip(messages[1:], languages))
+        languages = list(config.languages.values())
+        language = languages[language_index].international_name
         raise TranslationError(
-            f"Probable syntax error in translation of {orig_str}.\n"
-            f"Original: {original}\n"
-            f"Translations:\n{trans}\n"
+            f"Probable syntax error in translation to {language}.\n"
+            f"Original: {orig_str}\n"
+            f"Translation to {language}:\n  {translation}\n"
             "Some hints:" + hints)
 
     def translate(
@@ -450,13 +467,17 @@ def translate(
             translation if isinstance(translation, str) else original
             for translation in messages]
 
-        need_f = self._f_string_languages(node, messages)
-        prefix = "f" + node.prefix if need_f else node.prefix
-
         idx = len(self.message_tables[0])
-        if "f" in prefix:
-            quote = self._get_quote(node, orig_str, messages, prefix, need_f)
-            for message, table in zip(messages, self.message_tables):
+        need_f = self._f_string_languages(node, messages)
+        if need_f:
+            fprefix = node.prefix
+            if "f" not in fprefix:
+                fprefix = "f" + fprefix
+            for lang_idx, (message, table) in \
+                    enumerate(zip(messages, self.message_tables)):
+                prefix = fprefix if lang_idx in need_f else node.prefix
+                quote = self._get_quote(
+                    node, orig_str, message, lang_idx, prefix)
                 table.append(f"{prefix}{quote}{message}{quote}")
             trans = f'_tr.e(_tr.c({idx}, {orig_str}))'
         else:

diff --git a/trubar/tests/test_actions.py b/trubar/tests/test_actions.py
@@ -387,35 +387,31 @@ def test_f_string_languages(self):
 
         node.prefix = "f"
         node.quote = "'"
-        # Original is an f-string - don't add
-        self.assertEqual(m(node, ["a string", "one", "two{x}"]), [])
+        # Original is an f-string, and so is one of translations
+        self.assertEqual(m(node, ["a {s}tring", "one", "two{x}"]), {0, 2})
+
+        # Only original needs it
+        self.assertEqual(m(node, ["a {s}tring", "one", "two"]), {0})
 
         node.prefix = ""
         m = StringTranslatorMultilingual._f_string_languages
         # No language needs it
-        self.assertEqual(m(node, ["a string", "one", "two"]),
-                         [])
-
-        # English needs it
-        self.assertEqual(m(node, ["a string", "one", "two{x}"]),
-                         ["English (two{x})"])
-        # Slovenian and English needs it
-        self.assertEqual(m(node, ["a string", "one{y}", "two{x}"]),
-                         ["Slovenian (one{y})", "English (two{x})"])
+        self.assertEqual(m(node, ["a string", "one", "two"]), set())
+
         # Original is not an f-string, but has {},
         # hence translations are supposed to have them without being f-strings
-        self.assertEqual(m(node, ["a string{x}", "one{y}", "two{x}"]),
-                         [])
+        self.assertEqual(m(node, ["a string{x}", "one{y}", "two{x}"]), set())
 
+        # Original is not an f-string, but one of translations is
         for quote in ['"', "'", "'''", '"""']:
             self.assertEqual(m(node, ["a string", "one", f"t{quote}wo{{x}}"]),
-                             [f"English (t{quote}wo{{x}})"])
+                             {2})
 
-        # No smart quotes
-        with patch("trubar.config.config.smart_quotes", False):
+        # Original is not an f-string, and auto-prefix is off
+        with patch("trubar.config.config.auto_prefix", False):
             self.assertEqual(
                 m(node, ["a string", "on'e", "tw'o{x}"]),
-                [])
+                set())
 
     def test_get_quote(self):
         node = Mock()
@@ -424,65 +420,44 @@ def test_get_quote(self):
         node.prefix = ""
         node.quote = '"'
         self.assertEqual(
-            m(node, "'a string'", ["a string", "one", "two{x}"],
-              "", ["English"]),
-            '"')
+            m(node, "'a string'", "a string", 2, ""), '"')
 
         node.quote = "'''"
         self.assertEqual(
-            m(node, "'a string'", ["a string", "one", "two{x}"],
-              "", ["English"]),
-            "'''")
+            m(node, "'a string'", "a string", 2, ""), "'''")
 
         node.quote = "'"
         self.assertEqual(
-            m(node, "'a string'", ["a string", "one", "two{x}"],
-              "", ["English"]),
-            "'")
+            m(node, "'a string'", "a string", 2, ""), "'")
 
         node.quote = "'"
         self.assertEqual(
-            m(node, "'a string'", ["a string", "one", "tw'o{x}"],
-              "", ["English"]),
-            '"')
+            m(node, "'a string'", "tw'o{x}", 2, ""), '"')
 
         node.quote = "'"
-        self.assertEqual(
-            m(node, "'a str'ing'", ["a str'ing", "one", "two{x}"],
-              "", ["English"]),
-            '"')
-
-        node.quote = "'"
-        self.assertEqual(
-            m(node, "'a str'ing'", ["a str'ing", "on\"e", "two{x}"],
-              "", ["English"]),
-            "'''")
+        self.assertIn(
+            m(node, "'a str'ing'", "a str'i\"ng", 2, ""),
+            ("'''", '"""'))
 
         node.quote = "'"
         self.assertEqual(
-            m(node, "'a str'''ing'", ["a str'''ing", "on\"e", "two{x}"],
-              "", ["English"]),
-            '"""')
+            m(node, "'a str'''ing'", "s\"tr'''i'n\"g", 2, ""), '"""')
 
         node.quote = "'"
         self.assertRaises(
             TranslationError,
-            m, node, "'a str'''ing'", ["a str'''ing", "one", "tw\"\"\"o{x}"],
-            "", ["English"])
+            m, node, "'a str'''ing'", "a \"\"\"s\"t\"r'''in'g", 2, "")
 
         with patch("trubar.config.config.smart_quotes", False):
             node.quote = "'"
             self.assertRaises(
                 TranslationError,
-                m, node, "'a str'ing'", ["a str'ing", "one", "two{x}"],
-                "", ["English"])
+                m, node, "'a str'ing'", "a str'ing", 2, "")
 
             node.quote = "'"
             self.assertRaises(
                 TranslationError,
-                m, node, "'a str'''ing'",
-                ["a str'''ing", "one", "tw\"\"\"o{x}"],
-                "", ["English"])
+                m, node, "'a str'''ing'", "a str'''ing", 2, "")
 
     def test_auto_prefix(self):
         # No f-strings, no problems
@@ -503,11 +478,11 @@ def test_auto_prefix(self):
         self.assertEqual(translation, "print(_tr.e(_tr.c(0, f'fo{o}')))")
         self.assertEqual(tables, [["f'fo{o}'"], ["f'dont'"], ["f'fo{o}'"]])
 
-        # Original is not an f-string, one of translations is
+        # Original is not an f-string, one of translations is, one is not
         translation, tables = self._translate(
             "print('foo')", [{"foo": "do{n}t"}, {"foo": "bar"}])
         self.assertEqual(translation, "print(_tr.e(_tr.c(0, 'foo')))")
-        self.assertEqual(tables, [["f'foo'"], ["f'do{n}t'"], ["f'bar'"]])
+        self.assertEqual(tables, [["'foo'"], ["f'do{n}t'"], ["'bar'"]])
 
         with patch("trubar.config.config.auto_prefix", False):
             translation, tables = self._translate(
@@ -522,15 +497,15 @@ def test_smart_quotes_and_f(self):
         self.assertEqual(translation, "print(_tr.e(_tr.c(0, f'foo')))")
         self.assertEqual(
             tables,
-            [["f'''foo'''"], ["f'''don't'''"], ["f'''x\"y'''"]])
+            [["f'foo'"], ["f\"don't\""], ["f'x\"y'"]])
 
         # One language has an f-string, and translations have different quotes
         self._translate(
             "print('foo')", [{"foo": "d{o}n't"}, {"foo": 'x"y'}])
         self.assertEqual(translation, "print(_tr.e(_tr.c(0, f'foo')))")
         self.assertEqual(
             tables,
-            [["f'''foo'''"], ["f'''don't'''"], ["f'''x\"y'''"]])
+            [["f'foo'"], ["f\"don't\""], ["f'x\"y'"]])
 
         with patch("trubar.config.config.smart_quotes", False):
             # Mismatching quotes