[IMP] translations: parse views iteratively instead of recursively

[odoo/odoo.git] / openerp / tools / translate.py
diff --git a/openerp/tools/translate.py b/openerp/tools/translate.py

index f373f71..37e6492 100644 (file)
--- a/openerp/tools/translate.py
+++ b/openerp/tools/translate.py
@@ -25,7 +25,6 @@ import fnmatch
  import inspect
  import locale
  import os
-import openerp.pooler as pooler
  import openerp.sql_db as sql_db
  import re
  import logging
@@ -40,9 +39,9 @@ from lxml import etree
  
  import config
  import misc
-from misc import UpdateableStr
  from misc import SKIPPED_ELEMENT_TYPES
  import osutil
+import openerp
  from openerp import SUPERUSER_ID
  
  _logger = logging.getLogger(__name__)
@@ -50,13 +49,15 @@ _logger = logging.getLogger(__name__)
  # used to notify web client that these translations should be loaded in the UI
  WEB_TRANSLATION_COMMENT = "openerp-web"
  
+SKIPPED_ELEMENTS = ('script', 'style')
+
  _LOCALE2WIN32 = {
      'af_ZA': 'Afrikaans_South Africa',
      'sq_AL': 'Albanian_Albania',
      'ar_SA': 'Arabic_Saudi Arabia',
      'eu_ES': 'Basque_Spain',
      'be_BY': 'Belarusian_Belarus',
-    'bs_BA': 'Serbian (Latin)',
+    'bs_BA': 'Bosnian_Bosnia and Herzegovina',
      'bg_BG': 'Bulgarian_Bulgaria',
      'ca_ES': 'Catalan_Spain',
      'hr_HR': 'Croatian_Croatia',
@@ -93,7 +94,6 @@ _LOCALE2WIN32 = {
      'lt_LT': 'Lithuanian_Lithuania',
      'lat': 'Latvian_Latvia',
      'ml_IN': 'Malayalam_India',
-    'id_ID': 'Indonesian_indonesia',
      'mi_NZ': 'Maori',
      'mn': 'Cyrillic_Mongolian',
      'no_NO': 'Norwegian_Norway',
@@ -103,7 +103,6 @@ _LOCALE2WIN32 = {
      'pt_BR': 'Portuguese_Brazil',
      'ro_RO': 'Romanian_Romania',
      'ru_RU': 'Russian_Russia',
-    'mi_NZ': 'Maori',
      'sr_CS': 'Serbian (Cyrillic)_Serbia and Montenegro',
      'sk_SK': 'Slovak_Slovakia',
      'sl_SI': 'Slovenian_Slovenia',
@@ -131,7 +130,6 @@ _LOCALE2WIN32 = {
      'sv_SE': 'Swedish_Sweden',
      'ta_IN': 'English_Australia',
      'th_TH': 'Thai_Thailand',
-    'mi_NZ': 'Maori',
      'tr_TR': 'Turkish_Turkey',
      'uk_UA': 'Ukrainian_Ukraine',
      'vi_VN': 'Vietnamese_Viet Nam',
@@ -167,38 +165,60 @@ class GettextAlias(object):
          if db_name:
              return sql_db.db_connect(db_name)
  
-    def _get_cr(self, frame):
-        is_new_cr = False
-        cr = frame.f_locals.get('cr', frame.f_locals.get('cursor'))
-        if not cr:
-            s = frame.f_locals.get('self', {})
-            cr = getattr(s, 'cr', None)
-        if not cr:
+    def _get_cr(self, frame, allow_create=True):
+        # try, in order: cr, cursor, self.env.cr, self.cr
+        if 'cr' in frame.f_locals:
+            return frame.f_locals['cr'], False
+        if 'cursor' in frame.f_locals:
+            return frame.f_locals['cursor'], False
+        s = frame.f_locals.get('self')
+        if hasattr(s, 'env'):
+            return s.env.cr, False
+        if hasattr(s, 'cr'):
+            return s.cr, False
+        if allow_create:
+            # create a new cursor
              db = self._get_db()
-            if db:
-                cr = db.cursor()
-                is_new_cr = True
-        return cr, is_new_cr
+            if db is not None:
+                return db.cursor(), True
+        return None, False
+
+    def _get_uid(self, frame):
+        # try, in order: uid, user, self.env.uid
+        if 'uid' in frame.f_locals:
+            return frame.f_locals['uid']
+        if 'user' in frame.f_locals:
+            return int(frame.f_locals['user'])      # user may be a record
+        s = frame.f_locals.get('self')
+        return s.env.uid
  
      def _get_lang(self, frame):
+        # try, in order: context.get('lang'), kwargs['context'].get('lang'),
+        # self.env.lang, self.localcontext.get('lang')
          lang = None
-        ctx = frame.f_locals.get('context')
-        if not ctx:
-            kwargs = frame.f_locals.get('kwargs')
-            if kwargs is None:
-                args = frame.f_locals.get('args')
-                if args and isinstance(args, (list, tuple)) \
-                        and isinstance(args[-1], dict):
-                    ctx = args[-1]
-            elif isinstance(kwargs, dict):
-                ctx = kwargs.get('context')
-        if ctx:
-            lang = ctx.get('lang')
+        if frame.f_locals.get('context'):
+            lang = frame.f_locals['context'].get('lang')
+        if not lang:
+            kwargs = frame.f_locals.get('kwargs', {})
+            if kwargs.get('context'):
+                lang = kwargs['context'].get('lang')
          if not lang:
-            s = frame.f_locals.get('self', {})
-            c = getattr(s, 'localcontext', None)
-            if c:
-                lang = c.get('lang')
+            s = frame.f_locals.get('self')
+            if hasattr(s, 'env'):
+                lang = s.env.lang
+            if not lang:
+                if hasattr(s, 'localcontext'):
+                    lang = s.localcontext.get('lang')
+            if not lang:
+                # Last resort: attempt to guess the language of the user
+                # Pitfall: some operations are performed in sudo mode, and we
+                #          don't know the original uid, so the language may
+                #          be wrong when the admin language differs.
+                pool = getattr(s, 'pool', None)
+                (cr, dummy) = self._get_cr(frame, allow_create=False)
+                uid = self._get_uid(frame)
+                if pool and cr and uid:
+                    lang = pool['res.users'].context_get(cr, uid)['lang']
          return lang
  
      def __call__(self, source):
@@ -217,8 +237,8 @@ class GettextAlias(object):
                  cr, is_new_cr = self._get_cr(frame)
                  if cr:
                      # Try to use ir.translation to benefit from global cache if possible
-                    pool = pooler.get_pool(cr.dbname)
-                    res = pool.get('ir.translation')._get_source(cr, SUPERUSER_ID, None, ('code','sql_constraint'), lang, source)
+                    registry = openerp.registry(cr.dbname)
+                    res = registry['ir.translation']._get_source(cr, SUPERUSER_ID, None, ('code','sql_constraint'), lang, source)
                  else:
                      _logger.debug('no context cursor detected, skipping translation for "%r"', source)
              else:
@@ -262,7 +282,7 @@ class TinyPoFile(object):
      def __iter__(self):
          self.buffer.seek(0)
          self.lines = self._get_lines()
-        self.lines_count = len(self.lines);
+        self.lines_count = len(self.lines)
  
          self.first = True
          self.extra_lines= []
@@ -278,7 +298,7 @@ class TinyPoFile(object):
          return lines
  
      def cur_line(self):
-        return (self.lines_count - len(self.lines))
+        return self.lines_count - len(self.lines)
  
      def next(self):
          trans_type = name = res_id = source = trad = None
@@ -291,7 +311,7 @@ class TinyPoFile(object):
              targets = []
              line = None
              fuzzy = False
-            while (not line):
+            while not line:
                  if 0 == len(self.lines):
                      raise StopIteration()
                  line = self.lines.pop(0).strip()
@@ -303,6 +323,10 @@ class TinyPoFile(object):
                      if not line.startswith('module:'):
                          comments.append(line)
                  elif line.startswith('#:'):
+                    # Process the `reference` comments. Each line can specify
+                    # multiple targets (e.g. model, view, code, selection,
+                    # ...). For each target, we will return an additional
+                    # entry.
                      for lpart in line[2:].strip().split(' '):
                          trans_info = lpart.strip().split(':',2)
                          if trans_info and len(trans_info) == 2:
@@ -352,6 +376,9 @@ class TinyPoFile(object):
                  line = self.lines.pop(0).strip()
  
              if targets and not fuzzy:
+                # Use the first target for the current entry (returned at the
+                # end of this next() call), and keep the others to generate
+                # additional entries (returned by the following next() calls).
                  trans_type, name, res_id = targets.pop(0)
                  for t, n, r in targets:
                      if t == trans_type == 'code': continue
@@ -443,12 +470,17 @@ def trans_export(lang, modules, buffer, format, cr):
              for module, type, name, res_id, src, trad, comments in rows:
                  row = grouped_rows.setdefault(src, {})
                  row.setdefault('modules', set()).add(module)
-                if ('translation' not in row) or (not row['translation']):
+                if not row.get('translation') and trad != src:
                      row['translation'] = trad
                  row.setdefault('tnrs', []).append((type, name, res_id))
                  row.setdefault('comments', set()).update(comments)
  
-            for src, row in grouped_rows.items():
+            for src, row in sorted(grouped_rows.items()):
+                if not lang:
+                    # translation template, so no translation value
+                    row['translation'] = ''
+                elif not row.get('translation'):
+                    row['translation'] = src
                  writer.write(row['modules'], row['tnrs'], src, row['translation'], row['comments'])
  
          elif format == 'tgz':
@@ -484,16 +516,25 @@ def trans_export(lang, modules, buffer, format, cr):
      del translations
  
  def trans_parse_xsl(de):
+    return list(set(trans_parse_xsl_aux(de, False)))
+
+def trans_parse_xsl_aux(de, t):
      res = []
+
      for n in de:
-        if n.get("t"):
-            for m in n:
-                if isinstance(m, SKIPPED_ELEMENT_TYPES) or not m.text:
+        t = t or n.get("t")
+        if t:
+                if isinstance(n, SKIPPED_ELEMENT_TYPES) or n.tag.startswith('{http://www.w3.org/1999/XSL/Transform}'):
                      continue
-                l = m.text.strip().replace('\n',' ')
-                if len(l):
-                    res.append(l.encode("utf8"))
-        res.extend(trans_parse_xsl(n))
+                if n.text:
+                    l = n.text.strip().replace('\n',' ')
+                    if len(l):
+                        res.append(l.encode("utf8"))
+                if n.tail:
+                    l = n.tail.strip().replace('\n',' ')
+                    if len(l):
+                        res.append(l.encode("utf8"))
+        res.extend(trans_parse_xsl_aux(n, t))
      return res
  
  def trans_parse_rml(de):
@@ -509,26 +550,33 @@ def trans_parse_rml(de):
          res.extend(trans_parse_rml(n))
      return res
  
-def trans_parse_view(de):
-    res = []
-    if de.text and de.text.strip():
-        res.append(de.text.strip().encode("utf8"))
-    if de.tail and de.tail.strip():
-        res.append(de.tail.strip().encode("utf8"))
-    if de.tag == 'attribute' and de.get("name") == 'string':
-        if de.text:
-            res.append(de.text.encode("utf8"))
-    if de.get("string"):
-        res.append(de.get('string').encode("utf8"))
-    if de.get("help"):
-        res.append(de.get('help').encode("utf8"))
-    if de.get("sum"):
-        res.append(de.get('sum').encode("utf8"))
-    if de.get("confirm"):
-        res.append(de.get('confirm').encode("utf8"))
-    for n in de:
-        res.extend(trans_parse_view(n))
-    return res
+def _push(callback, term, source_line):
+    """ Sanity check before pushing translation terms """
+    term = (term or "").strip().encode('utf8')
+    # Avoid non-char tokens like ':' '...' '.00' etc.
+    if len(term) > 8 or any(x.isalpha() for x in term):
+        callback(term, source_line)
+
+def trans_parse_view(element, callback):
+    """ Helper method to iteratively walk an etree document representing a
+        regular view and call ``callback(term, source_line)`` for each
+        translatable term that is found in the document.
+
+        :param ElementTree element: root of etree document to extract terms from
+        :param callable callback: a callable in the form ``f(term, source_line)``,
+            that will be called for each extracted term.
+    """
+    for el in element.iter():
+        if (not isinstance(el, SKIPPED_ELEMENT_TYPES)
+                and el.tag.lower() not in SKIPPED_ELEMENTS
+                and el.text):
+            _push(callback, el.text, el.sourceline)
+        if el.tail:
+            _push(callback, el.tail, el.sourceline)
+        for attr in ('string', 'help', 'sum', 'confirm', 'placeholder'):
+            value = el.get(attr)
+            if value:
+                _push(callback, value, el.sourceline)
  
  # tests whether an object is in a list of modules
  def in_modules(object_name, modules):
@@ -544,9 +592,34 @@ def in_modules(object_name, modules):
      module = module_dict.get(module, module)
      return module in modules
  
+def _extract_translatable_qweb_terms(element, callback):
+    """ Helper method to walk an etree document representing
+        a QWeb template, and call ``callback(term, source_line)``
+        for each translatable term that is found in the document.
+
+        :param etree._Element element: root of etree document to extract terms from
+        :param Callable callback: a callable in the form ``f(term, source_line)``,
+                                  that will be called for each extracted term.
+    """
+    # not using elementTree.iterparse because we need to skip sub-trees in case
+    # the ancestor element had a reason to be skipped
+    for el in element:
+        if isinstance(el, SKIPPED_ELEMENT_TYPES): continue
+        if (el.tag.lower() not in SKIPPED_ELEMENTS
+                and "t-js" not in el.attrib
+                and not ("t-jquery" in el.attrib and "t-operation" not in el.attrib)
+                and not ("t-translation" in el.attrib and
+                         el.attrib["t-translation"].strip() == "off")):
+            _push(callback, el.text, el.sourceline)
+            for att in ('title', 'alt', 'label', 'placeholder'):
+                if att in el.attrib:
+                    _push(callback, el.attrib[att], el.sourceline)
+            _extract_translatable_qweb_terms(el, callback)
+        _push(callback, el.tail, el.sourceline)
  
  def babel_extract_qweb(fileobj, keywords, comment_tags, options):
      """Babel message extractor for qweb template files.
+
      :param fileobj: the file-like object the messages should be extracted from
      :param keywords: a list of keywords (i.e. function names) that should
                       be recognized as translation functions
@@ -555,43 +628,23 @@ def babel_extract_qweb(fileobj, keywords, comment_tags, options):
      :param options: a dictionary of additional options (optional)
      :return: an iterator over ``(lineno, funcname, message, comments)``
               tuples
-    :rtype: ``iterator``
+    :rtype: Iterable
      """
      result = []
      def handle_text(text, lineno):
-        text = (text or "").strip()
-        if len(text) > 1: # Avoid mono-char tokens like ':' ',' etc.
-            result.append((lineno, None, text, []))
-
-    # not using elementTree.iterparse because we need to skip sub-trees in case
-    # the ancestor element had a reason to be skipped
-    def iter_elements(current_element):
-        for el in current_element:
-            if isinstance(el, SKIPPED_ELEMENT_TYPES): continue
-            if "t-js" not in el.attrib and \
-                    not ("t-jquery" in el.attrib and "t-operation" not in el.attrib) and \
-                    not ("t-translation" in el.attrib and el.attrib["t-translation"].strip() == "off"):
-                handle_text(el.text, el.sourceline)
-                for att in ('title', 'alt', 'label', 'placeholder'):
-                    if att in el.attrib:
-                        handle_text(el.attrib[att], el.sourceline)
-                iter_elements(el)
-            handle_text(el.tail, el.sourceline)
-
+        result.append((lineno, None, text, []))
      tree = etree.parse(fileobj)
-    iter_elements(tree.getroot())
-
+    _extract_translatable_qweb_terms(tree.getroot(), handle_text)
      return result
  
-
  def trans_generate(lang, modules, cr):
      dbname = cr.dbname
  
-    pool = pooler.get_pool(dbname)
-    trans_obj = pool.get('ir.translation')
-    model_data_obj = pool.get('ir.model.data')
+    registry = openerp.registry(dbname)
+    trans_obj = registry.get('ir.translation')
+    model_data_obj = registry.get('ir.model.data')
      uid = 1
-    l = pool.models.items()
+    l = registry.models.items()
      l.sort()
  
      query = 'SELECT name, model, res_id, module'    \
@@ -620,7 +673,6 @@ def trans_generate(lang, modules, cr):
          # empty and one-letter terms are ignored, they probably are not meant to be
          # translated, and would be very hard to translate anyway.
          if not source or len(source.strip()) <= 1:
-            _logger.debug("Ignoring empty or 1-letter source term: %r", tuple)
              return
          if tuple not in _to_translate:
              _to_translate.append(tuple)
@@ -630,69 +682,49 @@ def trans_generate(lang, modules, cr):
              return s.encode('utf8')
          return s
  
+    def push(mod, type, name, res_id, term):
+        term = (term or '').strip()
+        if len(term) > 2:
+            push_translation(mod, type, name, res_id, term)
+
+    def get_root_view(xml_id):
+        view = model_data_obj.xmlid_to_object(cr, uid, xml_id)
+        if view:
+            while view.mode != 'primary':
+                view = view.inherit_id
+        xml_id = view.get_external_id(cr, uid).get(view.id, xml_id)
+        return xml_id
+
      for (xml_name,model,res_id,module) in cr.fetchall():
          module = encode(module)
          model = encode(model)
          xml_name = "%s.%s" % (module, encode(xml_name))
  
-        if not pool.get(model):
+        if model not in registry:
              _logger.error("Unable to find object %r", model)
              continue
  
-        exists = pool.get(model).exists(cr, uid, res_id)
+        if not registry[model]._translate:
+            # explicitly disabled
+            continue
+
+        exists = registry[model].exists(cr, uid, res_id)
          if not exists:
              _logger.warning("Unable to find object %r with id %d", model, res_id)
              continue
-        obj = pool.get(model).browse(cr, uid, res_id)
+        obj = registry[model].browse(cr, uid, res_id)
  
          if model=='ir.ui.view':
              d = etree.XML(encode(obj.arch))
-            for t in trans_parse_view(d):
-                push_translation(module, 'view', encode(obj.model), 0, t)
+            if obj.type == 'qweb':
+                view_id = get_root_view(xml_name)
+                push_qweb = lambda t,l: push(module, 'view', 'website', view_id, t)
+                _extract_translatable_qweb_terms(d, push_qweb)
+            else:
+                push_view = lambda t,l: push(module, 'view', obj.model, xml_name, t)
+                trans_parse_view(d, push_view)
          elif model=='ir.actions.wizard':
-            service_name = 'wizard.'+encode(obj.wiz_name)
-            import openerp.netsvc as netsvc
-            if netsvc.Service._services.get(service_name):
-                obj2 = netsvc.Service._services[service_name]
-                for state_name, state_def in obj2.states.iteritems():
-                    if 'result' in state_def:
-                        result = state_def['result']
-                        if result['type'] != 'form':
-                            continue
-                        name = "%s,%s" % (encode(obj.wiz_name), state_name)
-
-                        def_params = {
-                            'string': ('wizard_field', lambda s: [encode(s)]),
-                            'selection': ('selection', lambda s: [encode(e[1]) for e in ((not callable(s)) and s or [])]),
-                            'help': ('help', lambda s: [encode(s)]),
-                        }
-
-                        # export fields
-                        if not result.has_key('fields'):
-                            _logger.warning("res has no fields: %r", result)
-                            continue
-                        for field_name, field_def in result['fields'].iteritems():
-                            res_name = name + ',' + field_name
-
-                            for fn in def_params:
-                                if fn in field_def:
-                                    transtype, modifier = def_params[fn]
-                                    for val in modifier(field_def[fn]):
-                                        push_translation(module, transtype, res_name, 0, val)
-
-                        # export arch
-                        arch = result['arch']
-                        if arch and not isinstance(arch, UpdateableStr):
-                            d = etree.XML(arch)
-                            for t in trans_parse_view(d):
-                                push_translation(module, 'wizard_view', name, 0, t)
-
-                        # export button labels
-                        for but_args in result['state']:
-                            button_name = but_args[0]
-                            button_label = but_args[1]
-                            res_name = name + ',' + button_name
-                            push_translation(module, 'wizard_button', res_name, 0, button_label)
+            pass # TODO Can model really be 'ir.actions.wizard' ?
  
          elif model=='ir.model.fields':
              try:
@@ -700,8 +732,9 @@ def trans_generate(lang, modules, cr):
              except AttributeError, exc:
                  _logger.error("name error in %s: %s", xml_name, str(exc))
                  continue
-            objmodel = pool.get(obj.model)
-            if not objmodel or not field_name in objmodel._columns:
+            objmodel = registry.get(obj.model)
+            if (objmodel is None or field_name not in objmodel._columns
+                    or not objmodel._translate):
                  continue
              field_def = objmodel._columns[field_name]
  
@@ -752,85 +785,77 @@ def trans_generate(lang, modules, cr):
                  except (IOError, etree.XMLSyntaxError):
                      _logger.exception("couldn't export translation for report %s %s %s", name, report_type, fname)
  
-        for field_name,field_def in obj._table._columns.items():
+        for field_name, field_def in obj._columns.items():
+            if model == 'ir.model' and field_name == 'name' and obj.name == obj.model:
+                # ignore model name if it is the technical one, nothing to translate
+                continue
              if field_def.translate:
                  name = model + "," + field_name
                  try:
-                    trad = getattr(obj, field_name) or ''
+                    term = obj[field_name] or ''
                  except:
-                    trad = ''
-                push_translation(module, 'model', name, xml_name, encode(trad))
+                    term = ''
+                push_translation(module, 'model', name, xml_name, encode(term))
  
          # End of data for ir.model.data query results
  
      cr.execute(query_models, query_param)
  
      def push_constraint_msg(module, term_type, model, msg):
-        # Check presence of __call__ directly instead of using
-        # callable() because it will be deprecated as of Python 3.0
          if not hasattr(msg, '__call__'):
-            push_translation(module, term_type, model, 0, encode(msg))
-
+            push_translation(encode(module), term_type, encode(model), 0, encode(msg))
+
+    def push_local_constraints(module, model, cons_type='sql_constraints'):
+        """Climb up the class hierarchy and ignore inherited constraints
+           from other modules"""
+        term_type = 'sql_constraint' if cons_type == 'sql_constraints' else 'constraint'
+        msg_pos = 2 if cons_type == 'sql_constraints' else 1
+        for cls in model.__class__.__mro__:
+            if getattr(cls, '_module', None) != module:
+                continue
+            constraints = getattr(cls, '_local_' + cons_type, [])
+            for constraint in constraints:
+                push_constraint_msg(module, term_type, model._name, constraint[msg_pos])
+            
      for (_, model, module) in cr.fetchall():
-        module = encode(module)
-        model = encode(model)
-
-        model_obj = pool.get(model)
-
-        if not model_obj:
+        if model not in registry:
              _logger.error("Unable to find object %r", model)
              continue
  
-        for constraint in getattr(model_obj, '_constraints', []):
-            push_constraint_msg(module, 'constraint', model, constraint[1])
-
-        for constraint in getattr(model_obj, '_sql_constraints', []):
-            push_constraint_msg(module, 'sql_constraint', model, constraint[2])
-
-    def get_module_from_path(path, mod_paths=None):
-        if not mod_paths:
-            # First, construct a list of possible paths
-            def_path = os.path.abspath(os.path.join(config.config['root_path'], 'addons'))     # default addons path (base)
-            ad_paths= map(lambda m: os.path.abspath(m.strip()),config.config['addons_path'].split(','))
-            mod_paths=[def_path]
-            for adp in ad_paths:
-                mod_paths.append(adp)
-                if not os.path.isabs(adp):
-                    mod_paths.append(adp)
-                elif adp.startswith(def_path):
-                    mod_paths.append(adp[len(def_path)+1:])
-        for mp in mod_paths:
-            if path.startswith(mp) and (os.path.dirname(path) != mp):
-                path = path[len(mp)+1:]
-                return path.split(os.path.sep)[0]
-        return 'base'   # files that are not in a module are considered as being in 'base' module
+        model_obj = registry[model]
  
-    modobj = pool.get('ir.module.module')
-    installed_modids = modobj.search(cr, uid, [('state', '=', 'installed')])
-    installed_modules = map(lambda m: m['name'], modobj.read(cr, uid, installed_modids, ['name']))
+        if model_obj._constraints:
+            push_local_constraints(module, model_obj, 'constraints')
  
-    root_path = os.path.join(config.config['root_path'], 'addons')
+        if model_obj._sql_constraints:
+            push_local_constraints(module, model_obj, 'sql_constraints')
  
-    apaths = map(os.path.abspath, map(str.strip, config.config['addons_path'].split(',')))
-    if root_path in apaths:
-        path_list = apaths
-    else :
-        path_list = [root_path,] + apaths
+    modobj = registry['ir.module.module']
+    installed_modids = modobj.search(cr, uid, [('state', '=', 'installed')])
+    installed_modules = map(lambda m: m['name'], modobj.read(cr, uid, installed_modids, ['name']))
  
+    path_list = list(openerp.modules.module.ad_paths)
      # Also scan these non-addon paths
      for bin_path in ['osv', 'report' ]:
          path_list.append(os.path.join(config.config['root_path'], bin_path))
  
-    _logger.debug("Scanning modules at paths: ", path_list)
+    _logger.debug("Scanning modules at paths: %s", path_list)
  
-    mod_paths = []
+    mod_paths = list(path_list)
+
+    def get_module_from_path(path):
+        for mp in mod_paths:
+            if path.startswith(mp) and (os.path.dirname(path) != mp):
+                path = path[len(mp)+1:]
+                return path.split(os.path.sep)[0]
+        return 'base'   # files that are not in a module are considered as being in 'base' module
  
      def verified_module_filepaths(fname, path, root):
          fabsolutepath = join(root, fname)
          frelativepath = fabsolutepath[len(path):]
          display_path = "addons%s" % frelativepath
-        module = get_module_from_path(fabsolutepath, mod_paths=mod_paths)
-        if (('all' in modules) or (module in modules)) and module in installed_modules:
+        module = get_module_from_path(fabsolutepath)
+        if ('all' in modules or module in modules) and module in installed_modules:
              return module, fabsolutepath, frelativepath, display_path
          return None, None, None, None
  
@@ -841,8 +866,11 @@ def trans_generate(lang, modules, cr):
          if module:
              src_file = open(fabsolutepath, 'r')
              try:
-                for lineno, message, comments in extract.extract(extract_method, src_file,
-                                                                 keywords=extract_keywords):
+                for extracted in extract.extract(extract_method, src_file,
+                                                 keywords=extract_keywords):
+                    # Babel 0.9.6 yields lineno, message, comments
+                    # Babel 1.3 yields lineno, message, comments, context
+                    lineno, message, comments = extracted[:3] 
                      push_translation(module, trans_type, display_path, lineno,
                                       encode(message), comments + extra_comments)
              except Exception:
@@ -855,8 +883,9 @@ def trans_generate(lang, modules, cr):
          for root, dummy, files in osutil.walksymlinks(path):
              for fname in fnmatch.filter(files, '*.py'):
                  babel_extract_terms(fname, path, root)
+            # mako provides a babel extractor: http://docs.makotemplates.org/en/latest/usage.html#babel
              for fname in fnmatch.filter(files, '*.mako'):
-                babel_extract_terms(fname, path, root, trans_type='report')
+                babel_extract_terms(fname, path, root, 'mako', trans_type='report')
              # Javascript source files in the static/src/js directory, rest is ignored (libs)
              if fnmatch.fnmatch(root, '*/static/src/js*'):
                  for fname in fnmatch.filter(files, '*.js'):
@@ -897,9 +926,9 @@ def trans_load_data(cr, fileobj, fileformat, lang, lang_name=None, verbose=True,
      if context is None:
          context = {}
      db_name = cr.dbname
-    pool = pooler.get_pool(db_name)
-    lang_obj = pool.get('res.lang')
-    trans_obj = pool.get('ir.translation')
+    registry = openerp.registry(db_name)
+    lang_obj = registry.get('res.lang')
+    trans_obj = registry.get('ir.translation')
      iso_lang = misc.get_iso_codes(lang)
      try:
          ids = lang_obj.search(cr, SUPERUSER_ID, [('code','=', lang)])
@@ -908,6 +937,10 @@ def trans_load_data(cr, fileobj, fileformat, lang, lang_name=None, verbose=True,
              # lets create the language with locale information
              lang_obj.load_lang(cr, SUPERUSER_ID, lang=lang, lang_name=lang_name)
  
+        # Parse also the POT: it will possibly provide additional targets.
+        # (Because the POT comments are correct on Launchpad but not the
+        # PO comments due to a Launchpad limitation. See LP bug 933496.)
+        pot_reader = []
  
          # now, the serious things: we read the language file
          fileobj.seek(0)
@@ -920,19 +953,42 @@ def trans_load_data(cr, fileobj, fileformat, lang, lang_name=None, verbose=True,
          elif fileformat == 'po':
              reader = TinyPoFile(fileobj)
              f = ['type', 'name', 'res_id', 'src', 'value', 'comments']
+
+            # Make a reader for the POT file. Be defensive for the stable branch:
+            # any failure to locate or open the POT file is silently ignored.
+            if fileobj.name.endswith('.po'):
+                try:
+                    # Normally the path looks like /path/to/xxx/i18n/lang.po
+                    # and we try to find the corresponding
+                    # /path/to/xxx/i18n/xxx.pot file.
+                    head, _ = os.path.split(fileobj.name)
+                    head2, _ = os.path.split(head)
+                    head3, tail3 = os.path.split(head2)
+                    pot_handle = misc.file_open(os.path.join(head3, tail3, 'i18n', tail3 + '.pot'))
+                    pot_reader = TinyPoFile(pot_handle)
+                except:
+                    pass
+
          else:
              _logger.error('Bad file format: %s', fileformat)
              raise Exception(_('Bad file format'))
  
+        # Read the POT `reference` comments, and keep them indexed by source
+        # string.
+        pot_targets = {}
+        for type, name, res_id, src, _, comments in pot_reader:
+            if type is not None:
+                pot_targets.setdefault(src, {'value': None, 'targets': []})
+                pot_targets[src]['targets'].append((type, name, res_id))
+
          # read the rest of the file
-        line = 1
          irt_cursor = trans_obj._get_import_cursor(cr, SUPERUSER_ID, context=context)
  
-        for row in reader:
-            line += 1
+        def process_row(row):
+            """Process a single PO (or POT) entry."""
              # skip empty rows and rows where the translation field (=last fiefd) is empty
              #if (not row) or (not row[-1]):
-            #    continue
+            #    return
  
              # dictionary which holds values for this line of the csv file
              # {'lang': ..., 'type': ..., 'name': ..., 'res_id': ...,
@@ -942,9 +998,17 @@ def trans_load_data(cr, fileobj, fileformat, lang, lang_name=None, verbose=True,
              for i, field in enumerate(f):
                  dic[field] = row[i]
  
+            # Get the `reference` comments from the POT.
+            src = row[3]
+            if pot_reader and src in pot_targets:
+                pot_targets[src]['targets'] = filter(lambda x: x != row[:3], pot_targets[src]['targets'])
+                pot_targets[src]['value'] = row[4]
+                if not pot_targets[src]['targets']:
+                    del pot_targets[src]
+
              # This would skip terms that fail to specify a res_id
              if not dic.get('res_id'):
-                continue
+                return
  
              res_id = dic.pop('res_id')
              if res_id and isinstance(res_id, (int, long)) \
@@ -965,7 +1029,23 @@ def trans_load_data(cr, fileobj, fileformat, lang, lang_name=None, verbose=True,
  
              irt_cursor.push(dic)
  
+        # First process the entries from the PO file (doing so also fills/removes
+        # the entries from the POT file).
+        for row in reader:
+            process_row(row)
+
+        # Then process the entries implied by the POT file (which is more
+        # correct w.r.t. the targets) if some of them remain.
+        pot_rows = []
+        for src in pot_targets:
+            value = pot_targets[src]['value']
+            for type, name, res_id in pot_targets[src]['targets']:
+                pot_rows.append((type, name, res_id, src, value, comments))
+        for row in pot_rows:
+            process_row(row)
+
          irt_cursor.finish()
+        trans_obj.clear_caches()
          if verbose:
              _logger.info("translation file loaded succesfully")
      except IOError:
@@ -1019,11 +1099,10 @@ def load_language(cr, lang):
      :param lang: language ISO code with optional _underscore_ and l10n flavor (ex: 'fr', 'fr_BE', but not 'fr-BE')
      :type lang: str
      """
-    pool = pooler.get_pool(cr.dbname)
-    language_installer = pool.get('base.language.install')
-    uid = 1
-    oid = language_installer.create(cr, uid, {'lang': lang})
-    language_installer.lang_install(cr, uid, [oid], context=None)
+    registry = openerp.registry(cr.dbname)
+    language_installer = registry['base.language.install']
+    oid = language_installer.create(cr, SUPERUSER_ID, {'lang': lang})
+    language_installer.lang_install(cr, SUPERUSER_ID, [oid], context=None)
  
  # vim:expandtab:smartindent:tabstop=4:softtabstop=4:shiftwidth=4: