mirror of
https://github.com/sphinx-doc/sphinx.git
synced 2025-02-25 18:55:22 -06:00
285 lines
10 KiB
Python
285 lines
10 KiB
Python
# -*- coding: utf-8 -*-
|
||
"""
|
||
sphinx.util.i18n
|
||
~~~~~~~~~~~~~~~~
|
||
|
||
Builder superclass for all builders.
|
||
|
||
:copyright: Copyright 2007-2018 by the Sphinx team, see AUTHORS.
|
||
:license: BSD, see LICENSE for details.
|
||
"""
|
||
from __future__ import absolute_import
|
||
|
||
import gettext
|
||
import io
|
||
import os
|
||
import re
|
||
from collections import namedtuple
|
||
from datetime import datetime
|
||
from os import path
|
||
from typing import TYPE_CHECKING
|
||
|
||
import babel.dates
|
||
from babel.messages.mofile import write_mo
|
||
from babel.messages.pofile import read_po
|
||
|
||
from sphinx.errors import SphinxError
|
||
from sphinx.locale import __
|
||
from sphinx.util import logging
|
||
from sphinx.util.osutil import SEP, walk
|
||
|
||
logger = logging.getLogger(__name__)
|
||
|
||
if TYPE_CHECKING:
|
||
from typing import Callable, List, Set # NOQA
|
||
from sphinx.environment import BuildEnvironment # NOQA
|
||
|
||
LocaleFileInfoBase = namedtuple('CatalogInfo', 'base_dir,domain,charset')
|
||
|
||
|
||
class CatalogInfo(LocaleFileInfoBase):
|
||
|
||
@property
|
||
def po_file(self):
|
||
# type: () -> unicode
|
||
return self.domain + '.po'
|
||
|
||
@property
|
||
def mo_file(self):
|
||
# type: () -> unicode
|
||
return self.domain + '.mo'
|
||
|
||
@property
|
||
def po_path(self):
|
||
# type: () -> unicode
|
||
return path.join(self.base_dir, self.po_file)
|
||
|
||
@property
|
||
def mo_path(self):
|
||
# type: () -> unicode
|
||
return path.join(self.base_dir, self.mo_file)
|
||
|
||
def is_outdated(self):
|
||
# type: () -> bool
|
||
return (
|
||
not path.exists(self.mo_path) or
|
||
path.getmtime(self.mo_path) < path.getmtime(self.po_path))
|
||
|
||
def write_mo(self, locale):
|
||
# type: (unicode) -> None
|
||
with io.open(self.po_path, 'rt', encoding=self.charset) as file_po:
|
||
try:
|
||
po = read_po(file_po, locale)
|
||
except Exception as exc:
|
||
logger.warning(__('reading error: %s, %s'), self.po_path, exc)
|
||
return
|
||
|
||
with io.open(self.mo_path, 'wb') as file_mo:
|
||
try:
|
||
write_mo(file_mo, po)
|
||
except Exception as exc:
|
||
logger.warning(__('writing error: %s, %s'), self.mo_path, exc)
|
||
|
||
|
||
def find_catalog(docname, compaction):
|
||
# type: (unicode, bool) -> unicode
|
||
if compaction:
|
||
ret = docname.split(SEP, 1)[0]
|
||
else:
|
||
ret = docname
|
||
|
||
return ret
|
||
|
||
|
||
def find_catalog_files(docname, srcdir, locale_dirs, lang, compaction):
|
||
# type: (unicode, unicode, List[unicode], unicode, bool) -> List[unicode]
|
||
if not(lang and locale_dirs):
|
||
return []
|
||
|
||
domain = find_catalog(docname, compaction)
|
||
files = [gettext.find(domain, path.join(srcdir, dir_), [lang]) # type: ignore
|
||
for dir_ in locale_dirs]
|
||
files = [path.relpath(f, srcdir) for f in files if f] # type: ignore
|
||
return files # type: ignore
|
||
|
||
|
||
def find_catalog_source_files(locale_dirs, locale, domains=None, gettext_compact=False,
|
||
charset='utf-8', force_all=False):
|
||
# type: (List[unicode], unicode, List[unicode], bool, unicode, bool) -> Set[CatalogInfo]
|
||
"""
|
||
:param list locale_dirs:
|
||
list of path as `['locale_dir1', 'locale_dir2', ...]` to find
|
||
translation catalogs. Each path contains a structure such as
|
||
`<locale>/LC_MESSAGES/domain.po`.
|
||
:param str locale: a language as `'en'`
|
||
:param list domains: list of domain names to get. If empty list or None
|
||
is specified, get all domain names. default is None.
|
||
:param boolean gettext_compact:
|
||
* False: keep domains directory structure (default).
|
||
* True: domains in the sub directory will be merged into 1 file.
|
||
:param boolean force_all:
|
||
Set True if you want to get all catalogs rather than updated catalogs.
|
||
default is False.
|
||
:return: [CatalogInfo(), ...]
|
||
"""
|
||
catalogs = set() # type: Set[CatalogInfo]
|
||
|
||
if not locale:
|
||
return catalogs # locale is not specified
|
||
|
||
for locale_dir in locale_dirs:
|
||
if not locale_dir:
|
||
continue # skip system locale directory
|
||
|
||
base_dir = path.join(locale_dir, locale, 'LC_MESSAGES')
|
||
|
||
if not path.exists(base_dir):
|
||
continue # locale path is not found
|
||
|
||
for dirpath, dirnames, filenames in walk(base_dir, followlinks=True):
|
||
filenames = [f for f in filenames if f.endswith('.po')]
|
||
for filename in filenames:
|
||
base = path.splitext(filename)[0]
|
||
domain = path.relpath(path.join(dirpath, base), base_dir)
|
||
if gettext_compact and path.sep in domain:
|
||
domain = path.split(domain)[0]
|
||
domain = domain.replace(path.sep, SEP)
|
||
if domains and domain not in domains:
|
||
continue
|
||
cat = CatalogInfo(base_dir, domain, charset)
|
||
if force_all or cat.is_outdated():
|
||
catalogs.add(cat)
|
||
|
||
return catalogs
|
||
|
||
|
||
# date_format mappings: ustrftime() to bable.dates.format_datetime()
|
||
date_format_mappings = {
|
||
'%a': 'EEE', # Weekday as locale’s abbreviated name.
|
||
'%A': 'EEEE', # Weekday as locale’s full name.
|
||
'%b': 'MMM', # Month as locale’s abbreviated name.
|
||
'%B': 'MMMM', # Month as locale’s full name.
|
||
'%c': 'medium', # Locale’s appropriate date and time representation.
|
||
'%-d': 'd', # Day of the month as a decimal number.
|
||
'%d': 'dd', # Day of the month as a zero-padded decimal number.
|
||
'%-H': 'H', # Hour (24-hour clock) as a decimal number [0,23].
|
||
'%H': 'HH', # Hour (24-hour clock) as a zero-padded decimal number [00,23].
|
||
'%-I': 'h', # Hour (12-hour clock) as a decimal number [1,12].
|
||
'%I': 'hh', # Hour (12-hour clock) as a zero-padded decimal number [01,12].
|
||
'%-j': 'D', # Day of the year as a decimal number.
|
||
'%j': 'DDD', # Day of the year as a zero-padded decimal number.
|
||
'%-m': 'M', # Month as a decimal number.
|
||
'%m': 'MM', # Month as a zero-padded decimal number.
|
||
'%-M': 'm', # Minute as a decimal number [0,59].
|
||
'%M': 'mm', # Minute as a zero-padded decimal number [00,59].
|
||
'%p': 'a', # Locale’s equivalent of either AM or PM.
|
||
'%-S': 's', # Second as a decimal number.
|
||
'%S': 'ss', # Second as a zero-padded decimal number.
|
||
'%U': 'WW', # Week number of the year (Sunday as the first day of the week)
|
||
# as a zero padded decimal number. All days in a new year preceding
|
||
# the first Sunday are considered to be in week 0.
|
||
'%w': 'e', # Weekday as a decimal number, where 0 is Sunday and 6 is Saturday.
|
||
'%-W': 'W', # Week number of the year (Monday as the first day of the week)
|
||
# as a decimal number. All days in a new year preceding the first
|
||
# Monday are considered to be in week 0.
|
||
'%W': 'WW', # Week number of the year (Monday as the first day of the week)
|
||
# as a zero-padded decimal number.
|
||
'%x': 'medium', # Locale’s appropriate date representation.
|
||
'%X': 'medium', # Locale’s appropriate time representation.
|
||
'%y': 'YY', # Year without century as a zero-padded decimal number.
|
||
'%Y': 'YYYY', # Year with century as a decimal number.
|
||
'%Z': 'zzzz', # Time zone name (no characters if no time zone exists).
|
||
'%%': '%',
|
||
}
|
||
|
||
date_format_re = re.compile('(%s)' % '|'.join(date_format_mappings))
|
||
|
||
|
||
def babel_format_date(date, format, locale, formatter=babel.dates.format_date):
|
||
# type: (datetime, unicode, unicode, Callable) -> unicode
|
||
if locale is None:
|
||
locale = 'en'
|
||
|
||
# Check if we have the tzinfo attribute. If not we cannot do any time
|
||
# related formats.
|
||
if not hasattr(date, 'tzinfo'):
|
||
formatter = babel.dates.format_date
|
||
|
||
try:
|
||
return formatter(date, format, locale=locale)
|
||
except (ValueError, babel.core.UnknownLocaleError):
|
||
# fallback to English
|
||
return formatter(date, format, locale='en')
|
||
except AttributeError:
|
||
logger.warning(__('Invalid date format. Quote the string by single quote '
|
||
'if you want to output it directly: %s'), format)
|
||
return format
|
||
|
||
|
||
def format_date(format, date=None, language=None):
|
||
# type: (str, datetime, unicode) -> unicode
|
||
if date is None:
|
||
# If time is not specified, try to use $SOURCE_DATE_EPOCH variable
|
||
# See https://wiki.debian.org/ReproducibleBuilds/TimestampsProposal
|
||
source_date_epoch = os.getenv('SOURCE_DATE_EPOCH')
|
||
if source_date_epoch is not None:
|
||
date = datetime.utcfromtimestamp(float(source_date_epoch))
|
||
else:
|
||
date = datetime.now()
|
||
|
||
result = []
|
||
tokens = date_format_re.split(format)
|
||
for token in tokens:
|
||
if token in date_format_mappings:
|
||
babel_format = date_format_mappings.get(token, '')
|
||
|
||
# Check if we have to use a different babel formatter then
|
||
# format_datetime, because we only want to format a date
|
||
# or a time.
|
||
if token == '%x':
|
||
function = babel.dates.format_date
|
||
elif token == '%X':
|
||
function = babel.dates.format_time
|
||
else:
|
||
function = babel.dates.format_datetime
|
||
|
||
result.append(babel_format_date(date, babel_format, locale=language,
|
||
formatter=function))
|
||
else:
|
||
result.append(token)
|
||
|
||
return "".join(result)
|
||
|
||
|
||
def get_image_filename_for_language(filename, env):
|
||
# type: (unicode, BuildEnvironment) -> unicode
|
||
if not env.config.language:
|
||
return filename
|
||
|
||
filename_format = env.config.figure_language_filename
|
||
d = dict()
|
||
d['root'], d['ext'] = path.splitext(filename)
|
||
dirname = path.dirname(d['root'])
|
||
if dirname and not dirname.endswith(path.sep):
|
||
dirname += path.sep
|
||
d['path'] = dirname
|
||
d['basename'] = path.basename(d['root'])
|
||
d['language'] = env.config.language
|
||
try:
|
||
return filename_format.format(**d)
|
||
except KeyError as exc:
|
||
raise SphinxError('Invalid figure_language_filename: %r' % exc)
|
||
|
||
|
||
def search_image_for_language(filename, env):
|
||
# type: (unicode, BuildEnvironment) -> unicode
|
||
if not env.config.language:
|
||
return filename
|
||
|
||
translated = get_image_filename_for_language(filename, env)
|
||
dirname = path.dirname(env.docname)
|
||
if path.exists(path.join(env.srcdir, dirname, translated)):
|
||
return translated
|
||
else:
|
||
return filename
|