Left: | ||
Right: |
LEFT | RIGHT |
---|---|
1 # coding: utf-8 | 1 # coding: utf-8 |
2 | 2 |
3 # This file is part of the Adblock Plus web scripts, | 3 # This file is part of the Adblock Plus web scripts, |
4 # Copyright (C) 2006-2013 Eyeo GmbH | 4 # Copyright (C) 2006-2013 Eyeo GmbH |
5 # | 5 # |
6 # Adblock Plus is free software: you can redistribute it and/or modify | 6 # Adblock Plus is free software: you can redistribute it and/or modify |
7 # it under the terms of the GNU General Public License version 3 as | 7 # it under the terms of the GNU General Public License version 3 as |
8 # published by the Free Software Foundation. | 8 # published by the Free Software Foundation. |
9 # | 9 # |
10 # Adblock Plus is distributed in the hope that it will be useful, | 10 # Adblock Plus is distributed in the hope that it will be useful, |
(...skipping 25 matching lines...) Expand all Loading... | |
36 "'": "'", | 36 "'": "'", |
37 } | 37 } |
38 | 38 |
39 class Converter: | 39 class Converter: |
40 def __init__(self, params, key="pagedata"): | 40 def __init__(self, params, key="pagedata"): |
41 self._params = params | 41 self._params = params |
42 self._key = key | 42 self._key = key |
43 | 43 |
44 # Read in any parameters specified at the beginning of the file | 44 # Read in any parameters specified at the beginning of the file |
45 lines = params[key].splitlines(True) | 45 lines = params[key].splitlines(True) |
46 while len(lines) and re.search(r"^\s*[\w\-]+\s*=", lines[0]): | 46 while lines and re.search(r"^\s*[\w\-]+\s*=", lines[0]): |
47 name, value = lines.pop(0).split("=", 1) | 47 name, value = lines.pop(0).split("=", 1) |
48 params[name.strip()] = value.strip() | 48 params[name.strip()] = value.strip() |
49 params[key] = "".join(lines) | 49 params[key] = "".join(lines) |
50 | 50 |
51 def insert_localized_strings(self, text, escapes): | 51 def localize_string(self, name, localedata, escapes, links=[]): |
52 def escape(s): | 52 def escape(s): |
53 return re.sub(r".", | 53 return re.sub(r".", |
54 lambda match: escapes.get(match.group(0), match.group(0)), | 54 lambda match: escapes.get(match.group(0), match.group(0)), |
55 s, flags=re.S) | 55 s, flags=re.S) |
56 | 56 def re_escape(s): |
57 return re.escape(escape(s)) | |
58 | |
59 try: | |
60 result = localedata[name].strip() | |
61 except KeyError: | |
62 raise Exception("Lookup failed for string %s used on page %s" % (name, self._params["page"])) | |
63 | |
64 # Insert links | |
65 result = escape(result) | |
66 while links: | |
67 result = re.sub( | |
68 r"%s([^<>]*?)%s" % (re_escape("<a>"), re_escape("</a>")), | |
69 r'<a href="%s">\1</a>' % links.pop(0), | |
70 result, 1, flags=re.S | |
71 ) | |
72 | |
73 # <strong> and <em> tags are allowed | |
74 result = re.sub( | |
75 r"%s([^<>]*?)%s" % (re_escape("<strong>"), re_escape("</strong>")), | |
76 r"<strong>\1</strong>", | |
77 result, flags=re.S | |
78 ) | |
79 result = re.sub( | |
80 r"%s([^<>]*?)%s" % (re_escape("<em>"), re_escape("</em>")), | |
81 r"<em>\1</em>", | |
82 result, flags=re.S | |
83 ) | |
84 return result | |
85 | |
86 def insert_localized_strings(self, text, escapes): | |
57 def lookup_string(match): | 87 def lookup_string(match): |
58 name, links = match.groups() | 88 name, links = match.groups() |
59 try: | |
60 result = self._params["localedata"][name].strip() | |
61 except KeyError: | |
62 raise Exception("Lookup failed for string %s used on page %s" % (name, self._params["page"])) | |
63 | |
64 result = escape(result) | |
65 if links: | 89 if links: |
66 links = map(unicode.strip, links.strip("()").split(",")) | 90 links = map(unicode.strip, links.strip("()").split(",")) |
67 while len(links): | 91 else: |
Sebastian Noack
2013/10/29 11:04:17
len() isn't needed here. Lists evaluate to True wh
| |
68 result = re.sub( | 92 links = [] |
69 r"%s(.*?)%s" % (escape("<a>"), escape("</a>")), | 93 return self.localize_string(name, self._params["localedata"], escapes, links) |
70 r'<a href="%s">\1</a>' % links.pop(0), | |
71 result, 1, flags=re.S | |
72 ) | |
73 return result | |
74 | 94 |
75 return re.sub( | 95 return re.sub( |
76 r"\$([\w\-]+)(\([^()$]+\))?\$", | 96 r"\$([\w\-]+)(\([^()$]+\))?\$", |
77 lookup_string, | 97 lookup_string, |
78 text | 98 text |
79 ) | 99 ) |
80 | 100 |
81 def process_links(self, text): | 101 def process_links(self, text): |
82 def process_link(match): | 102 def process_link(match): |
83 pre, attr, url, post = match.groups() | 103 pre, attr, url, post = match.groups() |
84 url = jinja2.Markup(url).unescape() | 104 url = jinja2.Markup(url).unescape() |
85 | 105 |
86 locale, new_url = self._params["source"].resolve_link(url, self._params["locale"]) | 106 locale, new_url = self._params["source"].resolve_link(url, self._params["locale"]) |
87 if new_url != None: | 107 if new_url != None: |
88 url = new_url | 108 url = new_url |
89 if attr == "href": | 109 if attr == "href": |
90 post += ' hreflang="%s"' % jinja2.Markup.escape(locale) | 110 post += ' hreflang="%s"' % jinja2.Markup.escape(locale) |
91 | 111 |
92 return "".join((pre, jinja2.Markup.escape(url), post)) | 112 return "".join((pre, jinja2.Markup.escape(url), post)) |
93 | 113 |
94 text = re.sub(r"(<a [^<>]*\b(href)=\")([^<>\"]+)(\")", process_link, text) | 114 text = re.sub(r"(<a\s[^<>]*\b(href)=\")([^<>\"]+)(\")", process_link, text) |
95 text = re.sub(r"(<img [^<>]*\b(src)=\")([^<>\"]+)(\")", process_link, text) | 115 text = re.sub(r"(<img\s[^<>]*\b(src)=\")([^<>\"]+)(\")", process_link, text) |
96 return text | 116 return text |
97 | 117 |
98 def resolve_includes(self, text): | 118 def resolve_includes(self, text): |
99 def resolve_include(match): | 119 def resolve_include(match): |
100 global converters | 120 global converters |
101 name = match.group(1) | 121 name = match.group(1) |
102 for format, converter_class in converters.iteritems(): | 122 for format, converter_class in converters.iteritems(): |
103 if self._params["source"].has_include(name, format): | 123 if self._params["source"].has_include(name, format): |
104 self._params["includedata"] = self._params["source"].read_include(name, format) | 124 self._params["includedata"] = self._params["source"].read_include(name, format) |
105 converter = converter_class(self._params, key="includedata") | 125 converter = converter_class(self._params, key="includedata") |
(...skipping 50 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
156 "translate": self.translate, | 176 "translate": self.translate, |
157 "linkify": self.linkify, | 177 "linkify": self.linkify, |
158 "toclist": self.toclist, | 178 "toclist": self.toclist, |
159 } | 179 } |
160 self._env = get_custom_template_environment(filters) | 180 self._env = get_custom_template_environment(filters) |
161 | 181 |
162 def get_html(self, source): | 182 def get_html(self, source): |
163 template = self._env.from_string(source) | 183 template = self._env.from_string(source) |
164 return template.render(self._params) | 184 return template.render(self._params) |
165 | 185 |
166 def translate(self, name, page=None): | 186 def translate(self, name, page=None, links=[]): |
167 if page == None: | 187 if page == None: |
168 localedata = self._params["localedata"] | 188 localedata = self._params["localedata"] |
169 else: | 189 else: |
170 localedata = self._params["source"].read_locale(self._params["locale"], page) | 190 localedata = self._params["source"].read_locale(self._params["locale"], page) |
171 | 191 return jinja2.Markup(self.localize_string(name, localedata, html_escapes, links=links)) |
172 try: | |
173 return localedata[name] | |
174 except KeyError: | |
175 raise Exception("Lookup failed for string %s used on page %s" % (name, self._params["page"])) | |
176 | 192 |
177 def linkify(self, page, locale=None): | 193 def linkify(self, page, locale=None): |
178 if locale == None: | 194 if locale == None: |
179 locale = self._params["locale"] | 195 locale = self._params["locale"] |
180 | 196 |
181 locale, url = self._params["source"].resolve_link(page, locale) | 197 locale, url = self._params["source"].resolve_link(page, locale) |
182 return jinja2.Markup('<a href="%s" hreflang="%s">' % ( | 198 return jinja2.Markup('<a href="%s" hreflang="%s">' % ( |
183 jinja2.Markup.escape(url), | 199 jinja2.Markup.escape(url), |
184 jinja2.Markup.escape(locale) | 200 jinja2.Markup.escape(locale) |
185 )) | 201 )) |
186 | 202 |
187 def toclist(self, content): | 203 def toclist(self, content): |
188 flat = [] | 204 flat = [] |
189 for match in re.finditer(r'<h(\d) [^<>]*\bid="([^<>"]+)"[^<>]*>(.*?)</h\1>', content, re.S): | 205 for match in re.finditer(r'<h(\d)\s[^<>]*\bid="([^<>"]+)"[^<>]*>(.*?)</h\1>', content, re.S): |
Sebastian Noack
2013/10/29 11:04:17
I would use \s instead of a whitespace, after the
| |
190 flat.append({ | 206 flat.append({ |
191 "level": int(match.group(1)), | 207 "level": int(match.group(1)), |
192 "anchor": jinja2.Markup(match.group(2)).unescape(), | 208 "anchor": jinja2.Markup(match.group(2)).unescape(), |
193 "title": jinja2.Markup(match.group(3)).unescape(), | 209 "title": jinja2.Markup(match.group(3)).unescape(), |
194 "subitems": [], | 210 "subitems": [], |
195 }) | 211 }) |
196 | 212 |
197 structured = [] | 213 structured = [] |
198 stack = [{"level": 0, "subitems": structured}] | 214 stack = [{"level": 0, "subitems": structured}] |
199 for item in flat: | 215 for item in flat: |
200 while stack[-1]["level"] >= item["level"]: | 216 while stack[-1]["level"] >= item["level"]: |
201 stack.pop() | 217 stack.pop() |
202 stack[-1]["subitems"].append(item) | 218 stack[-1]["subitems"].append(item) |
203 stack.append(item) | 219 stack.append(item) |
204 return structured | 220 return structured |
205 | 221 |
206 converters = { | 222 converters = { |
207 "raw": RawConverter, | 223 "raw": RawConverter, |
208 "md": MarkdownConverter, | 224 "md": MarkdownConverter, |
209 "tmpl": TemplateConverter, | 225 "tmpl": TemplateConverter, |
210 } | 226 } |
LEFT | RIGHT |