Index: sitescripts/web/bin/generate_static_pages.py |
=================================================================== |
new file mode 100644 |
--- /dev/null |
+++ b/sitescripts/web/bin/generate_static_pages.py |
@@ -0,0 +1,89 @@ |
+# coding: utf-8 |
+ |
+# This file is part of the Adblock Plus web scripts, |
+# Copyright (C) 2006-2013 Eyeo GmbH |
+# |
+# Adblock Plus is free software: you can redistribute it and/or modify |
+# it under the terms of the GNU General Public License version 3 as |
+# published by the Free Software Foundation. |
+# |
+# Adblock Plus is distributed in the hope that it will be useful, |
+# but WITHOUT ANY WARRANTY; without even the implied warranty of |
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
+# GNU General Public License for more details. |
+# |
+# You should have received a copy of the GNU General Public License |
+# along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>. |
+ |
+import sys, os, re, codecs |
+from ...utils import setupStderr |
+from ..utils import process_page |
+from ..sources import MercurialSource |
+ |
+def generate_pages(repo, output_dir): |
+ known_files = set() |
+ |
+ def write_file(path_parts, contents, binary=False): |
+ encoding = None if binary else "utf-8" |
+ outfile = os.path.join(output_dir, *path_parts) |
+ if outfile in known_files: |
+ print >>sys.stderr, "Warning: File %s has multiple sources" % outfile |
+ return |
+ known_files.add(outfile) |
+ |
+ if os.path.exists(outfile): |
+ with codecs.open(outfile, "rb", encoding=encoding) as handle: |
+ if handle.read() == contents: |
+ return |
+ |
+ try: |
+ os.makedirs(os.path.dirname(outfile)) |
+ except OSError: |
+ pass |
Sebastian Noack
2013/10/29 11:04:17
I would check if we got EEXIST here and only then
|
+ |
+ with codecs.open(outfile, "wb", encoding=encoding) as handle: |
+ handle.write(contents) |
+ |
+ with MercurialSource(repo) as source: |
+ locales = list(source.list_locales()) |
+ for page, format in source.list_pages(): |
+ for locale in locales: |
+ if source.has_locale(locale, page): |
+ pagedata = process_page(source, locale, page, format) |
+ |
+ # Make sure links to static files are versioned |
+ pagedata = re.sub(r'(<script\s[^<>]*\bsrc="/[^"<>]+)', r"\1?%s" % source.version, pagedata) |
Sebastian Noack
2013/10/29 11:04:17
When you inject text into regular expressions alwa
Wladimir Palant
2013/11/04 09:49:21
I'm not injecting into a regular expression here,
Sebastian Noack
2013/11/04 13:28:18
Yes, you are right.
|
+ pagedata = re.sub(r'(<link\s[^<>]*\bhref="/[^"<>]+)', r"\1?%s" % source.version, pagedata) |
+ pagedata = re.sub(r'(<img\s[^<>]*\bsrc="/[^"<>]+)', r"\1?%s" % source.version, pagedata) |
+ |
+ write_file([locale] + page.split("/"), pagedata) |
+ |
+ for filename in source.list_localizable_files(): |
+ for locale in locales: |
+ if source.has_localizable_file(locale, filename): |
+ filedata = source.read_localizable_file(locale, filename) |
+ write_file([locale] + filename.split("/"), filedata, binary=True) |
+ |
+ for filename in source.list_static(): |
+ write_file(filename.split("/"), source.read_static(filename), binary=True) |
+ |
+ def remove_unknown(dir): |
+ files = os.listdir(dir) |
+ for filename in files: |
+ path = os.path.join(dir, filename) |
+ if os.path.isfile(path) and path not in known_files: |
+ os.remove(path) |
+ elif os.path.isdir(path): |
+ remove_unknown(path) |
+ if not os.listdir(path): |
+ os.rmdir(path) |
Sebastian Noack
2013/10/29 11:04:17
You might want to remove directories recursively.
Wladimir Palant
2013/11/04 09:49:21
We are already removing directories recursively. r
Sebastian Noack
2013/11/04 13:28:18
You are right.
|
+ remove_unknown(output_dir) |
+ |
+if __name__ == "__main__": |
+ setupStderr() |
+ if len(sys.argv) < 3: |
+ print >>sys.stderr, "Usage: %s source_repository output_dir" % sys.argv[0] |
+ sys.exit(1) |
+ |
+ repo, output_dir = sys.argv[1:3] |
+ generate_pages(repo, output_dir) |