Index: sitescripts/filterhits/common.py |
diff --git a/sitescripts/filterhits/common.py b/sitescripts/filterhits/common.py |
new file mode 100644 |
index 0000000000000000000000000000000000000000..8c3a651cd032c8e108de370141fbecd11000cf7e |
--- /dev/null |
+++ b/sitescripts/filterhits/common.py |
@@ -0,0 +1,80 @@ |
+# coding: utf-8 |
+ |
+# This file is part of the Adblock Plus web scripts, |
+# Copyright (C) 2006-2014 Eyeo GmbH |
+# |
+# Adblock Plus is free software: you can redistribute it and/or modify |
+# it under the terms of the GNU General Public License version 3 as |
+# published by the Free Software Foundation. |
+# |
+# Adblock Plus is distributed in the hope that it will be useful, |
+# but WITHOUT ANY WARRANTY; without even the implied warranty of |
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
+# GNU General Public License for more details. |
+# |
+# You should have received a copy of the GNU General Public License |
+# along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>. |
+ |
+from datetime import datetime |
+import json, tempfile, os |
+ |
def showError(message, start_response, status="400 Processing Error"):
    """
    Start a plain-text WSGI response carrying an error message.

    ``start_response`` is called with ``status`` and a single
    Content-Type header declaring UTF-8 plain text. The return value is
    a one-element list holding ``message`` encoded as UTF-8.
    """
    response_headers = [("Content-Type", "text/plain; charset=utf-8")]
    start_response(status, response_headers)
    encoded_message = message.encode("utf-8")
    return [encoded_message]
+ |
def valid_filter_hit(filter_hit):
    """
    Return True if a single filter hit entry has the expected shape.

    The entry has to be a dict whose "thirdParty" and "firstParty" values
    are dicts and whose "subscriptions" value is a list or a tuple. The
    contents of those containers are not inspected.
    """
    if not isinstance(filter_hit, dict):
        return False

    expected_types = (
        ("thirdParty", dict),
        ("firstParty", dict),
        ("subscriptions", (list, tuple)),
    )
    for key, types in expected_types:
        if key not in filter_hit:
            return False
        if not isinstance(filter_hit[key], types):
            return False
    return True
+ |
def valid_log_data(data):
    """
    Return True if the filterhits data passed is structured roughly OK.

    The data has to be a dict containing all the expected top-level keys,
    and "filters" has to be a dict in which every value passes
    valid_filter_hit(). The values stored under the other top-level keys
    are not inspected.
    """
    required_keys = (
        "version",
        "timeSincePush",
        "addonName",
        "addonVersion",
        "application",
        "applicationVersion",
        "platform",
        "platformVersion",
        "filters",
    )

    if not isinstance(data, dict):
        return False
    if not all(key in data for key in required_keys):
        return False

    filters = data["filters"]
    if not isinstance(filters, dict):
        return False

    # Check every entry instead of an arbitrary one: dict ordering is not
    # something to rely on, so sampling a single value made the outcome
    # for partially malformed data unpredictable. An empty dict is valid.
    return all(valid_filter_hit(hit) for hit in filters.values())
+ |
def datetime_to_timestamp(dt):
    """
    Convert a datetime to whole seconds since the Unix epoch.

    A naive datetime is interpreted as UTC. A timezone-aware datetime is
    converted to UTC first. Microseconds are discarded.
    """
    # Imported locally so this function does not depend on a change to
    # the module-level import list.
    import calendar

    # utctimetuple() normalises aware datetimes to UTC and passes naive
    # ones through unchanged; timegm() is the UTC counterpart of
    # time.mktime(), so no epoch constant has to be spelled out here.
    return calendar.timegm(dt.utctimetuple())
Sebastian Noack
2015/02/11 16:00:12
Hardcoding the epoch looks like a hack to me. Did
kzar
2015/02/17 10:52:24
Done.
|
+ |
def log_filterhits(data, basepath, query_string):
    """
    Log the provided filterhits data as JSON to a new file.

    The file is created inside a directory below basepath named after the
    current date (YYYY-MM-DD). Its name starts with the current timestamp
    followed by "-" and ends in ".log"; tempfile fills in the part in
    between so every call gets a file of its own. A single line holding
    the time, the quoted query string and the JSON-encoded data is
    written to it.

    Returns the path of the file that was written. Raises OSError if the
    directory cannot be created.
    """
    # Imported locally so this function does not depend on a change to
    # the module-level import list.
    import errno

    # NOTE(review): `now` is a naive datetime, so the %z directive below
    # renders as an empty string - confirm whether an explicit UTC offset
    # is wanted in the log line.
    now = datetime.now()
    path = os.path.join(basepath, now.strftime("%Y-%m-%d"))

    # Attempt the creation and tolerate "already exists" instead of
    # testing for existence first: with an exists() check two concurrent
    # calls could both see the directory missing and one of them would
    # then fail inside makedirs().
    try:
        os.makedirs(path)
    except OSError as e:
        if e.errno != errno.EEXIST or not os.path.isdir(path):
            raise

    with tempfile.NamedTemporaryFile(
        prefix=str(datetime_to_timestamp(now)) + "-",
        suffix=".log",
        dir=path,
        delete=False
    ) as f:
        f.write("[%s] \"%s\" %s\n" % (now.strftime('%d/%b/%Y:%H:%M:%S %z'),
                                      query_string, json.dumps(data)))
        return f.name