]> git.deb.at Git - deb/hackedgotchi.git/blobdiff - filters/remove-trackers-and-ads.plugin
Add patch from Paul Wise to filter out various unwanted stuff
[deb/hackedgotchi.git] / filters / remove-trackers-and-ads.plugin
diff --git a/filters/remove-trackers-and-ads.plugin b/filters/remove-trackers-and-ads.plugin
new file mode 100644 (file)
index 0000000..84c2a04
--- /dev/null
@@ -0,0 +1,26 @@
+import sys
+import re
+
+data = sys.stdin.read()  # filter input: the whole document arrives on stdin
+
+regexes = [
+       # Blogger tracking images
+       r"""<img [^>]*?src=["']https?://blogger\.googleusercontent\.com/tracker/[^'"]*['"][^>]*>""",
+       # Feedburner ads
+       r"""<p><a href=['"]https?://[a-zA-Z0-9\-\.]*/~a/[a-zA-Z0-9]*\?a=[a-zA-Z0-9]*['"]><img border=['"]0['"] src=['"]https?://[a-zA-Z0-9\.\-]*/~a/[a-zA-Z0-9/]*\?i=[a-zA-Z0-9]*['"]/></a></p>""",
+       # Feedburner tracking images
+       r"""<img [^>]*?src=['"]https?://feeds\.feedburner\.com/~r/[^"']*['"][^>]*>""",
+       # Wordpress tracking images
+       r"""<img [^>]*?src=['"]https?://stats\.wordpress\.com/b\.gif[^"']*['"][^>]*>""",
+       # Amazon tracking images
+       r"""<img [^>]*?src=['"]https?://www\.assoc-amazon\.com/e/ir[^"']*['"][^>]*>""",
+       # Paypal tracking images
+       r"""<img [^>]*?src=['"]https?://www\.paypalobjects\.com/[^/]*/i/scr/pixel\.gif[^"']*['"][^>]*>""",
+       # Other tracking images (width=1 and height=1, either order); triple-quoted as the patterns contain both quote kinds
+       r"""<img [^>]*?width=["']1["'][^>]*?height=["']1["'][^>]*>""",
+       r"""<img [^>]*?height=["']1["'][^>]*?width=["']1["'][^>]*>""",
+]
+
+for regex in regexes: data = re.sub(regex, '', data)  # delete every match of each pattern in turn
+
+sys.stdout.write(data)  # filter output: the cleaned document