aboutsummaryrefslogtreecommitdiffstats
path: root/roles/web/templates/sites/233233.g.conf.j2
diff options
context:
space:
mode:
Diffstat (limited to 'roles/web/templates/sites/233233.g.conf.j2')
-rw-r--r--roles/web/templates/sites/233233.g.conf.j2164
1 files changed, 164 insertions, 0 deletions
diff --git a/roles/web/templates/sites/233233.g.conf.j2 b/roles/web/templates/sites/233233.g.conf.j2
new file mode 100644
index 0000000..1197b9f
--- /dev/null
+++ b/roles/web/templates/sites/233233.g.conf.j2
@@ -0,0 +1,164 @@
+{% set domain = "233233.xyz" %}
+#
+# nginx/sites: reverse proxy to Google Search (with images and webcache)
+#
+# Credit:
+# * Nginx rewrite append a parameter at the end of an URL
+# https://serverfault.com/a/311660/387898
+# * https://github.com/tracycool/Reverse-Proxy-for-Google
+# * https://github.com/caiguanhao/nginx-bypass-gfw/blob/master/google.conf
+#
+# References:
+# * Google Custom Search - CSE parameters list
+# https://developers.google.com/custom-search/json-api/v1/reference/cse/list
+#
+#
+# Aaron LI
+# 2017-05-23
+#
+
+{% if domains_hascert[domain] %}
+server {
+ listen 443 ssl http2;
+ listen [::]:443 ssl http2;
+ server_name g.{{ domain }};
+
+ # SSL/TLS Certificate kindly provided by Let's Encrypt
+ ssl_certificate /usr/local/etc/ssl/acme/{{ domain }}/fullchain.pem;
+ ssl_certificate_key /usr/local/etc/ssl/acme/private/{{ domain }}.pem;
+
+ # Enable caching (currently disabled: the directive is commented out)
+ #proxy_cache CACHE;
+
+ # Tune the buffers used for reading upstream responses
+ proxy_buffer_size 64k;
+ proxy_buffers 4 128k;
+ proxy_busy_buffers_size 128k;
+
+ # Rewrite the domain of upstream cookies from google.com to the
+ # host name this proxy was requested with
+ proxy_cookie_domain google.com $host;
+
+ # Hide some upstream headers to avoid duplicates/overriding
+ proxy_hide_header Strict-Transport-Security;
+ proxy_hide_header Content-Security-Policy;
+ proxy_hide_header X-Frame-Options;
+ proxy_hide_header X-XSS-Protection;
+ proxy_hide_header X-Content-Type-Options;
+ proxy_hide_header Referrer-Policy;
+
+ # Substitute links in contents so that the browser keeps fetching
+ # Google's auxiliary hosts through the "/__g*/" locations of this
+ # server instead of contacting them directly.
+ # NOTE: Require to set Accept-Encoding="" header in order to request
+ # *uncompressed* data from upstream, otherwise won't work!
+ # NOTE: "text/html" is always filtered; "sub_filter_types" only lists
+ # the additional MIME types.
+ sub_filter_types text/css text/javascript application/json;
+ sub_filter_once off;
+ sub_filter //www.google.com/ //$host/;
+ sub_filter //apis.google.com/ //$host/__gapis/;
+ sub_filter //ajax.googleapis.com/ //$host/__gajax/;
+ sub_filter //fonts.googleapis.com/ //$host/__gfonts/;
+ sub_filter //www.gstatic.com/ //$host/__gstatic/www/;
+ sub_filter //ssl.gstatic.com/ //$host/__gstatic/ssl/;
+ # Google Images (thumbnail host)
+ sub_filter //encrypted-tbn0.gstatic.com/ //$host/__gstatic/enc-tbn0/;
+ # Google web cache
+ sub_filter //webcache.googleusercontent.com/ //$host/__gwebcache/;
+
+ # WARNING:
+ # The "proxy_set_header" directives are inherited from the previous
+ # level *if and only if* there are *no* such directives defined on
+ # the current level!
+
+ #
+ # Reverse proxy to Google search and its friends :-)
+ #
+ location / {
+ # Default location: every request not claimed by one of the
+ # "^~ /__g*/" prefix locations is forwarded to Google Search.
+ proxy_pass https://www.google.com;
+
+ # These headers need to be set explicitly, otherwise the browser
+ # will be redirected to Google's own URL, bypassing this proxy...
+ proxy_set_header Host www.google.com;
+ proxy_set_header Referer https://www.google.com;
+ # Set other necessary headers
+ # NOTE: Set Accept-Encoding="" to request *uncompressed* data
+ # from upstream, otherwise "sub_filter" doesn't work!
+ # Credit: https://stackoverflow.com/a/36274259
+ # The Jinja2 block below is rendered here and is also re-emitted in
+ # the other locations through self.proxy_set_header_common(), so
+ # all locations send the same common header set.
+ {% block proxy_set_header_common %}
+ proxy_set_header User-Agent $http_user_agent;
+ proxy_set_header X-Real-IP $remote_addr;
+ proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
+ proxy_set_header X-Forwarded-Proto $scheme;
+ proxy_set_header Cookie "";
+ proxy_set_header Accept-Language "en-US";
+ proxy_set_header Accept-Encoding "";
+ {% endblock %}
+
+ # Append "&gfe_rd=cr&gws_rd=cr" to disable country redirection.
+ # Append "&hl=en" to set interface language to English.
+ #
+ # "rewrite" matches against URL's *path* part only, which means
+ # "$1" will *not* contain the query string. And Nginx appends
+ # original query string to the rewrite replacement by default.
+ #
+ # Credit: https://serverfault.com/a/311660/387898
+ rewrite ^(.*)$ $1?gfe_rd=cr&gws_rd=cr&hl=en break;
+ }
+
+ location ^~ /__gwebcache/ {
+ # Proxy for webcache.googleusercontent.com; the server-level
+ # "sub_filter" rule rewrites links to that host onto this prefix.
+ # ^~ will make location search stop here if matched.
+ proxy_pass https://webcache.googleusercontent.com/;
+ # Note the trailing '/' above, which tells Nginx to strip the
+ # matched URI.
+ # Credit: https://serverfault.com/a/725433/387898
+
+ # Present the upstream's own name as Host and Referer.
+ proxy_set_header Host webcache.googleusercontent.com;
+ proxy_set_header Referer https://webcache.googleusercontent.com;
+ # NOTE: The upper level "proxy_set_header" directives are *not*
+ # inherited since there are such directives on this level!
+ {{ self.proxy_set_header_common() }}
+ }
+ location ^~ /__gstatic/ssl/ {
+ # Proxy for ssl.gstatic.com; the trailing '/' on "proxy_pass" strips
+ # the matched "/__gstatic/ssl/" prefix before forwarding.
+ proxy_pass https://ssl.gstatic.com/;
+ # Present the upstream's own name as Host and Referer.
+ proxy_set_header Host ssl.gstatic.com;
+ proxy_set_header Referer https://ssl.gstatic.com;
+ # Re-emit the common header set (not inherited on this level).
+ {{ self.proxy_set_header_common() }}
+ }
+ location ^~ /__gstatic/www/ {
+ # Proxy for www.gstatic.com; the trailing '/' on "proxy_pass" strips
+ # the matched "/__gstatic/www/" prefix before forwarding.
+ proxy_pass https://www.gstatic.com/;
+ # Host and Referer must name the host actually proxied to
+ # (www.gstatic.com, not ssl.gstatic.com).
+ proxy_set_header Host www.gstatic.com;
+ proxy_set_header Referer https://www.gstatic.com;
+ # Re-emit the common header set (not inherited on this level).
+ {{ self.proxy_set_header_common() }}
+ }
+ location ^~ /__gstatic/enc-tbn0/ {
+ # Proxy for encrypted-tbn0.gstatic.com; the trailing '/' on
+ # "proxy_pass" strips the matched prefix before forwarding.
+ proxy_pass https://encrypted-tbn0.gstatic.com/;
+ # Present the upstream's own name as Host and Referer.
+ proxy_set_header Host encrypted-tbn0.gstatic.com;
+ proxy_set_header Referer https://encrypted-tbn0.gstatic.com;
+ # Re-emit the common header set (not inherited on this level).
+ {{ self.proxy_set_header_common() }}
+ }
+ location ^~ /__gapis/ {
+ # Proxy for apis.google.com; the trailing '/' on "proxy_pass" strips
+ # the matched "/__gapis/" prefix before forwarding.
+ proxy_pass https://apis.google.com/;
+ # Present the upstream's own name as Host and Referer.
+ proxy_set_header Host apis.google.com;
+ proxy_set_header Referer https://apis.google.com;
+ # Re-emit the common header set (not inherited on this level).
+ {{ self.proxy_set_header_common() }}
+ }
+ location ^~ /__gfonts/ {
+ # Proxy for fonts.googleapis.com; the trailing '/' on "proxy_pass"
+ # strips the matched "/__gfonts/" prefix before forwarding.
+ proxy_pass https://fonts.googleapis.com/;
+ # Present the upstream's own name as Host and Referer.
+ proxy_set_header Host fonts.googleapis.com;
+ proxy_set_header Referer https://fonts.googleapis.com;
+ # Re-emit the common header set (not inherited on this level).
+ {{ self.proxy_set_header_common() }}
+ }
+ location ^~ /__gajax/ {
+ # Proxy for ajax.googleapis.com; the trailing '/' on "proxy_pass"
+ # strips the matched "/__gajax/" prefix before forwarding.
+ proxy_pass https://ajax.googleapis.com/;
+ # Present the upstream's own name as Host and Referer.
+ proxy_set_header Host ajax.googleapis.com;
+ proxy_set_header Referer https://ajax.googleapis.com;
+ # Re-emit the common header set (not inherited on this level).
+ {{ self.proxy_set_header_common() }}
+ }
+
+ # Forbid spiders: answer 403 to any request whose User-Agent matches
+ # (case-insensitively, via "~*") one of the crawler names listed below.
+ if ($http_user_agent ~* "qihoobot|Baiduspider|Googlebot|Googlebot-Mobile|Googlebot-Image|Mediapartners-Google|Adsbot-Google|Feedfetcher-Google|Yahoo! Slurp|Yahoo! Slurp China|YoudaoBot|Sosospider|Sogou spider|Sogou web spider|MSNBot|ia_archiver|Tomato Bot") {
+ return 403;
+ }
+
+ location /robots.txt {
+ # Serve a fixed robots.txt directly from Nginx (not proxied) that
+ # asks all user agents not to crawl anything on this host.
+ default_type text/plain;
+ return 200 "User-agent: *\nDisallow: /\n";
+ }
+}
+{% endif %}