nand2 · hanshuebner · Apr 5, 2014 · Apr 5, 2014 · Apr 5, 2014 · Apr 5, 2014
diff --git a/README.rst b/README.rst
@@ -19,14 +19,25 @@ import throttle;
 DESCRIPTION
 ===========
 
-This vmod most obvious uses are to handle denial of services by a single user (or bot) punching through the cache, or to set rate limits to API calls you provide.
-
-It will allow you to set rate limiting, on several different time windows, per path/IP/whatever you want. If a time window limit was reached, this vmod will return you the time to wait before this call will be authorized.
-With this return information, you can handle rate limit overflow by either abruptly returning an error, or by actually waiting the necessary time if you deems it reasonable, for a smoother rate limit overflow handling.
-
-Please note that at the moment, there is no native way (AFAIK) to wait within Varnish (and no, using sleep() in the VCL is a *bad* idea), so you'll have to hack your way to it, e.g. redirect to a separate server that will wait for you and come back later.
-
-Please read carefully the "Memory management and denial of service" section below to avoid misuses that could lead to denial of services.
+This vmod most obvious uses are to handle denial of services by a
+single user (or bot) punching through the cache, or to set rate limits
+to API calls you provide.
+
+It will allow you to set rate limiting, on several different time
+windows, per path/IP/whatever you want. If a time window limit was
+reached, this vmod will return you the time to wait before this call
+will be authorized.  With this return information, you can handle rate
+limit overflow by either abruptly returning an error, or by actually
+waiting the necessary time if you deems it reasonable, for a smoother
+rate limit overflow handling.
+
+Please note that at the moment, there is no native way (AFAIK) to wait
+within Varnish (and no, using sleep() in the VCL is a *bad* idea), so
+you'll have to hack your way to it, e.g. redirect to a separate server
+that will wait for you and come back later.
+
+Please read carefully the "Memory management and denial of service"
+section below to avoid misuses that could lead to denial of services.
 
     "This is far better than any result I've seen from either HAProxy or Nginx doing layer 7 inspection on such modest [test] hardware."
 
@@ -45,14 +56,23 @@ Prototype
 Arguments
     key: A unique key that will identify what you are throttling. Can be used in may ways. See the examples below.
 
-    rate_limits: A list of different rate limits you want to put on this call. The syntax is the following: "[nb_of_calls]req/[duration][durations_size], ...". Example: "3req/s, 10req/30s, 30req/5m, 100req/h". Please note that we are using the Varnish duration size identifiers: s, m (and not mn/min), h, d. WARNING: You cannot define different rate_limits for a same key. If you do, only the one given in the first call will be used. See API rate limiting example below.
+    rate_limits: A list of different rate limits you want to put on
+    this call. The syntax is the following:
+    "[nb_of_calls]req/[duration][durations_size], ...". Example:
+    "3req/s, 10req/30s, 30req/5m, 100req/h". Please note that we are
+    using the Varnish duration size identifiers: s, m (and not
+    mn/min), h, d. WARNING: You cannot define different rate_limits
+    for a same key. If you do, only the one given in the first call
+    will be used. See API rate limiting example below.
 Return value
 	DURATION
 Description
     Increments the call counters.
     Returns 0.0 if the call was authorized, or the time to wait if one of the time window limit was reached.
 Example
-    Prevent a single user (or crazy googlebot) to make a denial of service by punching through the cache: limit MISS calls on non-static assets by IP, max 3 req/s, 10 req/30s, 30 req/5m::
+    Prevent a single user (or crazy googlebot) to make a denial of
+    service by punching through the cache: limit MISS calls on
+    non-static assets by IP, max 3 req/s, 10 req/30s, 30 req/5m::
 
             sub vcl_miss {
                 if(req.url !~ "\.(jpg|jpeg|png|gif|ico|swf|css|js|html|htm)$") {
@@ -82,6 +102,27 @@ Example
 
     Please note: You cannot set 2 differents set of rate limits for a same key. (If you do, only one will be used, and the other will be ignored). In this example, simply add some extra text to the key to differentiate the authentificated calls from the non-authentificated ones.
 
+set_windows
+-----------
+
+Prototype
+        ::
+
+                set_windows(STRING key, STRING rate_limits)
+Arguments
+    key: A unique key that will identify what you are throttling.
+
+    rate_limits: A list of different rate limits you want to put on
+    this call.
+
+    These arguments have the same meaning like in is_allowed.
+Return value
+	VOID
+Description
+    Create a set of named windows under the given key.  The rule set
+    is marked as being an "explicit" rule, which will enable more
+    logging for it.  It is intended to be used from vcl_init or as
+    part of an internal handler to create global rules.
 
 remaining_calls
 ---------------
@@ -118,36 +159,72 @@ Example
 MEMORY MANAGEMENT AND DENIAL OF SERVICE
 =======================================
 
-If used incorrectly, this tool could let an attacker force Varnish to consume all available memory and crash. It would be too bad to be DoS'ed by a tool that prevents DoS!
-What you need to know is that this vmod will keep in memory the time of the revelant last requests for each key you provide. And this memory is *outside* of the memory you specify to Varnish for caching. (So if you specify 4G of RAM to varnish, this vmod memory will be on top of it.)
+If used incorrectly, this tool could let an attacker force Varnish to
+consume all available memory and crash. It would be too bad to be
+DoS'ed by a tool that prevents DoS!  What you need to know is that
+this vmod will keep in memory the time of the revelant last requests
+for each key you provide. And this memory is *outside* of the memory
+you specify to Varnish for caching. (So if you specify 4G of RAM to
+varnish, this vmod memory will be on top of it.)
 
-For a given key, the amount of necessary memory is at its maximum fixed to the maximum number of request limit you give to this key, multiplied by 16 bytes. For example:: 
+For a given key, the amount of necessary memory is at its maximum
+fixed to the maximum number of request limit you give to this key,
+multiplied by the size of one the internal data structure to keep
+track of a key, currently 56 bytes on a 64 bit system. For example::
 
         if(throttle.is_allowed("pouet", "2req/s, 100req/h, 1000req/d") > 0s)
 
-For the key "pouet", the maximum memory usage will be 1000 (the maximum number between 2, 100, and 1000) multiplied by 16 bytes = 16 kbytes. Now, with a more advanced key::
+For the key "pouet", the maximum memory usage will be 1000 (the
+maximum number between 2, 100, and 1000) multiplied by 56 bytes ~= 56
+kbytes. Now, with a more advanced key::
 
         if(throttle.is_allowed("ip:" + client.ip, "2req/s, 100req/3h, 1000req/d") > 0s)
 
-We now have one key per client IP, which will each consume 16kbytes maximum. That is potentially unlimited. So what you also need to know is that the request times are kept in memory until they get older than the biggest time window: here one day (the biggest between 1s, 3 hours and 1 day).
-So if you take an average of 10,000 differents IP per day, that would cost at the maximum (if every IP was making 1000 calls), 10,000 * 16kbytes = 160 mbytes. That begins to be quite a number. So one can reduce this number by keeping request limits lower. For example::
+We now have one key per client IP, which will each consume ~56kbytes
+maximum. That is potentially unlimited. So what you also need to know
+is that the request times are kept in memory until they get older than
+the biggest time window: here one day (the biggest between 1s, 3 hours
+and 1 day).  So if you take an average of 10,000 differents IP per
+day, that would cost at the maximum (if every IP was making 1000
+calls), 10,000 * 56kbytes ~= 560 mbytes. That begins to be quite a
+number. So one can reduce this number by keeping request limits
+lower. For example::
 
         if(throttle.is_allowed("ip:" + client.ip, "2req/s, 30req/h") > 0s)
 
-This would reduce the maximum memory consumption, with 10,000 differents IP per day, to 10,000 * 30 * 16 = 4.8 mbytes. Much better. But wait! Now that we no longer have the 1 day window, the request times will only be kept for the new largest window, 1 hour. So if we have around 1,000 different IP per hour, that makes a maximum memory consumption of 1,000 * 30 * 16 = 480 kbytes. Muuch better! So we see that the time window sizes and lengths has a big impact on memory consumption.
-
-With the following example, we are theorically still open to distributed denial of service due to this vmod, but with the required number of necessary clients to consume all memory, it is much more likely that your backend services will fall and crash first. (And remember, we only use at maximum a fixed amount of memory per key, whatever the number of calls for this key).
-
-When we begin to be vulnerable to denial of service by a single user is when a single user can have an unlimited number of keys::
+This would reduce the maximum memory consumption, with 10,000
+differents IP per day, to 10,000 * 30 * 56 ~= 16.8 mbytes. Much
+better. But wait! Now that we no longer have the 1 day window, the
+request times will only be kept for the new largest window, 1 hour. So
+if we have around 1,000 different IP per hour, that makes a maximum
+memory consumption of 1,000 * 30 * 56 ~= 1,7 mbytes. Muuch better! So
+we see that the time window sizes and lengths has a big impact on
+memory consumption.
+
+With the following example, we are theorically still open to
+distributed denial of service due to this vmod, but with the required
+number of necessary clients to consume all memory, it is much more
+likely that your backend services will fall and crash first. (And
+remember, we only use at maximum a fixed amount of memory per key,
+whatever the number of calls for this key).
+
+When we begin to be vulnerable to denial of service by a single user
+is when a single user can have an unlimited number of keys::
 
         if(throttle.is_allowed("ip:" + client.ip + ":path:" + req.url, "2req/s, 30req/h") > 0s)
 
-With this example, you would limit the request rate per IP and per URL. A single user can thus create an unlimited number of keys, and thus consume an unlimited amount of memory, and make a denial of service by crashing varnish. So if you are in a case when you want to have different rate limits per path, it is a good idea to normalize the paths, and have a limited number of them only. For example::
+With this example, you would limit the request rate per IP and per
+URL. A single user can thus create an unlimited number of keys, and
+thus consume an unlimited amount of memory, and make a denial of
+service by crashing varnish. So if you are in a case when you want to
+have different rate limits per path, it is a good idea to normalize
+the paths, and have a limited number of them only. For example::
 
         if(req.url ~ "^/my_api_path/my_api_name") {
             if(throttle.is_allowed("ip:" + client.ip + ":api:api_name", "2req/s, 30req/h") > 0s)
 
-Finally, if you want to want to track the memory usage of this throttle vmod , you can use this command::
+Finally, if you want to want to track the memory usage of this
+throttle vmod , you can use this command::
 
         if(req.url == "/my_admin_page") {
             set resp.http.X-throttle-memusage = throttle.memory_usage();

diff --git a/debian/.gitignore b/debian/.gitignore
@@ -0,0 +1,4 @@
+files
+libvmod-throttle
+*substvars
+*log
diff --git a/debian/rules b/debian/rules
@@ -1,9 +1,9 @@
 #!/usr/bin/make -f
 export DH_VERBOSE=1
 
-VARNISHSRC = $(DEBIAN_VARNISH_SRC)
-VMODDIR = $(shell PKG_CONFIG_PATH="$(VARNISHSRC)" pkg-config --variable=vmoddir varnishapi)
-VMOD_ABI = $(shell printf '\#include "vmod_abi.h"\nVMOD_ABI_Version' | cpp - -I$(DEBIAN_VARNISH_SRC)/include | sed '/^\#/D;s/"//g;s/\([A-Z]\)/\L\1/g;s/[^a-z0-9.]/-/g;s/varnish/varnishabi/')
+VARNISHSRC ?= $(DEBIAN_VARNISH_SRC)
+VMODDIR ?= $(shell PKG_CONFIG_PATH="$(VARNISHSRC)" pkg-config --variable=vmoddir varnishapi)
+VMOD_ABI ?= $(shell printf '\#include "vmod_abi.h"\nVMOD_ABI_Version' | cpp - -I$(DEBIAN_VARNISH_SRC)/include | sed '/^\#/D;s/"//g;s/\([A-Z]\)/\L\1/g;s/[^a-z0-9.]/-/g;s/varnish/varnishabi/')
 
 override_dh_auto_configure:
 	dh_auto_configure -- VMODDIR="$(VMODDIR)" VARNISHSRC="$(VARNISHSRC)"
@@ -14,7 +14,7 @@ override_dh_gencontrol:
 	if [ -n "$$DEBIAN_OVERRIDE_BINARY_VERSION" ]; then \
 		dh_gencontrol -- -Tdebian/substvars -v$$DEBIAN_OVERRIDE_BINARY_VERSION; \
 	else \
-		dh_gencontrol -Tdebian/substvars; \
+		dh_gencontrol -- -Tdebian/substvars; \
 	fi
 
 %:

diff --git a/package.sh b/package.sh
@@ -0,0 +1,11 @@
+#!/bin/sh
+set -x
+
+export VARNISH_VERSION=${VARNISH_VERSION:="3.0.5"}
+export VARNISHSRC=../varnish-${VARNISH_VERSION}
+export DEBIAN_VARNISH_SRC=$VARNISHSRC
+export VMODDIR=/usr/lib/varnish/vmods
+
+git submodule update --init
+./autogen.sh && ./configure && make
+dpkg-buildpackage -uc -us -b