| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  | <?php | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /** | 
					
						
							|  |  |  |  * Handle request startup, before loading the environment or libraries. This | 
					
						
							|  |  |  |  * class bootstraps the request state up to the point where we can enter | 
					
						
							|  |  |  |  * Phabricator code. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * NOTE: This class MUST NOT have any dependencies. It runs before libraries | 
					
						
							|  |  |  |  * load. | 
					
						
							|  |  |  |  * | 
					
						
							| 
									
										
											  
											
												Rate limit requests by IP
Summary:
Fixes T3923. On `secure.phabricator.com`, we occasionally get slowed to a crawl when someone runs a security scanner against us, or 5 search bots decide to simultaneously index every line of every file in Diffusion.
Every time a user makes a request, give their IP address some points. If they get too many points in 5 minutes, start blocking their requests automatically for a while.
We give fewer points for logged in requests. We could further refine this (more points for a 404, more points for a really slow page, etc.) but let's start simply.
Also, provide a mechanism for configuring this, and configuring the LB environment stuff at the same time (this comes up rarely, but we don't have a good answer right now).
Test Plan: Used `ab` and reloading over and over again to hit rate limits. Read documentation.
Reviewers: btrahan
Reviewed By: btrahan
Subscribers: chad, epriestley
Maniphest Tasks: T3923
Differential Revision: https://secure.phabricator.com/D8713
											
										 
											2014-04-08 18:36:21 -07:00
										 |  |  |  * Rate Limiting | 
					
						
							|  |  |  |  * ============= | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Phabricator limits the rate at which clients can request pages, and issues | 
					
						
							|  |  |  |  * HTTP 429 "Too Many Requests" responses if clients request too many pages too | 
					
						
							|  |  |  |  * quickly. Although this is not a complete defense against high-volume attacks, | 
					
						
							|  |  |  |  * it can protect an install against aggressive crawlers, security scanners, | 
					
						
							|  |  |  |  * and some types of malicious activity. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * To perform rate limiting, each page increments a score counter for the | 
					
						
							|  |  |  |  * requesting user's IP. The page can give the IP more points for an expensive | 
					
						
							|  |  |  |  * request, or fewer for an authenticated request. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Score counters are kept in buckets, and writes move to a new bucket every | 
					
						
							|  |  |  |  * minute. After a few minutes (defined by @{method:getRateLimitBucketCount}), | 
					
						
							|  |  |  |  * the oldest bucket is discarded. This provides a simple mechanism for keeping | 
					
						
							|  |  |  |  * track of scores without needing to store, access, or read very much data. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Users are allowed to accumulate up to 1000 points per minute, averaged across | 
					
						
							|  |  |  |  * all of the tracked buckets. | 
					
						
							|  |  |  |  * | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |  * @task info         Accessing Request Information | 
					
						
							|  |  |  |  * @task hook         Startup Hooks | 
					
						
							|  |  |  |  * @task apocalypse   In Case Of Apocalypse | 
					
						
							|  |  |  |  * @task validation   Validation | 
					
						
							| 
									
										
											  
											
												Rate limit requests by IP
Summary:
Fixes T3923. On `secure.phabricator.com`, we occasionally get slowed to a crawl when someone runs a security scanner against us, or 5 search bots decide to simultaneously index every line of every file in Diffusion.
Every time a user makes a request, give their IP address some points. If they get too many points in 5 minutes, start blocking their requests automatically for a while.
We give fewer points for logged in requests. We could further refine this (more points for a 404, more points for a really slow page, etc.) but let's start simply.
Also, provide a mechanism for configuring this, and configuring the LB environment stuff at the same time (this comes up rarely, but we don't have a good answer right now).
Test Plan: Used `ab` and reloading over and over again to hit rate limits. Read documentation.
Reviewers: btrahan
Reviewed By: btrahan
Subscribers: chad, epriestley
Maniphest Tasks: T3923
Differential Revision: https://secure.phabricator.com/D8713
											
										 
											2014-04-08 18:36:21 -07:00
										 |  |  |  * @task ratelimit    Rate Limiting | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |  */ | 
					
						
							|  |  |  | final class PhabricatorStartup { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   private static $startTime; | 
					
						
							|  |  |  |   private static $globals = array(); | 
					
						
							| 
									
										
										
										
											2013-02-11 11:06:59 -08:00
										 |  |  |   private static $capturingOutput; | 
					
						
							| 
									
										
										
										
											2013-06-24 08:21:42 -07:00
										 |  |  |   private static $rawInput; | 
					
						
							| 
									
										
										
										
											2014-04-09 11:52:34 -07:00
										 |  |  | 
 | 
					
						
							|  |  |  |   // TODO: For now, disable rate limiting entirely by default. We need to
 | 
					
						
							|  |  |  |   // iterate on it a bit for Conduit, some of the specific score levels, and
 | 
					
						
							|  |  |  |   // to deal with NAT'd offices.
 | 
					
						
							|  |  |  |   private static $maximumRate = 0; | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* -(  Accessing Request Information  )-------------------------------------- */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * @task info | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function getStartTime() { | 
					
						
							|  |  |  |     return self::$startTime; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-04-02 09:53:56 -07:00
										 |  |  |   /** | 
					
						
							|  |  |  |    * @task info | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function getMicrosecondsSinceStart() { | 
					
						
							|  |  |  |     return (int)(1000000 * (microtime(true) - self::getStartTime())); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |   /** | 
					
						
							|  |  |  |    * @task info | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function setGlobal($key, $value) { | 
					
						
							|  |  |  |     self::validateGlobal($key); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     self::$globals[$key] = $value; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * @task info | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function getGlobal($key, $default = null) { | 
					
						
							|  |  |  |     self::validateGlobal($key); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!array_key_exists($key, self::$globals)) { | 
					
						
							|  |  |  |       return $default; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2013-08-07 16:09:05 -07:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |     return self::$globals[$key]; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-06-24 08:21:42 -07:00
										 |  |  |   /** | 
					
						
							|  |  |  |    * @task info | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function getRawInput() { | 
					
						
							|  |  |  |     return self::$rawInput; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  | /* -(  Startup Hooks  )------------------------------------------------------ */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * @task hook | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function didStartup() { | 
					
						
							|  |  |  |     self::$startTime = microtime(true); | 
					
						
							|  |  |  |     self::$globals = array(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     static $registered; | 
					
						
							|  |  |  |     if (!$registered) { | 
					
						
							|  |  |  |       // NOTE: This protects us against multiple calls to didStartup() in the
 | 
					
						
							|  |  |  |       // same request, but also against repeated requests to the same
 | 
					
						
							|  |  |  |       // interpreter state, which we may implement in the future.
 | 
					
						
							|  |  |  |       register_shutdown_function(array(__CLASS__, 'didShutdown')); | 
					
						
							|  |  |  |       $registered = true; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2012-12-25 06:15:28 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     self::setupPHP(); | 
					
						
							|  |  |  |     self::verifyPHP(); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
											  
											
												Rate limit requests by IP
Summary:
Fixes T3923. On `secure.phabricator.com`, we occasionally get slowed to a crawl when someone runs a security scanner against us, or 5 search bots decide to simultaneously index every line of every file in Diffusion.
Every time a user makes a request, give their IP address some points. If they get too many points in 5 minutes, start blocking their requests automatically for a while.
We give fewer points for logged in requests. We could futher refine this (more points for a 404, more points for a really slow page, etc.) but let's start simply.
Also, provide a mechanism for configuring this, and configuring the LB environment stuff at the same time (this comes up rarely, but we don't have a good answer right now).
Test Plan: Used `ab` and reloading over and over again to hit rate limits. Read documentation.
Reviewers: btrahan
Reviewed By: btrahan
Subscribers: chad, epriestley
Maniphest Tasks: T3923
Differential Revision: https://secure.phabricator.com/D8713
											
										 
											2014-04-08 18:36:21 -07:00
										 |  |  |     if (isset($_SERVER['REMOTE_ADDR'])) { | 
					
						
							|  |  |  |       self::rateLimitRequest($_SERVER['REMOTE_ADDR']); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-08-04 18:07:35 -07:00
										 |  |  |     self::normalizeInput(); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:15:28 -08:00
										 |  |  |     self::verifyRewriteRules(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     self::detectPostMaxSizeTriggered(); | 
					
						
							| 
									
										
										
										
											2013-02-11 11:06:59 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     self::beginOutputCapture(); | 
					
						
							| 
									
										
										
										
											2013-06-24 08:21:42 -07:00
										 |  |  | 
 | 
					
						
							|  |  |  |     self::$rawInput = (string)file_get_contents('php://input'); | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * @task hook | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function didShutdown() { | 
					
						
							|  |  |  |     $event = error_get_last(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!$event) { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     switch ($event['type']) { | 
					
						
							|  |  |  |       case E_ERROR: | 
					
						
							|  |  |  |       case E_PARSE: | 
					
						
							|  |  |  |       case E_COMPILE_ERROR: | 
					
						
							|  |  |  |         break; | 
					
						
							|  |  |  |       default: | 
					
						
							|  |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $msg = ">>> UNRECOVERABLE FATAL ERROR <<<\n\n"; | 
					
						
							|  |  |  |     if ($event) { | 
					
						
							|  |  |  |       // Even though we should be emitting this as text-plain, escape things
 | 
					
						
							|  |  |  |       // just to be sure since we can't really be sure what the program state
 | 
					
						
							|  |  |  |       // is when we get here.
 | 
					
						
							|  |  |  |       $msg .= htmlspecialchars( | 
					
						
							|  |  |  |         $event['message']."\n\n".$event['file'].':'.$event['line'], | 
					
						
							|  |  |  |         ENT_QUOTES, | 
					
						
							|  |  |  |         'UTF-8'); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // flip dem tables
 | 
					
						
							|  |  |  |     $msg .= "\n\n\n"; | 
					
						
							|  |  |  |     $msg .= "\xe2\x94\xbb\xe2\x94\x81\xe2\x94\xbb\x20\xef\xb8\xb5\x20\xc2\xaf". | 
					
						
							|  |  |  |             "\x5c\x5f\x28\xe3\x83\x84\x29\x5f\x2f\xc2\xaf\x20\xef\xb8\xb5\x20". | 
					
						
							|  |  |  |             "\xe2\x94\xbb\xe2\x94\x81\xe2\x94\xbb"; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     self::didFatal($msg); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:15:28 -08:00
										 |  |  |   public static function loadCoreLibraries() { | 
					
						
							|  |  |  |     $phabricator_root = dirname(dirname(__FILE__)); | 
					
						
							|  |  |  |     $libraries_root = dirname($phabricator_root); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $root = null; | 
					
						
							|  |  |  |     if (!empty($_SERVER['PHUTIL_LIBRARY_ROOT'])) { | 
					
						
							|  |  |  |       $root = $_SERVER['PHUTIL_LIBRARY_ROOT']; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     ini_set( | 
					
						
							|  |  |  |       'include_path', | 
					
						
							|  |  |  |       $libraries_root.PATH_SEPARATOR.ini_get('include_path')); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     @include_once $root.'libphutil/src/__phutil_library_init__.php'; | 
					
						
							|  |  |  |     if (!@constant('__LIBPHUTIL__')) { | 
					
						
							|  |  |  |       self::didFatal( | 
					
						
							|  |  |  |         "Unable to load libphutil. Put libphutil/ next to phabricator/, or ". | 
					
						
							|  |  |  |         "update your PHP 'include_path' to include the parent directory of ". | 
					
						
							|  |  |  |         "libphutil/."); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     phutil_load_library('arcanist/src'); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // Load Phabricator itself using the absolute path, so we never end up doing
 | 
					
						
							|  |  |  |     // anything surprising (loading index.php and libraries from different
 | 
					
						
							|  |  |  |     // directories).
 | 
					
						
							|  |  |  |     phutil_load_library($phabricator_root.'/src'); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-02-11 11:06:59 -08:00
										 |  |  | /* -(  Output Capture  )----------------------------------------------------- */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   public static function beginOutputCapture() { | 
					
						
							|  |  |  |     if (self::$capturingOutput) { | 
					
						
							| 
									
										
										
										
											2014-06-09 11:36:49 -07:00
										 |  |  |       self::didFatal('Already capturing output!'); | 
					
						
							| 
									
										
										
										
											2013-02-11 11:06:59 -08:00
										 |  |  |     } | 
					
						
							|  |  |  |     self::$capturingOutput = true; | 
					
						
							|  |  |  |     ob_start(); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   public static function endOutputCapture() { | 
					
						
							|  |  |  |     if (!self::$capturingOutput) { | 
					
						
							|  |  |  |       return null; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     self::$capturingOutput = false; | 
					
						
							|  |  |  |     return ob_get_clean(); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  | /* -(  In Case of Apocalypse  )---------------------------------------------- */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							| 
									
										
										
										
											2014-01-21 14:03:09 -08:00
										 |  |  |    * Fatal the request completely in response to an exception, sending a plain | 
					
						
							|  |  |  |    * text message to the client. Calls @{method:didFatal} internally. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @param   string    Brief description of the exception context, like | 
					
						
							|  |  |  |    *                    `"Rendering Exception"`. | 
					
						
							|  |  |  |    * @param   Exception The exception itself. | 
					
						
							|  |  |  |    * @param   bool      True if it's okay to show the exception's stack trace | 
					
						
							|  |  |  |    *                    to the user. The trace will always be logged. | 
					
						
							|  |  |  |    * @return  exit      This method **does not return**. | 
					
						
							|  |  |  |    * | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |    * @task apocalypse | 
					
						
							|  |  |  |    */ | 
					
						
							| 
									
										
										
										
											2014-01-21 14:03:09 -08:00
										 |  |  |   public static function didEncounterFatalException( | 
					
						
							|  |  |  |     $note, | 
					
						
							|  |  |  |     Exception $ex, | 
					
						
							|  |  |  |     $show_trace) { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $message = '['.$note.'/'.get_class($ex).'] '.$ex->getMessage(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $full_message = $message; | 
					
						
							|  |  |  |     $full_message .= "\n\n"; | 
					
						
							|  |  |  |     $full_message .= $ex->getTraceAsString(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if ($show_trace) { | 
					
						
							|  |  |  |       $message = $full_message; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     self::didFatal($message, $full_message); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Fatal the request completely, sending a plain text message to the client. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @param   string  Plain text message to send to the client. | 
					
						
							|  |  |  |    * @param   string  Plain text message to send to the error log. If not | 
					
						
							|  |  |  |    *                  provided, the client message is used. You can pass a more | 
					
						
							|  |  |  |    *                  detailed message here (e.g., with stack traces) to avoid | 
					
						
							|  |  |  |    *                  showing it to users. | 
					
						
							|  |  |  |    * @return  exit    This method **does not return**. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @task apocalypse | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function didFatal($message, $log_message = null) { | 
					
						
							|  |  |  |     if ($log_message === null) { | 
					
						
							|  |  |  |       $log_message = $message; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-02-11 11:06:59 -08:00
										 |  |  |     self::endOutputCapture(); | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |     $access_log = self::getGlobal('log.access'); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-04-09 11:27:37 -07:00
										 |  |  |     if ($access_log) { | 
					
						
							|  |  |  |       // We may end up here before the access log is initialized, e.g. from
 | 
					
						
							|  |  |  |       // verifyPHP().
 | 
					
						
							| 
									
										
										
										
											2013-05-09 16:08:26 -07:00
										 |  |  |       $access_log->setData( | 
					
						
							|  |  |  |         array( | 
					
						
							|  |  |  |           'c' => 500, | 
					
						
							|  |  |  |         )); | 
					
						
							|  |  |  |       $access_log->write(); | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     header( | 
					
						
							|  |  |  |       'Content-Type: text/plain; charset=utf-8', | 
					
						
							|  |  |  |       $replace = true, | 
					
						
							|  |  |  |       $http_error = 500); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-01-21 14:03:09 -08:00
										 |  |  |     error_log($log_message); | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |     echo $message; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     exit(1); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* -(  Validation  )--------------------------------------------------------- */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							| 
									
										
										
										
											2013-08-04 18:07:35 -07:00
										 |  |  |    * @task validation | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |    */ | 
					
						
							|  |  |  |   private static function setupPHP() { | 
					
						
							|  |  |  |     error_reporting(E_ALL | E_STRICT); | 
					
						
							|  |  |  |     ini_set('memory_limit', -1); | 
					
						
							| 
									
										
										
										
											2014-01-23 14:00:44 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     // If we have libxml, disable the incredibly dangerous entity loader.
 | 
					
						
							|  |  |  |     if (function_exists('libxml_disable_entity_loader')) { | 
					
						
							|  |  |  |       libxml_disable_entity_loader(true); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-08-04 18:07:35 -07:00
										 |  |  |   /** | 
					
						
							|  |  |  |    * @task validation | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function normalizeInput() { | 
					
						
							|  |  |  |     // Replace superglobals with unfiltered versions, disrespect php.ini (we
 | 
					
						
							|  |  |  |     // filter ourselves)
 | 
					
						
							| 
									
										
										
										
											2013-08-05 11:45:21 -07:00
										 |  |  |     $filter = array(INPUT_GET, INPUT_POST, | 
					
						
							|  |  |  |       INPUT_SERVER, INPUT_ENV, INPUT_COOKIE); | 
					
						
							|  |  |  |     foreach ($filter as $type) { | 
					
						
							|  |  |  |       $filtered = filter_input_array($type, FILTER_UNSAFE_RAW); | 
					
						
							|  |  |  |       if (!is_array($filtered)) { | 
					
						
							|  |  |  |         continue; | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |       switch ($type) { | 
					
						
							|  |  |  |         case INPUT_SERVER: | 
					
						
							|  |  |  |           $_SERVER = array_merge($_SERVER, $filtered); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |         case INPUT_GET: | 
					
						
							|  |  |  |           $_GET = array_merge($_GET, $filtered); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |         case INPUT_COOKIE: | 
					
						
							|  |  |  |           $_COOKIE = array_merge($_COOKIE, $filtered); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |         case INPUT_POST: | 
					
						
							|  |  |  |           $_POST = array_merge($_POST, $filtered); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |         case INPUT_ENV; | 
					
						
							|  |  |  |           $_ENV = array_merge($_ENV, $filtered); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |       } | 
					
						
							| 
									
										
										
										
											2013-08-04 18:07:35 -07:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // rebuild $_REQUEST, respecting order declared in ini files
 | 
					
						
							|  |  |  |     $order = ini_get('request_order'); | 
					
						
							|  |  |  |     if (!$order) { | 
					
						
							|  |  |  |       $order = ini_get('variables_order'); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     if (!$order) { | 
					
						
							|  |  |  |       // $_REQUEST will be empty, leave it alone
 | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     $_REQUEST = array(); | 
					
						
							|  |  |  |     for ($i = 0; $i < strlen($order); $i++) { | 
					
						
							|  |  |  |       switch ($order[$i]) { | 
					
						
							|  |  |  |         case 'G': | 
					
						
							|  |  |  |           $_REQUEST = array_merge($_REQUEST, $_GET); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |         case 'P': | 
					
						
							|  |  |  |           $_REQUEST = array_merge($_REQUEST, $_POST); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |         case 'C': | 
					
						
							|  |  |  |           $_REQUEST = array_merge($_REQUEST, $_COOKIE); | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |         default: | 
					
						
							|  |  |  |           // $_ENV and $_SERVER never go into $_REQUEST
 | 
					
						
							|  |  |  |           break; | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   } | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							| 
									
										
										
										
											2013-08-04 18:07:35 -07:00
										 |  |  |    * @task validation | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |    */ | 
					
						
							|  |  |  |   private static function verifyPHP() { | 
					
						
							|  |  |  |     $required_version = '5.2.3'; | 
					
						
							|  |  |  |     if (version_compare(PHP_VERSION, $required_version) < 0) { | 
					
						
							|  |  |  |       self::didFatal( | 
					
						
							|  |  |  |         "You are running PHP version '".PHP_VERSION."', which is older than ". | 
					
						
							|  |  |  |         "the minimum version, '{$required_version}'. Update to at least ". | 
					
						
							|  |  |  |         "'{$required_version}'."); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (get_magic_quotes_gpc()) { | 
					
						
							|  |  |  |       self::didFatal( | 
					
						
							|  |  |  |         "Your server is configured with PHP 'magic_quotes_gpc' enabled. This ". | 
					
						
							|  |  |  |         "feature is 'highly discouraged' by PHP's developers and you must ". | 
					
						
							|  |  |  |         "disable it to run Phabricator. Consult the PHP manual for ". | 
					
						
							|  |  |  |         "instructions."); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2013-07-10 13:20:00 -07:00
										 |  |  | 
 | 
					
						
							|  |  |  |     if (extension_loaded('apc')) { | 
					
						
							|  |  |  |       $apc_version = phpversion('apc'); | 
					
						
							|  |  |  |       $known_bad = array( | 
					
						
							|  |  |  |         '3.1.14' => true, | 
					
						
							|  |  |  |         '3.1.15' => true, | 
					
						
							| 
									
										
										
										
											2013-07-16 11:45:29 -07:00
										 |  |  |         '3.1.15-dev' => true, | 
					
						
							| 
									
										
										
										
											2013-07-10 13:20:00 -07:00
										 |  |  |       ); | 
					
						
							|  |  |  |       if (isset($known_bad[$apc_version])) { | 
					
						
							|  |  |  |         self::didFatal( | 
					
						
							|  |  |  |           "You have APC {$apc_version} installed. This version of APC is ". | 
					
						
							|  |  |  |           "known to be bad, and does not work with Phabricator (it will ". | 
					
						
							|  |  |  |           "cause Phabricator to fatal unrecoverably with nonsense errors). ". | 
					
						
							|  |  |  |           "Downgrade to version 3.1.13."); | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							| 
									
										
										
										
											2013-08-04 18:07:35 -07:00
										 |  |  |    * @task validation | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |    */ | 
					
						
							|  |  |  |   private static function verifyRewriteRules() { | 
					
						
							| 
									
										
										
										
											2013-01-22 17:17:37 -08:00
										 |  |  |     if (isset($_REQUEST['__path__']) && strlen($_REQUEST['__path__'])) { | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (php_sapi_name() == 'cli-server') { | 
					
						
							|  |  |  |       // Compatibility with PHP 5.4+ built-in web server.
 | 
					
						
							|  |  |  |       $url = parse_url($_SERVER['REQUEST_URI']); | 
					
						
							|  |  |  |       $_REQUEST['__path__'] = $url['path']; | 
					
						
							| 
									
										
										
										
											2013-01-22 17:17:37 -08:00
										 |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!isset($_REQUEST['__path__'])) { | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |       self::didFatal( | 
					
						
							|  |  |  |         "Request parameter '__path__' is not set. Your rewrite rules ". | 
					
						
							|  |  |  |         "are not configured correctly."); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2013-01-22 17:17:37 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     if (!strlen($_REQUEST['__path__'])) { | 
					
						
							|  |  |  |       self::didFatal( | 
					
						
							|  |  |  |         "Request parameter '__path__' is set, but empty. Your rewrite rules ". | 
					
						
							|  |  |  |         "are not configured correctly. The '__path__' should always ". | 
					
						
							|  |  |  |         "begin with a '/'."); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							| 
									
										
										
										
											2013-08-04 18:07:35 -07:00
										 |  |  |    * @task validation | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |    */ | 
					
						
							|  |  |  |   private static function validateGlobal($key) { | 
					
						
							|  |  |  |     static $globals = array( | 
					
						
							|  |  |  |       'log.access' => true, | 
					
						
							| 
									
										
										
										
											2013-08-07 16:09:05 -07:00
										 |  |  |       'csrf.salt'  => true, | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  |     ); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (empty($globals[$key])) { | 
					
						
							|  |  |  |       throw new Exception("Access to unknown startup global '{$key}'!"); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:15:28 -08:00
										 |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Detect if this request has had its POST data stripped by exceeding the | 
					
						
							|  |  |  |    * 'post_max_size' PHP configuration limit. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * PHP has a setting called 'post_max_size'. If a POST request arrives with | 
					
						
							|  |  |  |    * a body larger than the limit, PHP doesn't generate $_POST but processes | 
					
						
							|  |  |  |    * the request anyway, and provides no formal way to detect that this | 
					
						
							|  |  |  |    * happened. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * We can still read the entire body out of `php://input`. However according | 
					
						
							|  |  |  |    * to the documentation the stream isn't available for "multipart/form-data" | 
					
						
							|  |  |  |    * (on nginx + php-fpm it appears that it is available, though, at least) so | 
					
						
							|  |  |  |    * any attempt to generate $_POST would be fragile. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @task validation | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function detectPostMaxSizeTriggered() { | 
					
						
							|  |  |  |     // If this wasn't a POST, we're fine.
 | 
					
						
							|  |  |  |     if ($_SERVER['REQUEST_METHOD'] != 'POST') { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // If there's POST data, clearly we're in good shape.
 | 
					
						
							|  |  |  |     if ($_POST) { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // For HTML5 drag-and-drop file uploads, Safari submits the data as
 | 
					
						
							|  |  |  |     // "application/x-www-form-urlencoded". For most files this generates
 | 
					
						
							|  |  |  |     // something in POST because most files decode to some nonempty (albeit
 | 
					
						
							|  |  |  |     // meaningless) value. However, some files (particularly small images)
 | 
					
						
							|  |  |  |     // don't decode to anything. If we know this is a drag-and-drop upload,
 | 
					
						
							|  |  |  |     // we can skip this check.
 | 
					
						
							|  |  |  |     if (isset($_REQUEST['__upload__'])) { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // PHP generates $_POST only for two content types. This routing happens
 | 
					
						
							|  |  |  |     // in `main/php_content_types.c` in PHP. Normally, all forms use one of
 | 
					
						
							|  |  |  |     // these content types, but some requests may not -- for example, Firefox
 | 
					
						
							|  |  |  |     // submits files sent over HTML5 XMLHTTPRequest APIs with the Content-Type
 | 
					
						
							|  |  |  |     // of the file itself. If we don't have a recognized content type, we
 | 
					
						
							|  |  |  |     // don't need $_POST.
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // NOTE: We use strncmp() because the actual content type may be something
 | 
					
						
							|  |  |  |     // like "multipart/form-data; boundary=...".
 | 
					
						
							|  |  |  |     //
 | 
					
						
							|  |  |  |     // NOTE: Chrome sometimes omits this header, see some discussion in T1762
 | 
					
						
							|  |  |  |     // and http://code.google.com/p/chromium/issues/detail?id=6800
 | 
					
						
							|  |  |  |     $content_type = isset($_SERVER['CONTENT_TYPE']) | 
					
						
							|  |  |  |       ? $_SERVER['CONTENT_TYPE'] | 
					
						
							|  |  |  |       : ''; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $parsed_types = array( | 
					
						
							|  |  |  |       'application/x-www-form-urlencoded', | 
					
						
							|  |  |  |       'multipart/form-data', | 
					
						
							|  |  |  |     ); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $is_parsed_type = false; | 
					
						
							|  |  |  |     foreach ($parsed_types as $parsed_type) { | 
					
						
							|  |  |  |       if (strncmp($content_type, $parsed_type, strlen($parsed_type)) === 0) { | 
					
						
							|  |  |  |         $is_parsed_type = true; | 
					
						
							|  |  |  |         break; | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!$is_parsed_type) { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // Check for 'Content-Length'. If there's no data, we don't expect $_POST
 | 
					
						
							|  |  |  |     // to exist.
 | 
					
						
							|  |  |  |     $length = (int)$_SERVER['CONTENT_LENGTH']; | 
					
						
							|  |  |  |     if (!$length) { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // Time to fatal: we know this was a POST with data that should have been
 | 
					
						
							|  |  |  |     // populated into $_POST, but it wasn't.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $config = ini_get('post_max_size'); | 
					
						
							|  |  |  |     PhabricatorStartup::didFatal( | 
					
						
							|  |  |  |       "As received by the server, this request had a nonzero content length ". | 
					
						
							|  |  |  |       "but no POST data.\n\n". | 
					
						
							|  |  |  |       "Normally, this indicates that it exceeds the 'post_max_size' setting ". | 
					
						
							|  |  |  |       "in the PHP configuration on the server. Increase the 'post_max_size' ". | 
					
						
							|  |  |  |       "setting or reduce the size of the request.\n\n". | 
					
						
							|  |  |  |       "Request size according to 'Content-Length' was '{$length}', ". | 
					
						
							|  |  |  |       "'post_max_size' is set to '{$config}'."); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
											  
											
												Rate limit requests by IP
Summary:
Fixes T3923. On `secure.phabricator.com`, we occasionally get slowed to a crawl when someone runs a security scanner against us, or 5 search bots decide to simultaneously index every line of every file in Diffusion.
Every time a user makes a request, give their IP address some points. If they get too many points in 5 minutes, start blocking their requests automatically for a while.
We give fewer points for logged in requests. We could further refine this (more points for a 404, more points for a really slow page, etc.) but let's start simply.
Also, provide a mechanism for configuring this, and configuring the LB environment stuff at the same time (this comes up rarely, but we don't have a good answer right now).
Test Plan: Used `ab` and reloading over and over again to hit rate limits. Read documentation.
Reviewers: btrahan
Reviewed By: btrahan
Subscribers: chad, epriestley
Maniphest Tasks: T3923
Differential Revision: https://secure.phabricator.com/D8713
											
										 
											2014-04-08 18:36:21 -07:00
										 |  |  | 
 | 
					
						
							|  |  |  | /* -(  Rate Limiting  )------------------------------------------------------ */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Adjust the permissible rate limit score. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * By default, the limit is `1000`. You can use this method to set it to | 
					
						
							|  |  |  |    * a larger or smaller value. If you set it to `2000`, users may make twice | 
					
						
							|  |  |  |    * as many requests before rate limiting. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @param int Maximum score before rate limiting. | 
					
						
							|  |  |  |    * @return void | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function setMaximumRate($rate) { | 
					
						
							|  |  |  |     self::$maximumRate = $rate; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Check if the user (identified by `$user_identity`) has issued too many | 
					
						
							|  |  |  |    * requests recently. If they have, end the request with a 429 error code. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * The key just needs to identify the user. Phabricator uses both user PHIDs | 
					
						
							|  |  |  |    * and user IPs as keys, tracking logged-in and logged-out users separately | 
					
						
							|  |  |  |    * and enforcing different limits. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @param   string  Some key which identifies the user making the request. | 
					
						
							|  |  |  |    * @return  void    If the user has exceeded the rate limit, this method | 
					
						
							|  |  |  |    *                  does not return. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function rateLimitRequest($user_identity) { | 
					
						
							|  |  |  |     if (!self::canRateLimit()) { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $score = self::getRateLimitScore($user_identity); | 
					
						
							|  |  |  |     if ($score > (self::$maximumRate * self::getRateLimitBucketCount())) { | 
					
						
							|  |  |  |       // Give the user some bonus points for getting rate limited. This keeps
 | 
					
						
							|  |  |  |       // bad actors who keep slamming the 429 page locked out completely,
 | 
					
						
							|  |  |  |       // instead of letting them get a burst of requests through every minute
 | 
					
						
							|  |  |  |       // after a bucket expires.
 | 
					
						
							|  |  |  |       self::addRateLimitScore($user_identity, 50); | 
					
						
							|  |  |  |       self::didRateLimit($user_identity); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Add points to the rate limit score for some user. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * If users have earned more than 1000 points per minute across all the | 
					
						
							|  |  |  |    * buckets they'll be locked out of the application, so awarding 1 point per | 
					
						
							|  |  |  |    * request roughly corresponds to allowing 1000 requests per second, while | 
					
						
							|  |  |  |    * awarding 50 points roughly corresponds to allowing 20 requests per second. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @param string  Some key which identifies the user making the request. | 
					
						
							|  |  |  |    * @param float   The cost for this request; more points pushes them toward | 
					
						
							|  |  |  |    *                the limit faster. | 
					
						
							|  |  |  |    * @return void | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   public static function addRateLimitScore($user_identity, $score) { | 
					
						
							|  |  |  |     if (!self::canRateLimit()) { | 
					
						
							|  |  |  |       return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $current = self::getRateLimitBucket(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // There's a bit of a race here, if a second process reads the bucket before
 | 
					
						
							|  |  |  |     // this one writes it, but it's fine if we occasionally fail to record a
 | 
					
						
							|  |  |  |     // user's score. If they're making requests fast enough to hit rate
 | 
					
						
							|  |  |  |     // limiting, we'll get them soon.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $bucket_key = self::getRateLimitBucketKey($current); | 
					
						
							|  |  |  |     $bucket = apc_fetch($bucket_key); | 
					
						
							|  |  |  |     if (!is_array($bucket)) { | 
					
						
							|  |  |  |       $bucket = array(); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (empty($bucket[$user_identity])) { | 
					
						
							|  |  |  |       $bucket[$user_identity] = 0; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $bucket[$user_identity] += $score; | 
					
						
							|  |  |  |     apc_store($bucket_key, $bucket); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Determine if rate limiting is available. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * Rate limiting depends on APC, and isn't available unless the APC user | 
					
						
							|  |  |  |    * cache is available. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @return bool True if rate limiting is available. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function canRateLimit() { | 
					
						
							|  |  |  |     if (!self::$maximumRate) { | 
					
						
							|  |  |  |       return false; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!function_exists('apc_fetch')) { | 
					
						
							|  |  |  |       return false; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return true; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Get the current bucket for storing rate limit scores. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @return int The current bucket. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function getRateLimitBucket() { | 
					
						
							|  |  |  |     return (int)(time() / 60); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Get the total number of rate limit buckets to retain. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @return int Total number of rate limit buckets to retain. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function getRateLimitBucketCount() { | 
					
						
							|  |  |  |     return 5; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Get the APC key for a given bucket. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @param int Bucket to get the key for. | 
					
						
							|  |  |  |    * @return string APC key for the bucket. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function getRateLimitBucketKey($bucket) { | 
					
						
							|  |  |  |     return 'rate:bucket:'.$bucket; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Get the APC key for the smallest stored bucket. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @return string APC key for the smallest stored bucket. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function getRateLimitMinKey() { | 
					
						
							|  |  |  |     return 'rate:min'; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Get the current rate limit score for a given user. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @param string Unique key identifying the user. | 
					
						
							|  |  |  |    * @return float The user's current score. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function getRateLimitScore($user_identity) { | 
					
						
							|  |  |  |     $min_key = self::getRateLimitMinKey(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // Identify the oldest bucket stored in APC.
 | 
					
						
							|  |  |  |     $cur = self::getRateLimitBucket(); | 
					
						
							|  |  |  |     $min = apc_fetch($min_key); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // If we don't have any buckets stored yet, store the current bucket as
 | 
					
						
							|  |  |  |     // the oldest bucket.
 | 
					
						
							|  |  |  |     if (!$min) { | 
					
						
							|  |  |  |       apc_store($min_key, $cur); | 
					
						
							|  |  |  |       $min = $cur; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // Destroy any buckets that are older than the minimum bucket we're keeping
 | 
					
						
							|  |  |  |     // track of. Under load this normally shouldn't do anything, but will clean
 | 
					
						
							|  |  |  |     // up an old bucket once per minute.
 | 
					
						
							|  |  |  |     $count = self::getRateLimitBucketCount(); | 
					
						
							|  |  |  |     for ($cursor = $min; $cursor < ($cur - $count); $cursor++) { | 
					
						
							|  |  |  |       apc_delete(self::getRateLimitBucketKey($cursor)); | 
					
						
							|  |  |  |       apc_store($min_key, $cursor + 1); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     // Now, sum up the user's scores in all of the active buckets.
 | 
					
						
							|  |  |  |     $score = 0; | 
					
						
							|  |  |  |     for (; $cursor <= $cur; $cursor++) { | 
					
						
							|  |  |  |       $bucket = apc_fetch(self::getRateLimitBucketKey($cursor)); | 
					
						
							|  |  |  |       if (isset($bucket[$user_identity])) { | 
					
						
							|  |  |  |         $score += $bucket[$user_identity]; | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return $score; | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /** | 
					
						
							|  |  |  |    * Emit an HTTP 429 "Too Many Requests" response (indicating that the user | 
					
						
							|  |  |  |    * has exceeded application rate limits) and exit. | 
					
						
							|  |  |  |    * | 
					
						
							|  |  |  |    * @return exit This method **does not return**. | 
					
						
							|  |  |  |    * @task ratelimit | 
					
						
							|  |  |  |    */ | 
					
						
							|  |  |  |   private static function didRateLimit() { | 
					
						
							|  |  |  |     $message = | 
					
						
							|  |  |  |       "TOO MANY REQUESTS\n". | 
					
						
							|  |  |  |       "You are issuing too many requests too quickly.\n". | 
					
						
							|  |  |  |       "To adjust limits, see \"Configuring a Preamble Script\" in the ". | 
					
						
							|  |  |  |       "documentation."; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     header( | 
					
						
							|  |  |  |       'Content-Type: text/plain; charset=utf-8', | 
					
						
							|  |  |  |       $replace = true, | 
					
						
							|  |  |  |       $http_error = 429); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     echo $message; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     exit(1); | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-12-25 06:11:39 -08:00
										 |  |  | } |