2017-07-24 16:20:53 -04:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
2016-08-06 12:51:43 -04:00
|
|
|
require "ipaddr"
|
2014-08-20 18:42:32 -04:00
|
|
|
|
2010-03-03 19:22:30 -05:00
|
|
|
module ActionDispatch
|
2013-01-02 18:21:13 -05:00
|
|
|
# This middleware calculates the IP address of the remote client that is
|
|
|
|
# making the request. It does this by checking various headers that could
|
|
|
|
# contain the address, and then picking the last-set address that is not
|
2013-02-11 11:32:12 -05:00
|
|
|
# on the list of trusted IPs. This follows the precedent set by e.g.
|
2013-01-02 18:21:13 -05:00
|
|
|
# {the Tomcat server}[https://issues.apache.org/bugzilla/show_bug.cgi?id=50453],
|
2019-10-02 05:54:57 -04:00
|
|
|
# with {reasoning explained at length}[https://blog.gingerlime.com/2012/rails-ip-spoofing-vulnerabilities-and-protection]
|
2013-01-02 18:21:13 -05:00
|
|
|
# by @gingerlime. A more detailed explanation of the algorithm is given
|
|
|
|
# at GetIp#calculate_ip.
|
|
|
|
#
|
2017-08-21 19:53:32 -04:00
|
|
|
# Some Rack servers concatenate repeated headers, like {HTTP RFC 2616}[https://www.w3.org/Protocols/rfc2616/rfc2616-sec4.html#sec4.2]
|
2013-02-21 09:37:45 -05:00
|
|
|
# requires. Some Rack servers simply drop preceding headers, and only report
|
2019-10-02 05:54:57 -04:00
|
|
|
# the value that was {given in the last header}[https://andre.arko.net/2011/12/26/repeated-headers-and-ruby-web-servers].
|
2014-06-07 04:53:27 -04:00
|
|
|
# If you are behind multiple proxy servers (like NGINX to HAProxy to Unicorn)
|
2013-01-02 18:21:13 -05:00
|
|
|
# then you should test your Rack server to make sure your data is good.
|
|
|
|
#
|
|
|
|
# IF YOU DON'T USE A PROXY, THIS MAKES YOU VULNERABLE TO IP SPOOFING.
|
|
|
|
# This middleware assumes that there is at least one proxy sitting around
|
|
|
|
# and setting headers with the client's remote IP address. If you don't use
|
2013-01-02 18:34:27 -05:00
|
|
|
# a proxy, because you are hosted on e.g. Heroku without SSL, any client can
|
|
|
|
# claim to have any IP address by setting the X-Forwarded-For header. If you
|
|
|
|
# care about that, then you need to explicitly drop or ignore those headers
|
|
|
|
# sometime before this middleware runs.
|
2010-03-03 19:22:30 -05:00
|
|
|
class RemoteIp
|
2013-01-02 18:21:13 -05:00
|
|
|
class IpSpoofAttackError < StandardError; end
|
2010-03-03 19:22:30 -05:00
|
|
|
|
2013-01-02 18:21:13 -05:00
|
|
|
# The default trusted IPs list simply includes IP addresses that are
|
|
|
|
# guaranteed by the IP specification to be private addresses. Those will
|
|
|
|
# not be the ultimate client IP in production, and so are discarded. See
|
2017-08-21 19:53:32 -04:00
|
|
|
# https://en.wikipedia.org/wiki/Private_network for details.
|
2014-08-20 18:42:32 -04:00
|
|
|
TRUSTED_PROXIES = [
|
2020-01-02 14:50:06 -05:00
|
|
|
"127.0.0.0/8", # localhost IPv4 range, per RFC-3330
|
2014-08-20 18:42:32 -04:00
|
|
|
"::1", # localhost IPv6
|
|
|
|
"fc00::/7", # private IPv6 range fc00::/7
|
|
|
|
"10.0.0.0/8", # private IPv4 range 10.x.x.x
|
|
|
|
"172.16.0.0/12", # private IPv4 range 172.16.0.0 .. 172.31.255.255
|
|
|
|
"192.168.0.0/16", # private IPv4 range 192.168.x.x
|
|
|
|
].map { |proxy| IPAddr.new(proxy) }
|
2011-11-12 02:22:49 -05:00
|
|
|
|
2011-11-14 16:20:20 -05:00
|
|
|
attr_reader :check_ip, :proxies
|
2011-11-12 05:45:31 -05:00
|
|
|
|
2013-01-02 18:21:13 -05:00
|
|
|
# Create a new +RemoteIp+ middleware instance.
|
|
|
|
#
|
2015-11-22 06:42:29 -05:00
|
|
|
# The +ip_spoofing_check+ option is on by default. When on, an exception
|
2013-01-02 18:21:13 -05:00
|
|
|
# is raised if it looks like the client is trying to lie about its own IP
|
|
|
|
# address. It makes sense to turn off this check on sites aimed at non-IP
|
|
|
|
# clients (like WAP devices), or behind proxies that set headers in an
|
|
|
|
# incorrect or confusing way (like AWS ELB).
|
|
|
|
#
|
2014-08-20 18:42:32 -04:00
|
|
|
# The +custom_proxies+ argument can take an Array of string, IPAddr, or
|
|
|
|
# Regexp objects which will be used instead of +TRUSTED_PROXIES+. If a
|
|
|
|
# single string, IPAddr, or Regexp object is provided, it will be used in
|
|
|
|
# addition to +TRUSTED_PROXIES+. Any proxy setup will put the value you
|
|
|
|
# want in the middle (or at the beginning) of the X-Forwarded-For list,
|
|
|
|
# with your proxy servers after it. If your proxies aren't removed, pass
|
|
|
|
# them in via the +custom_proxies+ parameter. That way, the middleware will
|
|
|
|
# ignore those IP addresses, and return the one that you want.
|
2015-11-22 06:42:29 -05:00
|
|
|
def initialize(app, ip_spoofing_check = true, custom_proxies = nil)
|
2011-11-12 02:22:49 -05:00
|
|
|
@app = app
|
2015-11-22 06:42:29 -05:00
|
|
|
@check_ip = ip_spoofing_check
|
2014-08-20 18:42:32 -04:00
|
|
|
@proxies = if custom_proxies.blank?
|
|
|
|
TRUSTED_PROXIES
|
|
|
|
elsif custom_proxies.respond_to?(:any?)
|
|
|
|
custom_proxies
|
|
|
|
else
|
|
|
|
Array(custom_proxies) + TRUSTED_PROXIES
|
|
|
|
end
|
2011-11-12 02:22:49 -05:00
|
|
|
end
|
2010-03-03 19:22:30 -05:00
|
|
|
|
2013-01-02 18:21:13 -05:00
|
|
|
# Since the IP address may not be needed, we store the object here
|
|
|
|
# without calculating the IP to keep from slowing down the majority of
|
|
|
|
# requests. For those requests that do need to know the IP, the
|
|
|
|
# GetIp#calculate_ip method will calculate the memoized client IP address.
|
2011-11-12 02:22:49 -05:00
|
|
|
def call(env)
|
2015-08-06 19:20:47 -04:00
|
|
|
req = ActionDispatch::Request.new env
|
|
|
|
req.remote_ip = GetIp.new(req, check_ip, proxies)
|
|
|
|
@app.call(req.env)
|
2010-03-03 19:22:30 -05:00
|
|
|
end
|
|
|
|
|
2013-01-02 18:21:13 -05:00
|
|
|
# The GetIp class exists as a way to defer processing of the request data
|
|
|
|
# into an actual IP address. If the ActionDispatch::Request#remote_ip method
|
|
|
|
# is called, this class will calculate the value and then memoize it.
|
2011-11-12 05:45:31 -05:00
|
|
|
class GetIp
|
2015-08-06 19:20:47 -04:00
|
|
|
def initialize(req, check_ip, proxies)
|
|
|
|
@req = req
|
2015-06-03 02:00:34 -04:00
|
|
|
@check_ip = check_ip
|
|
|
|
@proxies = proxies
|
2011-11-12 05:45:31 -05:00
|
|
|
end
|
|
|
|
|
2013-01-02 18:21:13 -05:00
|
|
|
# Sort through the various IP address headers, looking for the IP most
|
|
|
|
# likely to be the address of the actual remote client making this
|
|
|
|
# request.
|
|
|
|
#
|
|
|
|
# REMOTE_ADDR will be correct if the request is made directly against the
|
|
|
|
# Ruby process, on e.g. Heroku. When the request is proxied by another
|
2014-06-07 04:53:27 -04:00
|
|
|
# server like HAProxy or NGINX, the IP address that made the original
|
2013-01-02 18:21:13 -05:00
|
|
|
# request will be put in an X-Forwarded-For header. If there are multiple
|
|
|
|
# proxies, that header may contain a list of IPs. Other proxy services
|
|
|
|
# set the Client-Ip header instead, so we check that too.
|
|
|
|
#
|
2019-10-02 05:54:57 -04:00
|
|
|
# As discussed in {this post about Rails IP Spoofing}[https://blog.gingerlime.com/2012/rails-ip-spoofing-vulnerabilities-and-protection/],
|
2013-01-02 18:21:13 -05:00
|
|
|
# while the first IP in the list is likely to be the "originating" IP,
|
|
|
|
# it could also have been set by the client maliciously.
|
|
|
|
#
|
|
|
|
# In order to find the first address that is (probably) accurate, we
|
|
|
|
# take the list of IPs, remove known and trusted proxies, and then take
|
|
|
|
# the last address left, which was presumably set by one of those proxies.
|
2011-11-14 16:20:57 -05:00
|
|
|
def calculate_ip
|
2013-01-02 18:21:13 -05:00
|
|
|
# Set by the Rack web server, this is a single value.
|
2020-05-09 22:23:34 -04:00
|
|
|
remote_addr = sanitize_ips(ips_from(@req.remote_addr)).last
|
2013-01-02 18:21:13 -05:00
|
|
|
|
|
|
|
# Could be a CSV list and/or repeated headers that were concatenated.
|
2020-05-09 22:23:34 -04:00
|
|
|
client_ips = sanitize_ips(ips_from(@req.client_ip)).reverse
|
|
|
|
forwarded_ips = sanitize_ips(@req.forwarded_for || []).reverse
|
2013-01-02 18:21:13 -05:00
|
|
|
|
|
|
|
# +Client-Ip+ and +X-Forwarded-For+ should not, generally, both be set.
|
2015-11-22 06:42:29 -05:00
|
|
|
# If they are both set, it means that either:
|
|
|
|
#
|
|
|
|
# 1) This request passed through two proxies with incompatible IP header
|
|
|
|
# conventions.
|
|
|
|
# 2) The client passed one of +Client-Ip+ or +X-Forwarded-For+
|
|
|
|
# (whichever the proxy servers weren't using) themselves.
|
|
|
|
#
|
|
|
|
# Either way, there is no way for us to determine which header is the
|
|
|
|
# right one after the fact. Since we have no idea, if we are concerned
|
|
|
|
# about IP spoofing we need to give up and explode. (If you're not
|
|
|
|
# concerned about IP spoofing you can turn the +ip_spoofing_check+
|
|
|
|
# option off.)
|
2013-06-04 18:01:08 -04:00
|
|
|
should_check_ip = @check_ip && client_ips.last && forwarded_ips.last
|
2013-01-02 18:21:13 -05:00
|
|
|
if should_check_ip && !forwarded_ips.include?(client_ips.last)
|
2011-11-12 05:45:31 -05:00
|
|
|
# We don't know which came from the proxy, and which from the user
|
2017-01-12 03:39:16 -05:00
|
|
|
raise IpSpoofAttackError, "IP spoofing attack?! " \
|
|
|
|
"HTTP_CLIENT_IP=#{@req.client_ip.inspect} " \
|
2015-08-06 19:20:47 -04:00
|
|
|
"HTTP_X_FORWARDED_FOR=#{@req.x_forwarded_for.inspect}"
|
2011-11-12 05:45:31 -05:00
|
|
|
end
|
|
|
|
|
2013-01-02 18:21:13 -05:00
|
|
|
# We assume these things about the IP headers:
|
|
|
|
#
|
|
|
|
# - X-Forwarded-For will be a list of IPs, one per proxy, or blank
|
|
|
|
# - Client-Ip is propagated from the outermost proxy, or is blank
|
|
|
|
# - REMOTE_ADDR will be the IP that made the request to Rack
|
When all IPs are trusted, use the furthest away
Scenario: we have a REMOTE_ADDR of `127.0.0.1`, and X-Forwarded-For is
`A, B, C`.
Without any relevant trust, the `remote_ip` is `C`.
If `C` is trusted, then the `remote_ip` is `B`.
If `B` and `C` are trusted, then the `remote_ip` is `A`.
If all of `A`, `B`, and `C` are trusted, then the `remote_ip` should
still be `A`: if our trust was sufficient to get that far out before,
trusting something else should not have us fall back to `127.0.0.1`.
It is this last situation that we're correcting here:
We trust `A` to give us accurate X-Forwarded-For information, yet it has
chosen to leave it unset. Therefore, `A` is telling us that it is itself
the client.
2014-04-04 12:14:16 -04:00
|
|
|
ips = [forwarded_ips, client_ips].flatten.compact
|
2013-01-02 18:21:13 -05:00
|
|
|
|
When all IPs are trusted, use the furthest away
Scenario: we have a REMOTE_ADDR of `127.0.0.1`, and X-Forwarded-For is
`A, B, C`.
Without any relevant trust, the `remote_ip` is `C`.
If `C` is trusted, then the `remote_ip` is `B`.
If `B` and `C` are trusted, then the `remote_ip` is `A`.
If all of `A`, `B`, and `C` are trusted, then the `remote_ip` should
still be `A`: if our trust was sufficient to get that far out before,
trusting something else should not have us fall back to `127.0.0.1`.
It is this last situation that we're correcting here:
We trust `A` to give us accurate X-Forwarded-For information, yet it has
chosen to leave it unset. Therefore, `A` is telling us that it is itself
the client.
2014-04-04 12:14:16 -04:00
|
|
|
# If every single IP option is in the trusted list, return the IP
|
|
|
|
# that's furthest away
|
|
|
|
filter_proxies(ips + [remote_addr]).first || ips.last || remote_addr
|
2011-11-12 05:45:31 -05:00
|
|
|
end
|
|
|
|
|
2013-01-02 18:21:13 -05:00
|
|
|
# Memoizes the value returned by #calculate_ip and returns it for
|
|
|
|
# ActionDispatch::Request to use.
|
2011-11-14 16:20:57 -05:00
|
|
|
def to_s
|
2012-10-24 07:32:32 -04:00
|
|
|
@ip ||= calculate_ip
|
2011-11-14 16:20:57 -05:00
|
|
|
end
|
|
|
|
|
2016-12-22 04:48:24 -05:00
|
|
|
private
|
|
|
|
def ips_from(header) # :doc:
|
2015-08-06 19:20:47 -04:00
|
|
|
return [] unless header
|
2017-03-12 12:51:26 -04:00
|
|
|
# Split the comma-separated list into an array of strings.
|
2020-05-09 22:23:34 -04:00
|
|
|
header.strip.split(/[,\s]+/)
|
|
|
|
end
|
|
|
|
|
|
|
|
def sanitize_ips(ips) # :doc:
|
2014-08-20 18:42:32 -04:00
|
|
|
ips.select do |ip|
|
2018-12-20 12:44:01 -05:00
|
|
|
# Only return IPs that are valid according to the IPAddr#new method.
|
|
|
|
range = IPAddr.new(ip).to_range
|
|
|
|
# We want to make sure nobody is sneaking a netmask in.
|
|
|
|
range.begin == range.end
|
|
|
|
rescue ArgumentError
|
|
|
|
nil
|
2014-08-20 18:42:32 -04:00
|
|
|
end
|
2012-04-25 06:31:00 -04:00
|
|
|
end
|
|
|
|
|
2016-12-22 04:48:24 -05:00
|
|
|
def filter_proxies(ips) # :doc:
|
2014-08-20 18:42:32 -04:00
|
|
|
ips.reject do |ip|
|
|
|
|
@proxies.any? { |proxy| proxy === ip }
|
|
|
|
end
|
2012-04-25 06:31:00 -04:00
|
|
|
end
|
2010-03-03 19:22:30 -05:00
|
|
|
end
|
|
|
|
end
|
2011-11-12 05:45:31 -05:00
|
|
|
end
|