request.rb 21.2 KB
Newer Older
1 2 3 4
require 'tempfile'
require 'stringio'
require 'strscan'

D
Initial  
David Heinemeier Hansson 已提交
5
module ActionController
6
  # CgiRequest and TestRequest provide concrete implementations.
D
Initial  
David Heinemeier Hansson 已提交
7
  class AbstractRequest
8
    cattr_accessor :relative_url_root
9
    remove_method :relative_url_root
10

11
    # The hash of environment variables for this request,
12 13 14
    # such as { 'RAILS_ENV' => 'production' }.
    attr_reader :env

15 16
    # The requested content type, such as :html or :xml.
    attr_writer :format
17

18 19 20
    # The HTTP request method as a lowercase symbol, such as :get.
    # Note, HEAD is returned as :get since the two are functionally
    # equivalent from the application's perspective.
D
Initial  
David Heinemeier Hansson 已提交
21
    def method
22 23 24 25 26 27 28
      @request_method ||=
        if @env['REQUEST_METHOD'] == 'POST' && !parameters[:_method].blank?
          parameters[:_method].to_s.downcase.to_sym
        else
          @env['REQUEST_METHOD'].downcase.to_sym
        end

29
      @request_method == :head ? :get : @request_method
D
Initial  
David Heinemeier Hansson 已提交
30 31
    end

32
    # Is this a GET (or HEAD) request?  Equivalent to request.method == :get
D
Initial  
David Heinemeier Hansson 已提交
33 34 35 36
    def get?
      method == :get
    end

37
    # Is this a POST request?  Equivalent to request.method == :post
D
Initial  
David Heinemeier Hansson 已提交
38 39 40 41
    def post?
      method == :post
    end

42
    # Is this a PUT request?  Equivalent to request.method == :put
D
Initial  
David Heinemeier Hansson 已提交
43 44 45 46
    def put?
      method == :put
    end

47
    # Is this a DELETE request?  Equivalent to request.method == :delete
D
Initial  
David Heinemeier Hansson 已提交
48 49 50 51
    def delete?
      method == :delete
    end

52 53
    # Is this a HEAD request? request.method sees HEAD as :get, so check the
    # HTTP method directly.
54
    def head?
55
      @env['REQUEST_METHOD'].downcase.to_sym == :head
56
    end
57

58 59 60 61
    def headers
      @env
    end

62 63 64 65
    def content_length
      @content_length ||= env['CONTENT_LENGTH'].to_i
    end

66
    # The MIME type of the HTTP request, such as Mime::XML.
67 68 69
    #
    # For backward compatibility, the post format is extracted from the
    # X-Post-Data-Format HTTP header if present.
70
    def content_type
71
      @content_type ||= Mime::Type.lookup(content_type_without_parameters)
72 73
    end

74
    # Returns the accepted MIME type for the request
75
    def accepts
76 77
      @accepts ||=
        if @env['HTTP_ACCEPT'].to_s.strip.empty?
78
          [ content_type, Mime::ALL ].compact # make sure content_type being nil is not included
79 80 81
        else
          Mime::Type.parse(@env['HTTP_ACCEPT'])
        end
82
    end
83

84 85 86 87 88 89 90
    # Returns the Mime type for the format used in the request. If there is no format available, the first of the 
    # accept types will be used. Examples:
    #
    #   GET /posts/5.xml   | request.format => Mime::XML
    #   GET /posts/5.xhtml | request.format => Mime::HTML
    #   GET /posts/5       | request.format => request.accepts.first (usually Mime::HTML for browsers)
    def format
91
      @format ||= parameters[:format] ? Mime::Type.lookup_by_extension(parameters[:format]) : accepts.first
92 93
    end

94 95 96
    # Returns true if the request's "X-Requested-With" header contains
    # "XMLHttpRequest". (The Prototype Javascript library sends this header with
    # every Ajax request.)
97
    def xml_http_request?
98
      not /XMLHttpRequest/i.match(@env['HTTP_X_REQUESTED_WITH']).nil?
99 100 101
    end
    alias xhr? :xml_http_request?

D
Initial  
David Heinemeier Hansson 已提交
102 103 104 105 106 107 108
    # Determine originating IP address.  REMOTE_ADDR is the standard
    # but will fail if the user is behind a proxy.  HTTP_CLIENT_IP and/or
    # HTTP_X_FORWARDED_FOR are set by proxies so check for these before
    # falling back to REMOTE_ADDR.  HTTP_X_FORWARDED_FOR may be a comma-
    # delimited list in the case of multiple chained proxies; the first is
    # the originating IP.
    def remote_ip
109
      return @env['HTTP_CLIENT_IP'] if @env.include? 'HTTP_CLIENT_IP'
110

111 112
      if @env.include? 'HTTP_X_FORWARDED_FOR' then
        remote_ips = @env['HTTP_X_FORWARDED_FOR'].split(',').reject do |ip|
113
          ip.strip =~ /^unknown$|^(10|172\.(1[6-9]|2[0-9]|30|31)|192\.168)\./i
114 115 116
        end

        return remote_ips.first.strip unless remote_ips.empty?
D
Initial  
David Heinemeier Hansson 已提交
117
      end
118

119
      @env['REMOTE_ADDR']
D
Initial  
David Heinemeier Hansson 已提交
120 121
    end

122 123 124 125 126 127 128 129
    # Returns the lowercase name of the HTTP server software.
    def server_software
      (@env['SERVER_SOFTWARE'] && /^([a-zA-Z]+)/ =~ @env['SERVER_SOFTWARE']) ? $1.downcase : nil
    end


    # Returns the complete URL used for this request
    def url
D
David Heinemeier Hansson 已提交
130
      protocol + host_with_port + request_uri
131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171
    end

    # Return 'https://' if this is an SSL request and 'http://' otherwise.
    def protocol
      ssl? ? 'https://' : 'http://'
    end

    # Is this an SSL request?
    def ssl?
      @env['HTTPS'] == 'on' || @env['HTTP_X_FORWARDED_PROTO'] == 'https'
    end

    # Returns the host for this request, such as example.com.
    def host
    end

    # Returns a host:port string for this request, such as example.com or
    # example.com:8080.
    def host_with_port
      host + port_string
    end

    # Returns the port number of this request as an integer.
    def port
      @port_as_int ||= @env['SERVER_PORT'].to_i
    end

    # Returns the standard port number for this request's protocol
    def standard_port
      case protocol
        when 'https://' then 443
        else 80
      end
    end

    # Returns a port suffix like ":8080" if the port number of this request
    # is not the default HTTP port 80 or HTTPS port 443.
    def port_string
      (port == standard_port) ? '' : ":#{port}"
    end

172 173 174
    # Returns the domain part of a host, such as rubyonrails.org in "www.rubyonrails.org". You can specify
    # a different <tt>tld_length</tt>, such as 2 to catch rubyonrails.co.uk in "www.rubyonrails.co.uk".
    def domain(tld_length = 1)
175
      return nil if !/\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}/.match(host).nil? or host.nil?
176

177
      host.split('.').last(1 + tld_length).join('.')
178 179 180 181 182 183
    end

    # Returns all the subdomains as an array, so ["dev", "www"] would be returned for "dev.www.rubyonrails.org".
    # You can specify a different <tt>tld_length</tt>, such as 2 to catch ["www"] instead of ["www", "rubyonrails"]
    # in "www.rubyonrails.co.uk".
    def subdomains(tld_length = 1)
184
      return [] unless host
185
      parts = host.split('.')
186
      parts[0..-(tld_length+2)]
187 188
    end

189 190
    # Return the request URI, accounting for server idiosyncracies.
    # WEBrick includes the full URL. IIS leaves REQUEST_URI blank.
D
Initial  
David Heinemeier Hansson 已提交
191
    def request_uri
192
      if uri = @env['REQUEST_URI']
193 194 195 196
        # Remove domain, which webrick puts into the request_uri.
        (%r{^\w+\://[^/]+(/.*|$)$} =~ uri) ? $1 : uri
      else
        # Construct IIS missing REQUEST_URI from SCRIPT_NAME and PATH_INFO.
197 198
        script_filename = @env['SCRIPT_NAME'].to_s.match(%r{[^/]+$})
        uri = @env['PATH_INFO']
199
        uri = uri.sub(/#{script_filename}\//, '') unless script_filename.nil?
200
        unless (env_qs = @env['QUERY_STRING']).nil? || env_qs.empty?
201 202
          uri << '?' << env_qs
        end
203
        @env['REQUEST_URI'] = uri
204
      end
205
    end
D
Initial  
David Heinemeier Hansson 已提交
206

207
    # Returns the interpreted path to requested resource after all the installation directory of this application was taken into account
D
Initial  
David Heinemeier Hansson 已提交
208
    def path
209
      path = (uri = request_uri) ? uri.split('?').first.to_s : ''
210

211
      # Cut off the path to the installation directory if given
212 213
      path.sub!(%r/^#{relative_url_root}/, '')
      path || ''      
214
    end
215
    
216
    # Returns the path minus the web server relative installation directory.
217 218 219
    # This can be set with the environment variable RAILS_RELATIVE_URL_ROOT.
    # It can be automatically extracted for Apache setups. If the server is not
    # Apache, this method returns an empty string.
220
    def relative_url_root
221 222 223 224 225 226 227 228
      @@relative_url_root ||= case
        when @env["RAILS_RELATIVE_URL_ROOT"]
          @env["RAILS_RELATIVE_URL_ROOT"]
        when server_software == 'apache'
          @env["SCRIPT_NAME"].to_s.sub(/\/dispatch\.(fcgi|rb|cgi)$/, '')
        else
          ''
      end
D
Initial  
David Heinemeier Hansson 已提交
229 230 231
    end


232 233
    # Read the request body. This is useful for web services that need to
    # work with raw requests directly.
234
    def raw_post
235 236 237 238 239
      unless env.include? 'RAW_POST_DATA'
        env['RAW_POST_DATA'] = body.read(content_length)
        body.rewind if body.respond_to?(:rewind)
      end
      env['RAW_POST_DATA']
240 241
    end

242 243 244
    # Returns both GET and POST parameters in a single hash.
    def parameters
      @parameters ||= request_parameters.update(query_parameters).update(path_parameters).with_indifferent_access
D
Initial  
David Heinemeier Hansson 已提交
245
    end
246

247
    def path_parameters=(parameters) #:nodoc:
248
      @path_parameters = parameters
249 250
      @symbolized_path_parameters = @parameters = nil
    end
251

252 253
    # The same as <tt>path_parameters</tt> with explicitly symbolized keys 
    def symbolized_path_parameters 
254
      @symbolized_path_parameters ||= path_parameters.symbolize_keys
255
    end
D
Initial  
David Heinemeier Hansson 已提交
256

257 258 259 260 261
    # Returns a hash with the parameters used to form the path of the request 
    #
    # Example: 
    #
    #   {:action => 'my_action', :controller => 'my_controller'}
262 263 264
    def path_parameters
      @path_parameters ||= {}
    end
265 266


D
Initial  
David Heinemeier Hansson 已提交
267 268 269
    #--
    # Must be implemented in the concrete request
    #++
270 271 272 273 274

    # The request body is an IO input stream.
    def body
    end

275
    def query_parameters #:nodoc:
D
Initial  
David Heinemeier Hansson 已提交
276 277
    end

278
    def request_parameters #:nodoc:
D
Initial  
David Heinemeier Hansson 已提交
279 280
    end

281
    def cookies #:nodoc:
D
Initial  
David Heinemeier Hansson 已提交
282 283
    end

284
    def session #:nodoc:
D
Initial  
David Heinemeier Hansson 已提交
285 286
    end

287 288 289 290
    def session=(session) #:nodoc:
      @session = session
    end

291
    def reset_session #:nodoc:
292
    end
293

294 295 296
    protected
      # The raw content type string. Use when you need parameters such as
      # charset or boundary which aren't included in the content_type MIME type.
297
      # Overridden by the X-POST_DATA_FORMAT header for backward compatibility.
298
      def content_type_with_parameters
299 300
        content_type_from_legacy_post_data_format_header ||
          env['CONTENT_TYPE'].to_s
301 302 303 304 305 306 307 308 309 310 311
      end

      # The raw content type string with its parameters stripped off.
      def content_type_without_parameters
        @content_type_without_parameters ||= self.class.extract_content_type_without_parameters(content_type_with_parameters)
      end

    private
      def content_type_from_legacy_post_data_format_header
        if x_post_format = @env['HTTP_X_POST_DATA_FORMAT']
          case x_post_format.to_s.downcase
312 313
            when 'yaml';  'application/x-yaml'
            when 'xml';   'application/xml'
314 315 316 317
          end
        end
      end

318
      def parse_formatted_request_parameters
319 320
        return {} if content_length.zero?

321
        content_type, boundary = self.class.extract_multipart_boundary(content_type_with_parameters)
322 323

        # Don't parse params for unknown requests.
324 325 326 327 328 329
        return {} if content_type.blank?

        mime_type = Mime::Type.lookup(content_type)
        strategy = ActionController::Base.param_parsers[mime_type]

        # Only multipart form parsing expects a stream.
J
Jeremy Kemper 已提交
330
        body = (strategy && strategy != :multipart_form) ? raw_post : self.body
331 332 333 334 335

        case strategy
          when Proc
            strategy.call(body)
          when :url_encoded_form
336 337
            self.class.clean_up_ajax_request_body! body
            self.class.parse_query_parameters(body)
338
          when :multipart_form
339
            self.class.parse_multipart_form_parameters(body, boundary, content_length, env)
340 341 342 343 344 345 346 347 348 349
          when :xml_simple, :xml_node
            body.blank? ? {} : Hash.from_xml(body).with_indifferent_access
          when :yaml
            YAML.load(body)
          else
            {}
        end
      rescue Exception => e # YAML, XML or Ruby code block errors
        raise
        { "body" => body,
350
          "content_type" => content_type_with_parameters,
351 352 353 354 355
          "content_length" => content_length,
          "exception" => "#{e.message} (#{e.class})",
          "backtrace" => e.backtrace }
      end

356
    class << self
357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397
      def parse_query_parameters(query_string)
        return {} if query_string.blank?

        pairs = query_string.split('&').collect do |chunk|
          next if chunk.empty?
          key, value = chunk.split('=', 2)
          next if key.empty?
          value = value.nil? ? nil : CGI.unescape(value)
          [ CGI.unescape(key), value ]
        end.compact

        UrlEncodedPairParser.new(pairs).result
      end

      def parse_request_parameters(params)
        parser = UrlEncodedPairParser.new

        params = params.dup
        until params.empty?
          for key, value in params
            if key.blank?
              params.delete key
            elsif !key.include?('[')
              # much faster to test for the most common case first (GET)
              # and avoid the call to build_deep_hash
              parser.result[key] = get_typed_value(value[0])
              params.delete key
            elsif value.is_a?(Array)
              parser.parse(key, get_typed_value(value.shift))
              params.delete key if value.empty?
            else
              raise TypeError, "Expected array, found #{value.inspect}"
            end
          end
        end

        parser.result
      end

      def parse_multipart_form_parameters(body, boundary, content_length, env)
        parse_request_parameters(read_multipart(body, boundary, content_length, env))
398
      end
399

400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417
      def extract_multipart_boundary(content_type_with_parameters)
        if content_type_with_parameters =~ MULTIPART_BOUNDARY
          ['multipart/form-data', $1.dup]
        else
          extract_content_type_without_parameters(content_type_with_parameters)
        end
      end

      def extract_content_type_without_parameters(content_type_with_parameters)
        $1.strip.downcase if content_type_with_parameters =~ /^([^,\;]*)/
      end

      def clean_up_ajax_request_body!(body)
        body.chop! if body[-1] == 0
        body.gsub!(/&_=$/, '')
      end


418 419 420 421 422 423 424 425 426 427
      private
        def get_typed_value(value)
          case value
            when String
              value
            when NilClass
              ''
            when Array
              value.map { |v| get_typed_value(v) }
            else
428 429
              # This is an uploaded file.
              if value.respond_to?(:original_filename) && !value.original_filename.blank?
430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544
                unless value.respond_to?(:full_original_filename)
                  class << value
                    alias_method :full_original_filename, :original_filename

                    # Take the basename of the upload's original filename.
                    # This handles the full Windows paths given by Internet Explorer
                    # (and perhaps other broken user agents) without affecting
                    # those which give the lone filename.
                    # The Windows regexp is adapted from Perl's File::Basename.
                    def original_filename
                      if md = /^(?:.*[:\\\/])?(.*)/m.match(full_original_filename)
                        md.captures.first
                      else
                        File.basename full_original_filename
                      end
                    end
                  end
                end

                # Return the same value after overriding original_filename.
                value

              # Multipart values may have content type, but no filename.
              elsif value.respond_to?(:read)
                result = value.read
                value.rewind
                result

              # Unknown value, neither string nor multipart.
              else
                raise "Unknown form value: #{value.inspect}"
              end
          end
        end


        MULTIPART_BOUNDARY = %r|\Amultipart/form-data.*boundary=\"?([^\";,]+)\"?|n

        EOL = "\015\012"

        def read_multipart(body, boundary, content_length, env)
          params = Hash.new([])
          boundary = "--" + boundary
          quoted_boundary = Regexp.quote(boundary, "n")
          buf = ""
          bufsize = 10 * 1024
          boundary_end=""

          # start multipart/form-data
          body.binmode if defined? body.binmode
          boundary_size = boundary.size + EOL.size
          content_length -= boundary_size
          status = body.read(boundary_size)
          if nil == status
            raise EOFError, "no content body"
          elsif boundary + EOL != status
            raise EOFError, "bad content body"
          end

          loop do
            head = nil
            content =
              if 10240 < content_length
                Tempfile.new("CGI")
              else
                StringIO.new
              end
            content.binmode if defined? content.binmode

            until head and /#{quoted_boundary}(?:#{EOL}|--)/n.match(buf)

              if (not head) and /#{EOL}#{EOL}/n.match(buf)
                buf = buf.sub(/\A((?:.|\n)*?#{EOL})#{EOL}/n) do
                  head = $1.dup
                  ""
                end
                next
              end

              if head and ( (EOL + boundary + EOL).size < buf.size )
                content.print buf[0 ... (buf.size - (EOL + boundary + EOL).size)]
                buf[0 ... (buf.size - (EOL + boundary + EOL).size)] = ""
              end

              c = if bufsize < content_length
                    body.read(bufsize)
                  else
                    body.read(content_length)
                  end
              if c.nil? || c.empty?
                raise EOFError, "bad content body"
              end
              buf.concat(c)
              content_length -= c.size
            end

            buf = buf.sub(/\A((?:.|\n)*?)(?:[\r\n]{1,2})?#{quoted_boundary}([\r\n]{1,2}|--)/n) do
              content.print $1
              if "--" == $2
                content_length = -1
              end
             boundary_end = $2.dup
              ""
            end

            content.rewind

            /Content-Disposition:.* filename=(?:"((?:\\.|[^\"])*)"|([^;]*))/ni.match(head)
            filename = ($1 or $2 or "")
            if /Mac/ni.match(env['HTTP_USER_AGENT']) and
                /Mozilla/ni.match(env['HTTP_USER_AGENT']) and
                (not /MSIE/ni.match(env['HTTP_USER_AGENT']))
              filename = CGI.unescape(filename)
            end

545
            /Content-Type: ([^\r]*)/ni.match(head)
546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578
            content_type = ($1 or "")

            (class << content; self; end).class_eval do
              alias local_path path
              define_method(:original_filename) {filename.dup.taint}
              define_method(:content_type) {content_type.dup.taint}
            end

            /Content-Disposition:.* name="?([^\";]*)"?/ni.match(head)
            name = $1.dup

            if params.has_key?(name)
              params[name].push(content)
            else
              params[name] = [content]
            end
            break if buf.size == 0
            break if content_length == -1
          end
          raise EOFError, "bad boundary end of body part" unless boundary_end=~/--/

          params
        end
    end
  end

  class UrlEncodedPairParser < StringScanner #:nodoc:
    attr_reader :top, :parent, :result

    def initialize(pairs = [])
      super('')
      @result = {}
      pairs.each { |key, value| parse(key, value) }
579
    end
580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661

    KEY_REGEXP = %r{([^\[\]=&]+)}
    BRACKETED_KEY_REGEXP = %r{\[([^\[\]=&]+)\]}

    # Parse the query string
    def parse(key, value)
      self.string = key
      @top, @parent = result, nil

      # First scan the bare key
      key = scan(KEY_REGEXP) or return
      key = post_key_check(key)

      # Then scan as many nestings as present
      until eos?
        r = scan(BRACKETED_KEY_REGEXP) or return
        key = self[1]
        key = post_key_check(key)
      end

      bind(key, value)
    end

    private
      # After we see a key, we must look ahead to determine our next action. Cases:
      #
      #   [] follows the key. Then the value must be an array.
      #   = follows the key. (A value comes next)
      #   & or the end of string follows the key. Then the key is a flag.
      #   otherwise, a hash follows the key.
      def post_key_check(key)
        if scan(/\[\]/) # a[b][] indicates that b is an array
          container(key, Array)
          nil
        elsif check(/\[[^\]]/) # a[b] indicates that a is a hash
          container(key, Hash)
          nil
        else # End of key? We do nothing.
          key
        end
      end

      # Add a container to the stack.
      def container(key, klass)
        type_conflict! klass, top[key] if top.is_a?(Hash) && top.key?(key) && ! top[key].is_a?(klass)
        value = bind(key, klass.new)
        type_conflict! klass, value unless value.is_a?(klass)
        push(value)
      end

      # Push a value onto the 'stack', which is actually only the top 2 items.
      def push(value)
        @parent, @top = @top, value
      end

      # Bind a key (which may be nil for items in an array) to the provided value.
      def bind(key, value)
        if top.is_a? Array
          if key
            if top[-1].is_a?(Hash) && ! top[-1].key?(key)
              top[-1][key] = value
            else
              top << {key => value}.with_indifferent_access
              push top.last
            end
          else
            top << value
          end
        elsif top.is_a? Hash
          key = CGI.unescape(key)
          parent << (@top = {}) if top.key?(key) && parent.is_a?(Array)
          return top[key] ||= value
        else
          raise ArgumentError, "Don't know what to do: top is #{top.inspect}"
        end

        return value
      end

      def type_conflict!(klass, value)
        raise TypeError, "Conflicting types for parameter containers. Expected an instance of #{klass} but found an instance of #{value.class}. This can be caused by colliding Array and Hash parameters like qs[]=value&qs[key]=value."
      end
D
Initial  
David Heinemeier Hansson 已提交
662
  end
663
end