diff options
Diffstat (limited to 'lib/uri/http.rb')
| -rw-r--r-- | lib/uri/http.rb | 119 |
1 files changed, 78 insertions, 41 deletions
diff --git a/lib/uri/http.rb b/lib/uri/http.rb index 87eb8893f2..3c41cd4e93 100644 --- a/lib/uri/http.rb +++ b/lib/uri/http.rb @@ -1,12 +1,13 @@ -# +# frozen_string_literal: false # = uri/http.rb # # Author:: Akira Yamada <akira@ruby-lang.org> # License:: You can redistribute it and/or modify it under the same term as Ruby. -# Revision:: $Id$ +# +# See URI for general documentation # -require 'uri/generic' +require_relative 'generic' module URI @@ -14,87 +15,123 @@ module URI # The syntax of HTTP URIs is defined in RFC1738 section 3.3. # # Note that the Ruby URI library allows HTTP URLs containing usernames and - # passwords. This is not legal as per the RFC, but used to be - # supported in Internet Explorer 5 and 6, before the MS04-004 security + # passwords. This is not legal as per the RFC, but used to be + # supported in Internet Explorer 5 and 6, before the MS04-004 security # update. See <URL:http://support.microsoft.com/kb/834489>. # class HTTP < Generic + # A Default port of 80 for URI::HTTP. DEFAULT_PORT = 80 - COMPONENT = [ - :scheme, - :userinfo, :host, :port, - :path, - :query, - :fragment + # An Array of the available components for URI::HTTP. + COMPONENT = %i[ + scheme + userinfo host port + path + query + fragment ].freeze # # == Description # - # Create a new URI::HTTP object from components, with syntax checking. + # Creates a new URI::HTTP object from components, with syntax checking. # - # The components accepted are userinfo, host, port, path, query and + # The components accepted are userinfo, host, port, path, query, and # fragment. # - # The components should be provided either as an Array, or as a Hash - # with keys formed by preceding the component names with a colon. + # The components should be provided either as an Array, or as a Hash + # with keys formed by preceding the component names with a colon. # - # If an Array is used, the components must be passed in the order - # [userinfo, host, port, path, query, fragment]. + # If an Array is used, the components must be passed in the + # order <code>[userinfo, host, port, path, query, fragment]</code>. # # Example: # - # newuri = URI::HTTP.build({:host => 'www.example.com', - # :path> => '/foo/bar'}) + # uri = URI::HTTP.build(host: 'www.example.com', path: '/foo/bar') # - # newuri = URI::HTTP.build([nil, "www.example.com", nil, "/path", + # uri = URI::HTTP.build([nil, "www.example.com", nil, "/path", # "query", 'fragment']) # - # Currently, if passed userinfo components this method generates + # Currently, if passed userinfo components this method generates # invalid HTTP URIs as per RFC 1738. # def self.build(args) - tmp = Util::make_components_hash(self, args) - return super(tmp) + tmp = Util.make_components_hash(self, args) + super(tmp) + end + + # Do not allow empty host names, as they are not allowed by RFC 3986. + def check_host(v) + ret = super + + if ret && v.empty? + raise InvalidComponentError, + "bad component(expected host component): #{v}" + end + + ret end # # == Description # - # Create a new URI::HTTP object from generic URI components as per - # RFC 2396. No HTTP-specific syntax checking (as per RFC 1738) is - # performed. + # Returns the full path for an HTTP request, as required by Net::HTTP::Get. # - # Arguments are +scheme+, +userinfo+, +host+, +port+, +registry+, +path+, - # +opaque+, +query+ and +fragment+, in that order. + # If the URI contains a query, the full path is URI#path + '?' + URI#query. + # Otherwise, the path is simply URI#path. # # Example: # - # uri = URI::HTTP.new(['http', nil, "www.example.com", nil, "/path", - # "query", 'fragment']) + # uri = URI::HTTP.build(path: '/foo/bar', query: 'test=true') + # uri.request_uri # => "/foo/bar?test=true" # - def initialize(*arg) - super(*arg) + def request_uri + return unless @path + + url = @query ? "#@path?#@query" : @path.dup + url.start_with?(?/.freeze) ? url : ?/ + url end # # == Description # - # Returns the full path for an HTTP request, as required by Net::HTTP::Get. + # Returns the authority for an HTTP uri, as defined in + # https://www.rfc-editor.org/rfc/rfc3986#section-3.2. # - # If the URI contains a query, the full path is URI#path + '?' + URI#query. - # Otherwise, the path is simply URI#path. # - def request_uri - r = path_query - if r[0] != ?/ - r = '/' + r + # Example: + # + # URI::HTTP.build(host: 'www.example.com', path: '/foo/bar').authority #=> "www.example.com" + # URI::HTTP.build(host: 'www.example.com', port: 8000, path: '/foo/bar').authority #=> "www.example.com:8000" + # URI::HTTP.build(host: 'www.example.com', port: 80, path: '/foo/bar').authority #=> "www.example.com" + # + def authority + if port == default_port + host + else + "#{host}:#{port}" end + end - r + # + # == Description + # + # Returns the origin for an HTTP uri, as defined in + # https://www.rfc-editor.org/rfc/rfc6454. + # + # + # Example: + # + # URI::HTTP.build(host: 'www.example.com', path: '/foo/bar').origin #=> "http://www.example.com" + # URI::HTTP.build(host: 'www.example.com', port: 8000, path: '/foo/bar').origin #=> "http://www.example.com:8000" + # URI::HTTP.build(host: 'www.example.com', port: 80, path: '/foo/bar').origin #=> "http://www.example.com" + # URI::HTTPS.build(host: 'www.example.com', path: '/foo/bar').origin #=> "https://www.example.com" + # + def origin + "#{scheme}://#{authority}" end end - @@schemes['HTTP'] = HTTP + register_scheme 'HTTP', HTTP end |
