Module: WEBrick::HTTPUtils
- Defined in:
- lib/webrick/httputils.rb
Overview
HTTPUtils provides utility methods for working with the HTTP protocol.
This module is generally used internally by WEBrick.
Defined Under Namespace
Classes: CookieHeader, FormData, SplitHeader
Constant Summary collapse
- DefaultMimeTypes =
Default mime types
{ "ai" => "application/postscript", "asc" => "text/plain", "avi" => "video/x-msvideo", "avif" => "image/avif", "bin" => "application/octet-stream", "bmp" => "image/bmp", "class" => "application/octet-stream", "cer" => "application/pkix-cert", "crl" => "application/pkix-crl", "crt" => "application/x-x509-ca-cert", "css" => "text/css", "dms" => "application/octet-stream", "doc" => "application/msword", "dvi" => "application/x-dvi", "eps" => "application/postscript", "etx" => "text/x-setext", "exe" => "application/octet-stream", "gif" => "image/gif", "htm" => "text/html", "html" => "text/html", "ico" => "image/x-icon", "jpe" => "image/jpeg", "jpeg" => "image/jpeg", "jpg" => "image/jpeg", "js" => "application/javascript", "json" => "application/json", "lha" => "application/octet-stream", "lzh" => "application/octet-stream", "mjs" => "application/javascript", "mov" => "video/quicktime", "mp4" => "video/mp4", "mpe" => "video/mpeg", "mpeg" => "video/mpeg", "mpg" => "video/mpeg", "otf" => "font/otf", "pbm" => "image/x-portable-bitmap", "pdf" => "application/pdf", "pgm" => "image/x-portable-graymap", "png" => "image/png", "pnm" => "image/x-portable-anymap", "ppm" => "image/x-portable-pixmap", "ppt" => "application/vnd.ms-powerpoint", "ps" => "application/postscript", "qt" => "video/quicktime", "ras" => "image/x-cmu-raster", "rb" => "text/plain", "rd" => "text/plain", "rtf" => "application/rtf", "sgm" => "text/sgml", "sgml" => "text/sgml", "svg" => "image/svg+xml", "tif" => "image/tiff", "tiff" => "image/tiff", "ttc" => "font/collection", "ttf" => "font/ttf", "txt" => "text/plain", "wasm" => "application/wasm", "webm" => "video/webm", "webmanifest" => "application/manifest+json", "webp" => "image/webp", "woff" => "font/woff", "woff2" => "font/woff2", "xbm" => "image/x-xbitmap", "xhtml" => "text/html", "xls" => "application/vnd.ms-excel", "xml" => "text/xml", "xpm" => "image/x-xpixmap", "xwd" => "image/x-xwindowdump", "zip" => "application/zip", }
- HEADER_CLASSES =
Hash.new(SplitHeader).update({ "cookie" => CookieHeader, })
- UNESCAPED =
_make_regex(control+space+delims+unwise+nonascii)
- UNESCAPED_FORM =
_make_regex(reserved+control+delims+unwise+nonascii)
- NONASCII =
_make_regex(nonascii)
- ESCAPED =
/%([0-9a-fA-F]{2})/
- UNESCAPED_PCHAR =
_make_regex!(unreserved+":@&=+$,")
Class Method Summary collapse
- ._escape(str, regex) ⇒ Object
-
._make_regex(str) ⇒ Object
:stopdoc:.
- ._make_regex!(str) ⇒ Object
- ._unescape(str, regex) ⇒ Object
-
.dequote(str) ⇒ Object
Removes quotes and escapes from
str
. -
.escape(str) ⇒ Object
Escapes HTTP reserved and unwise characters in
str
. -
.escape8bit(str) ⇒ Object
Escapes 8 bit characters in
str
. -
.escape_form(str) ⇒ Object
Escapes form reserved characters in
str
. -
.escape_path(str) ⇒ Object
Escapes path
str
. -
.load_mime_types(file) ⇒ Object
Loads Apache-compatible mime.types in
file
. -
.mime_type(filename, mime_tab) ⇒ Object
Returns the mime type of
filename
from the list in mime_tab
. -
.normalize_path(path) ⇒ Object
Normalizes a request path.
-
.parse_form_data(io, boundary) ⇒ Object
Parses form data in
io
with the given boundary
. - .parse_header(raw) ⇒ Object
-
.parse_query(str) ⇒ Object
Parses the query component of a URI in
str
. -
.parse_qvalues(value) ⇒ Object
Parses q values in
value
as used in Accept headers. -
.parse_range_header(ranges_specifier) ⇒ Object
Parses a Range header value
ranges_specifier
. -
.quote(str) ⇒ Object
Quotes and escapes quotes in
str
. -
.split_header_value(str) ⇒ Object
Splits a header value
str
according to HTTP specification. -
.unescape(str) ⇒ Object
Unescapes HTTP reserved and unwise characters in
str
. -
.unescape_form(str) ⇒ Object
Unescapes form reserved characters in
str
.
Class Method Details
._escape(str, regex) ⇒ Object
474 475 476 477 478 479 |
# File 'lib/webrick/httputils.rb', line 474
# Percent-encodes every character of +str+ captured by group 1 of +regex+.
#
# The work is done on a binary copy, so +str+ itself is not modified. Each
# captured character is replaced by "%XX" (two uppercase hex digits) and the
# result is tagged as US-ASCII.
def _escape(str, regex)
  encoded = str.b
  encoded.gsub!(regex) { format("%%%02X", Regexp.last_match(1).ord) }
  # A %-escaped string is expected to contain US-ASCII only.
  encoded.force_encoding(Encoding::US_ASCII)
end
._make_regex(str) ⇒ Object
:stopdoc:
472 |
# File 'lib/webrick/httputils.rb', line 472
# Builds a binary (/n) regexp whose single capture group matches any one
# character listed in +str+. The characters are regexp-escaped first so they
# are taken literally inside the character class.
def _make_regex(str)
  char_class = Regexp.escape(str)
  /([#{char_class}])/n
end
._make_regex!(str) ⇒ Object
473 |
# File 'lib/webrick/httputils.rb', line 473
# Builds a binary (/n) regexp whose single capture group matches any one
# character that is NOT listed in +str+ (a negated character class).
def _make_regex!(str)
  char_class = Regexp.escape(str)
  /([^#{char_class}])/n
end
._unescape(str, regex) ⇒ Object
480 481 482 483 484 485 |
# File 'lib/webrick/httputils.rb', line 480
# Replaces every match of +regex+ in a binary copy of +str+ with the single
# byte whose hexadecimal value is capture group 1.
#
# The returned string stays binary because the encoding of the decoded bytes
# is unknown. +str+ itself is not modified.
def _unescape(str, regex)
  decoded = str.b
  decoded.gsub!(regex) { Regexp.last_match(1).hex.chr }
  decoded
end
.dequote(str) ⇒ Object
Removes quotes and escapes from str
254 255 256 257 258 |
# File 'lib/webrick/httputils.rb', line 254
# Strips one pair of surrounding double quotes from +str+ (when present) and
# removes the backslash from every backslash-escaped character.
#
# Always returns a new string; +str+ is left unchanged.
def dequote(str)
  unquoted = str =~ /\A"(.*)"\Z/ ? Regexp.last_match(1) : str.dup
  # "\\1" is the back-reference \1: keep the escaped character, drop the "\".
  unquoted.gsub!(/\\(.)/, "\\1")
  unquoted
end
.escape(str) ⇒ Object
Escapes HTTP reserved and unwise characters in str
498 499 500 |
# File 'lib/webrick/httputils.rb', line 498 def escape(str) _escape(str, UNESCAPED) end |
.escape8bit(str) ⇒ Object
Escapes 8 bit characters in str
539 540 541 |
# File 'lib/webrick/httputils.rb', line 539 def escape8bit(str) _escape(str, NONASCII) end |
.escape_form(str) ⇒ Object
Escapes form reserved characters in str
512 513 514 515 516 |
# File 'lib/webrick/httputils.rb', line 512
# Escapes +str+ for use as form data: characters matched by UNESCAPED_FORM
# are percent-encoded via _escape, then every remaining space becomes "+".
def escape_form(str)
  _escape(str, UNESCAPED_FORM).tap { |encoded| encoded.gsub!(/ /, "+") }
end
.escape_path(str) ⇒ Object
Escapes path str
528 529 530 531 532 533 534 |
# File 'lib/webrick/httputils.rb', line 528
# Escapes a path segment by segment.
#
# Every "/segment" found in +str+ is re-emitted as "/" followed by the segment
# passed through _escape with UNESCAPED_PCHAR. Text before the first "/" is
# not scanned and therefore does not appear in the result.
def escape_path(str)
  str.scan(%r{/([^/]*)}).each_with_object(+"") do |(segment), escaped|
    escaped << "/" << _escape(segment, UNESCAPED_PCHAR)
  end
end
.load_mime_types(file) ⇒ Object
Loads Apache-compatible mime.types in file
.
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 |
# File 'lib/webrick/httputils.rb', line 122
# Reads an Apache-style mime.types file and returns a Hash mapping each
# extension to its mime type.
#
# Lines starting with "#" are skipped, as are lines that carry a mime type
# but no extensions. When an extension is listed more than once, the last
# occurrence wins.
#
# NOTE(review): an older comment said +file+ may be a "| command"; the code
# opens it with File.open, so confirm whether that is still intended.
def load_mime_types(file)
  File.open(file) do |io|
    io.each_with_object({}) do |line, table|
      next if /^#/ =~ line
      line.chomp!
      mimetype, extensions = line.split(/\s+/, 2)
      next if !extensions || extensions.empty?
      extensions.split(/\s+/).each { |ext| table[ext] = mimetype }
    end
  end
end
.mime_type(filename, mime_tab) ⇒ Object
Returns the mime type of filename
from the list in mime_tab
. If no mime type was found application/octet-stream is returned.
144 145 146 147 148 |
# File 'lib/webrick/httputils.rb', line 144
# Looks up the mime type for +filename+ in +mime_tab+.
#
# The last extension is tried first (lower-cased); if it is unknown, the
# extension before it is tried, which covers names such as "index.html.en".
# Falls back to "application/octet-stream".
def mime_type(filename, mime_tab)
  last_ext = Regexp.last_match(1).downcase if /\.(\w+)$/ =~ filename
  inner_ext = Regexp.last_match(1).downcase if /\.(\w+)\.[\w\-]+$/ =~ filename
  mime_tab[last_ext] || mime_tab[inner_ext] || "application/octet-stream"
end
.normalize_path(path) ⇒ Object
Normalizes a request path. Raises an exception if the path cannot be normalized.
31 32 33 34 35 36 37 38 39 40 41 |
# File 'lib/webrick/httputils.rb', line 31
# Normalizes a request path and returns the result as a new string.
#
# Raises RuntimeError ("abnormal path '...'") when +path+ does not start with
# "/" or when a ".." segment is left over after normalization, i.e. the path
# would climb above the root.
def normalize_path(path)
  raise "abnormal path '#{path}'" unless path[0] == ?/
  cleaned = path.dup
  # Collapse runs of slashes into one.
  cleaned.gsub!(%r{/+}o, '/')
  # Drop "." segments one at a time: "/./" and a trailing "/." become "/".
  loop { break unless cleaned.sub!(%r'/\.(?:/|\Z)', '/') }
  # Cancel each "segment/.." pair one at a time: "/foo/.." becomes "/".
  loop { break unless cleaned.sub!(%r'/(?!\.\./)[^/]+/\.\.(?:/|\Z)', '/') }
  raise "abnormal path '#{path}'" if cleaned =~ %r{/\.\.(/|\Z)}
  cleaned
end
.parse_form_data(io, boundary) ⇒ Object
Parses form data in io
with the given boundary
426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 |
# File 'lib/webrick/httputils.rb', line 426
# Parses multipart form data read line by line from +io+, using +boundary+ as
# the part delimiter, and returns a Hash keyed by each part's name.
#
# Returns an empty Hash when +io+ is nil/false. When two parts share a name,
# the later one is attached to the first via append_data.
def parse_form_data(io, boundary)
  boundary_regexp = /\A--#{Regexp.quote(boundary)}(--)?#{CRLF}\z/
  form_data = Hash.new
  return form_data unless io

  current = nil
  io.each_line do |line|
    unless boundary_regexp =~ line
      # Content line: only meaningful once the first boundary has been seen.
      current << line if current
      next
    end

    # A boundary line closes the part collected so far (if any).
    if current
      # NOTE(review): presumably drops the line terminator that precedes the
      # boundary — confirm against FormData#chop!.
      current.chop!
      key = current.name
      if form_data.has_key?(key)
        form_data[key].append_data(current)
      else
        form_data[key] = current
      end
    end
    current = FormData.new
  end
  form_data
end
.parse_header(raw) ⇒ Object
171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 |
# File 'lib/webrick/httputils.rb', line 171 def parse_header(raw) header = Hash.new([].freeze) field = nil raw.each_line{|line| case line when /^([A-Za-z0-9!\#$%&'*+\-.^_`|~]+):([^\r\n\0]*?)\r\n\z/om field, value = $1, $2 field.downcase! header[field] = HEADER_CLASSES[field].new unless header.has_key?(field) header[field] << value when /^[ \t]+([^\r\n\0]*?)\r\n/om unless field raise HTTPStatus::BadRequest, "bad header '#{line}'." end value = line value.gsub!(/\A[ \t]+/, '') value.slice!(-2..-1) header[field][-1] << " " << value else raise HTTPStatus::BadRequest, "bad header '#{line}'." end } header.each{|key, values| values.each{|value| value.gsub!(/\A[ \t]+/, '') value.gsub!(/[ \t]+\z/, '') } } header end |
.parse_query(str) ⇒ Object
Parses the query component of a URI in str
402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 |
# File 'lib/webrick/httputils.rb', line 402
# Parses the query component +str+ into a Hash of FormData objects keyed by
# the form-unescaped parameter name.
#
# Pairs are separated by "&" or ";" and empty pairs are ignored. A pair
# without "=" gets an empty value. Repeated keys are attached to the first
# occurrence via append_data. Returns an empty Hash when +str+ is nil/false.
def parse_query(str)
  query = Hash.new
  return query unless str

  str.split(/[&;]/).each do |pair|
    next if pair.empty?
    raw_key, raw_val = pair.split(/=/, 2)
    key = unescape_form(raw_key)
    field = FormData.new(unescape_form(raw_val.to_s))
    field.name = key
    if query.has_key?(key)
      query[key].append_data(field)
    else
      query[key] = field
    end
  end
  query
end
.parse_qvalues(value) ⇒ Object
Parses q values in value
as used in Accept headers.
233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 |
# File 'lib/webrick/httputils.rb', line 233
# Parses a comma-separated list with optional ";q=" weights (as used in
# Accept-style headers) and returns the item names ordered from highest to
# lowest q value.
#
# Items without a q parameter count as q=1. Items that do not match the
# expected shape are dropped. Returns [] when +value+ is nil/false.
def parse_qvalues(value)
  return [] unless value

  weighted = value.split(/,[ \t]*/).each_with_object([]) do |part, acc|
    m = %r{^([^ \t,]+?)(?:;[ \t]*q=(\d+(?:\.\d+)?))?$}.match(part)
    acc << [m[1], (m[2] || 1).to_f] if m
  end
  weighted.sort_by { |_name, q| -q }.map { |name, _q| name }
end
.parse_range_header(ranges_specifier) ⇒ Object
Parses a Range header value ranges_specifier
215 216 217 218 219 220 221 222 223 224 225 226 227 |
# File 'lib/webrick/httputils.rb', line 215
# Parses a Range header value such as "bytes=0-99,200-,-50" into an Array of
# Ranges:
#   "A-B" => A..B,  "A-" => A..-1,  "-N" => -N..-1
#
# Returns nil when +ranges_specifier+ does not begin a line with "bytes=" or
# when any element of the list has none of the three shapes above.
def parse_range_header(ranges_specifier)
  return nil unless /^bytes=(.*)/ =~ ranges_specifier

  split_header_value(Regexp.last_match(1)).map do |range_spec|
    if (m = /^(\d+)-(\d+)/.match(range_spec))
      (m[1].to_i)..(m[2].to_i)
    elsif (m = /^(\d+)-/.match(range_spec))
      (m[1].to_i)..-1
    elsif (m = /^-(\d+)/.match(range_spec))
      (-(m[1].to_i))..-1
    else
      # One bad element invalidates the whole header.
      return nil
    end
  end
end
.quote(str) ⇒ Object
Quotes and escapes quotes in str
264 265 266 |
# File 'lib/webrick/httputils.rb', line 264
# Wraps +str+ in double quotes, putting a backslash in front of every
# backslash and double quote it contains. Returns a new string; +str+ is not
# modified.
def quote(str)
  # Block form is deliberate. The former replacement string "\\\1" was, in a
  # double-quoted literal, a backslash followed by the octal escape \001, and
  # the pattern has no capture group, so each matched character was replaced
  # by "\" + U+0001 instead of being escaped.
  escaped = str.gsub(/[\\"]/) { |ch| "\\#{ch}" }
  +'"' << escaped << '"'
end
.split_header_value(str) ⇒ Object
Splits a header value str
according to HTTP specification.
206 207 208 209 |
# File 'lib/webrick/httputils.rb', line 206
# Splits the header value +str+ on commas and returns the elements as an
# Array of Strings. Commas inside double-quoted sections do not split, and
# the quotes are kept in the returned elements.
def split_header_value(str)
  # Extended (/x) pattern, so the blank between the two halves is ignored:
  #   group 1 - one element: a run of quoted strings and/or non-comma text
  #   tail    - the separating comma plus optional blanks, or end of string
  element = %r'\G((?:"(?:\\.|[^"])+?"|[^",]++)+) (?:,[ \t]*|\Z)'xn
  str.scan(element).flatten
end
.unescape(str) ⇒ Object
Unescapes HTTP reserved and unwise characters in str
505 506 507 |
# File 'lib/webrick/httputils.rb', line 505 def unescape(str) _unescape(str, ESCAPED) end |
.unescape_form(str) ⇒ Object
Unescapes form reserved characters in str
521 522 523 |
# File 'lib/webrick/httputils.rb', line 521
# Decodes form-encoded +str+: every "+" is first turned into a space, then
# the %XX sequences matched by ESCAPED are decoded via _unescape.
def unescape_form(str)
  with_spaces = str.gsub(/\+/, " ")
  _unescape(with_spaces, ESCAPED)
end