File: media_types.rb

package info (click to toggle)
ruby-http-accept 2.2.1-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 136 kB
  • sloc: ruby: 352; makefile: 4
file content (125 lines) | stat: -rw-r--r-- 3,586 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
# frozen_string_literal: true

# Released under the MIT License.
# Copyright, 2016-2024, by Samuel Williams.

require 'strscan'

require_relative 'parse_error'
require_relative 'quoted_string'
require_relative 'sort'

require_relative 'media_types/map'

module HTTP
	module Accept
		# Parse and process the HTTP Accept: header.
		module MediaTypes
			# Patterns for the media-range grammar, according to https://tools.ietf.org/html/rfc7231#section-5.3.2
			# TOKEN and QUOTED_STRING are not defined in this file (presumably they come from quoted_string.rb — confirm).
			#
			# MIME_TYPE matches `type/subtype` and exposes both halves as the named captures `type` and `subtype`.
			MIME_TYPE = /(?<type>#{TOKEN})\/(?<subtype>#{TOKEN})/
			# PARAMETER matches a single `; key=value` parameter, allowing whitespace around the semicolon. The value is captured as `value` when it is a bare token, or as `quoted_value` when it is a quoted string.
			PARAMETER = /\s*;\s*(?<key>#{TOKEN})=((?<value>#{TOKEN})|(?<quoted_value>#{QUOTED_STRING}))/
			
			# A single entry in the Accept: header, which includes a mime type and associated parameters.
			#
			# Members:
			# - type: the part before the slash, e.g. "text" or "*".
			# - subtype: the part after the slash, e.g. "html"; defaults to "*".
			# - parameters: a hash of parameter name to value, e.g. {"q" => "0.5"}; defaults to {}.
			MediaRange = Struct.new(:type, :subtype, :parameters) do
				# Only `type` is required; `subtype` and `parameters` fall back to "*" and {}.
				def initialize(type, subtype = '*', parameters = {})
					super(type, subtype, parameters)
				end
				
				# Render the parameters in the form they take after the mime type: each one as `; key=value`, with the value passed through QuotedString.quote.
				# Returns an empty string when parameters is nil or empty.
				def parameters_string
					return '' if parameters.nil? || parameters.empty?
					
					parameters.map do |key, value|
						"; #{key}=#{QuotedString.quote(value.to_s)}"
					end.join
				end
				
				# Case equality. Another MediaRange is compared using the inherited `===`; any other object is compared against #mime_type, so parameters play no part in that comparison.
				def === other
					if other.is_a? self.class
						super
					else
						mime_type === other
					end
				end
				
				# The `type/subtype` string without any parameters.
				def mime_type
					"#{type}/#{subtype}"
				end
				
				# The full textual form: mime type followed by the rendered parameters.
				def to_s
					"#{type}/#{subtype}#{parameters_string}"
				end
				
				# Defining to_str lets a MediaRange be used where Ruby implicitly converts to String.
				alias to_str to_s
				
				# The `q` parameter converted to a float. Returns 1.0 when there is no `q` parameter.
				# A nil parameters member is treated like an empty one, matching #parameters_string, rather than raising NoMethodError.
				def quality_factor
					return 1.0 unless parameters
					
					parameters.fetch('q', 1.0).to_f
				end
				
				# Returns [type, subtype]. Any arguments are accepted and ignored.
				def split(*args)
					[type, subtype]
				end
				
				# Consume consecutive parameters starting at the scanner's current position and return them as a hash of key to value.
				# Quoted values are unquoted with QuotedString.unquote, which receives normalize_whitespace unchanged.
				# When a key appears more than once, the last occurrence wins.
				def self.parse_parameters(scanner, normalize_whitespace)
					parameters = {}
					
					while scanner.scan(PARAMETER)
						key = scanner[:key]
						
						# If the regular expression PARAMETER matched, it must be one of these two:
						if value = scanner[:value]
							parameters[key] = value
						elsif quoted_value = scanner[:quoted_value]
							parameters[key] = QuotedString.unquote(quoted_value, normalize_whitespace)
						end
					end
					
					parameters
				end
				
				# Parse media ranges from the scanner, yielding one MediaRange per entry. Entries are separated by commas with optional surrounding whitespace.
				# Without a block, an enumerator is returned and the parsing (including any error) happens when it is consumed.
				# Raises ParseError if input remains once no further entry can be read.
				def self.parse(scanner, normalize_whitespace = true)
					return to_enum(:parse, scanner, normalize_whitespace) unless block_given?
					
					while scanner.scan(MIME_TYPE)
						type = scanner[:type]
						subtype = scanner[:subtype]
						
						parameters = parse_parameters(scanner, normalize_whitespace)
						
						yield new(type, subtype, parameters)
						
						# Are there more?
						break unless scanner.scan(/\s*,\s*/)
					end
					
					raise ParseError, "Could not parse entire string!" unless scanner.eos?
				end
			end
			
			# Parse the text of an Accept: header.
			# The text is wrapped in a StringScanner and handed to MediaRange.parse; the resulting media ranges are passed to Sort.by_quality_factor, whose result is returned (presumably ordered by quality factor — confirm in sort.rb).
			# normalize_whitespace is forwarded unchanged to MediaRange.parse.
			def self.parse(text, normalize_whitespace = true)
				media_ranges = MediaRange.parse(StringScanner.new(text), normalize_whitespace)
				
				Sort.by_quality_factor(media_ranges)
			end
			
			# Key used to look up the Accept header value in the `env` hash given to browser_preferred_media_types.
			HTTP_ACCEPT = 'HTTP_ACCEPT'.freeze
			# The `*/*` media range with no parameters, returned when a request carries no usable Accept header.
			# NOTE(review): `freeze` on a Struct is shallow, so the parameters hash itself stays mutable.
			WILDCARD_MEDIA_RANGE = MediaRange.new("*", "*", {}).freeze
			
			# Work out the media types a client prefers from a request `env` hash.
			# The value stored under HTTP_ACCEPT is stripped and, if anything remains, parsed with MediaTypes.parse, whose result is returned. If no `Accept:` header is specified (or it is blank), the behaviour is the same as if `Accept: */*` was provided (according to RFC).
			def self.browser_preferred_media_types(env)
				header = env[HTTP_ACCEPT]&.strip
				
				# According to http://tools.ietf.org/html/rfc7231#section-5.3.2:
				# A request without any Accept header field implies that the user agent will accept any media type in response.
				# So a non-existent (or blank) Accept header is treated as */*.
				return [WILDCARD_MEDIA_RANGE] if !header || header.empty?
				
				HTTP::Accept::MediaTypes.parse(header)
			end
		end
	end
end