• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1"""MIME-Type Parser
2
3This module provides basic functions for handling mime-types. It can handle
4matching mime-types against a list of media-ranges. See section 14.1 of
5the HTTP specification [RFC 2616] for a complete explanation.
6
7   http://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html#sec14.1
8
9Based on mimeparse 0.1.2 by Joe Gregorio:
10
11    http://code.google.com/p/mimeparse/
12
13Contents:
14    - parse_mime_type():   Parses a mime-type into its component parts.
15    - parse_media_range(): Media-ranges are mime-types with wild-cards and a 'q' quality parameter.
16    - quality():           Determines the quality ('q') of a mime-type when compared against a list of media-ranges.
17    - quality_parsed():    Just like quality() except the second parameter must be pre-parsed.
18    - best_match():        Choose the mime-type with the highest quality ('q') from a list of candidates.
19    - desired_matches():   Filter against a list of desired mime-types in the order the server prefers.
20
21"""
22
23
def parse_mime_type(mime_type):
    """Split a mime-type string into (type, subtype, params).

    'params' is a dictionary mapping each parameter name to its value,
    both stripped of surrounding whitespace. For example, the mime-type
    'application/xhtml;q=0.5' is parsed into:

    ('application', 'xhtml', {'q': '0.5'})

    A missing or empty type or subtype is reported as '*', so both
    'text' and 'text/' yield a subtype of '*'. Parameters without an
    '=' sign, or with an empty name or value, are ignored. When a
    parameter name occurs more than once the last value wins.
    """
    pieces = mime_type.split(';')

    # Only the first '/' separates type from subtype; when there is no
    # '/' at all the subtype part comes back empty and falls through to
    # the wildcard default below.
    main_part, _slash, sub_part = pieces[0].partition('/')
    main_part = main_part.strip() or '*'
    sub_part = sub_part.strip() or '*'

    params = {}
    for chunk in pieces[1:]:
        # Without an '=' the value part is empty, so the chunk is
        # dropped by the same check that rejects 'name='.
        name, _equals, value = chunk.partition('=')
        name = name.strip()
        value = value.strip()
        if name and value:
            params[name] = value
    return main_part, sub_part, params
50
def parse_media_range(range):
    """Split a media range into (type, subtype, params).

    Works like parse_mime_type(), so the media range
    'application/*;q=0.5' is parsed into:

    ('application', '*', {'q': '0.5'})

    In addition the returned params dictionary always contains a 'q'
    entry: when 'q' is absent, is not a number, or lies outside the
    interval [0, 1], it is set to the string '1'.
    """
    main_part, sub_part, params = parse_mime_type(range)

    raw_q = params.get('q')
    q_is_valid = False
    if raw_q is not None:
        try:
            q_is_valid = 0 <= float(raw_q) <= 1
        except ValueError:
            # Not parseable as a number: treated like a missing 'q'.
            q_is_valid = False
    if not q_is_valid:
        params['q'] = '1'
    return main_part, sub_part, params
71
def fitness_and_quality_parsed(mime_type, parsed_ranges):
    """Score a mime-type against media ranges that are already parsed.

    'parsed_ranges' must be a list of tuples as returned by
    parse_media_range(). Returns (fitness, q) for the best-fitting
    range, where q is a float, or (-1, 0.0) when no range matches.

    A range matches when its type and its subtype each either equal
    the target's or one of the two is the '*' wildcard. Fitness is
    100 for an exact type match, plus 10 for an exact subtype match,
    plus 1 for every non-'q' parameter of the target that the range
    carries with the same value. When several ranges reach the same
    fitness, the first one in the list is kept.
    """
    want_type, want_subtype, want_params = parse_media_range(mime_type)
    top_fitness = -1
    top_q = 0

    for rng_type, rng_subtype, rng_params in parsed_ranges:
        same_type = rng_type == want_type
        same_subtype = rng_subtype == want_subtype

        # Skip ranges that are incompatible on either component.
        if not (same_type or rng_type == '*' or want_type == '*'):
            continue
        if not (same_subtype or rng_subtype == '*' or want_subtype == '*'):
            continue

        score = 0
        if same_type:
            score += 100
        if same_subtype:
            score += 10
        for name, value in want_params.items():
            if name == 'q' or name not in rng_params:
                continue
            if rng_params[name] == value:
                score += 1

        # Strict comparison: an equally good later range never
        # displaces an earlier one.
        if score > top_fitness:
            top_fitness, top_q = score, rng_params['q']

    return top_fitness, float(top_q)
100
def quality_parsed(mime_type, parsed_ranges):
    """Return the 'q' value of the range that best fits a mime-type.

    Same as quality(), except that 'parsed_ranges' must already be a
    list of media ranges parsed by parse_media_range(). The result is
    the quality component reported by fitness_and_quality_parsed(),
    which is 0 when no range matches.
    """
    _fitness, q_value = fitness_and_quality_parsed(mime_type, parsed_ranges)
    return q_value
110
def quality(mime_type, ranges):
    """Return the quality 'q' of a mime-type against a list of ranges.

    'ranges' is a comma-separated string of media-ranges, in the
    format of an HTTP Accept: header. For example:

    >>> quality('text/html','text/*;q=0.3, text/html;q=0.7, text/html;level=1, text/html;level=2;q=0.4, */*;q=0.5')
    0.7

    """
    # Build a real list rather than passing a bare map(): the parsed
    # helpers are documented to take a list, and on Python 3 map()
    # yields a one-shot iterator that would be silently empty if it
    # were ever walked a second time.
    parsed_ranges = [parse_media_range(item) for item in ranges.split(',')]
    return quality_parsed(mime_type, parsed_ranges)
121
def best_match(supported, header):
    """Pick the supported mime-type that the header prefers most.

    'supported' is a list of mime-types and 'header' is a string in
    the format of the HTTP Accept: header. Candidates are ranked by
    the quality ('q') of their best-fitting media range, then by how
    specific that fit is; if candidates are still tied, whatever
    comes first in 'supported' is chosen. Returns '' when 'supported'
    is empty or when no candidate has a non-zero quality.

    >>> best_match(['application/xbel+xml', 'text/xml'], 'text/*;q=0.5,*/*; q=0.1')
    'text/xml'
    """
    if not supported:
        return ''
    parsed_header = [parse_media_range(item) for item in header.split(',')]

    ranked = []
    for position, mime_type in enumerate(supported):
        fitness, q_value = fitness_and_quality_parsed(mime_type, parsed_header)
        # Quality is compared before fitness. Ranking on fitness first
        # would let a candidate matched by a specific range with a low
        # (or zero) q beat one the client rates higher through a
        # wildcard, e.g. 'text/html;q=0, */*;q=0.5'.
        # The negated position makes max() favour earlier entries.
        ranked.append((q_value, fitness, -position))

    best_q, _best_fitness, negated_position = max(ranked)
    if not best_q:
        # Either nothing matched or the best match is q=0 (refused).
        return ''
    return supported[-negated_position] or ''
140
def desired_matches(desired, header):
    """Filter the server's preferred mime-types by what the client accepts.

    'desired' lists mime-types in the order the server prefers to send
    them, regardless of the browser's own preference, and 'header' is
    a string in the format of the HTTP Accept: header.

    Browsers (such as Firefox) technically want XML over HTML depending
    on how one reads the specification. This function lets a server
    declare the mime-types it would like to send and get back the
    subset, in the same order, whose quality against the header is
    non-zero.

    >>> desired_matches(['text/html', 'application/xml'],
    ...     'text/xml,application/xml,application/xhtml+xml,'
    ...     'text/html;q=0.9,text/plain;q=0.8,image/png')
    ['text/html', 'application/xml']
    >>> desired_matches(['text/html', 'application/xml'], 'application/xml,application/json')
    ['application/xml']
    """
    parsed_ranges = [parse_media_range(part) for part in header.split(',')]
    accepted = []
    for candidate in desired:
        if quality_parsed(candidate, parsed_ranges):
            accepted.append(candidate)
    return accepted
160
161