cookies.py 21 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636
  1. ####
  2. # Copyright 2000 by Timothy O'Malley <timo@alum.mit.edu>
  3. #
  4. # All Rights Reserved
  5. #
  6. # Permission to use, copy, modify, and distribute this software
  7. # and its documentation for any purpose and without fee is hereby
  8. # granted, provided that the above copyright notice appear in all
  9. # copies and that both that copyright notice and this permission
  10. # notice appear in supporting documentation, and that the name of
  11. # Timothy O'Malley not be used in advertising or publicity
  12. # pertaining to distribution of the software without specific, written
  13. # prior permission.
  14. #
  15. # Timothy O'Malley DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS
  16. # SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY
  17. # AND FITNESS, IN NO EVENT SHALL Timothy O'Malley BE LIABLE FOR
  18. # ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
  19. # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
  20. # WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
  21. # ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
  22. # PERFORMANCE OF THIS SOFTWARE.
  23. #
  24. ####
  25. #
  26. # Id: Cookie.py,v 2.29 2000/08/23 05:28:49 timo Exp
  27. # by Timothy O'Malley <timo@alum.mit.edu>
  28. #
  29. # Cookie.py is a Python module for the handling of HTTP
  30. # cookies as a Python dictionary. See RFC 2109 for more
  31. # information on cookies.
  32. #
  33. # The original idea to treat Cookies as a dictionary came from
  34. # Dave Mitchell (davem@magnet.com) in 1995, when he released the
  35. # first version of nscookie.py.
  36. #
  37. ####
  38. r"""
  39. Here's a sample session to show how to use this module.
  40. At the moment, this is the only documentation.
  41. The Basics
  42. ----------
  43. Importing is easy...
  44. >>> from http import cookies
  45. Most of the time you start by creating a cookie.
  46. >>> C = cookies.SimpleCookie()
  47. Once you've created your Cookie, you can add values just as if it were
  48. a dictionary.
  49. >>> C = cookies.SimpleCookie()
  50. >>> C["fig"] = "newton"
  51. >>> C["sugar"] = "wafer"
  52. >>> C.output()
  53. 'Set-Cookie: fig=newton\r\nSet-Cookie: sugar=wafer'
  54. Notice that the printable representation of a Cookie is the
  55. appropriate format for a Set-Cookie: header. This is the
  56. default behavior. You can change the header and printed
  57. attributes by using the .output() function
  58. >>> C = cookies.SimpleCookie()
  59. >>> C["rocky"] = "road"
  60. >>> C["rocky"]["path"] = "/cookie"
  61. >>> print(C.output(header="Cookie:"))
  62. Cookie: rocky=road; Path=/cookie
  63. >>> print(C.output(attrs=[], header="Cookie:"))
  64. Cookie: rocky=road
  65. The load() method of a Cookie extracts cookies from a string. In a
  66. CGI script, you would use this method to extract the cookies from the
  67. HTTP_COOKIE environment variable.
  68. >>> C = cookies.SimpleCookie()
  69. >>> C.load("chips=ahoy; vienna=finger")
  70. >>> C.output()
  71. 'Set-Cookie: chips=ahoy\r\nSet-Cookie: vienna=finger'
  72. The load() method is darn-tootin smart about identifying cookies
  73. within a string. Escaped quotation marks, nested semicolons, and other
  74. such trickeries do not confuse it.
  75. >>> C = cookies.SimpleCookie()
  76. >>> C.load('keebler="E=everybody; L=\\"Loves\\"; fudge=\\012;";')
  77. >>> print(C)
  78. Set-Cookie: keebler="E=everybody; L=\"Loves\"; fudge=\012;"
  79. Each element of the Cookie also supports all of the RFC 2109
  80. Cookie attributes. Here's an example which sets the Path
  81. attribute.
  82. >>> C = cookies.SimpleCookie()
  83. >>> C["oreo"] = "doublestuff"
  84. >>> C["oreo"]["path"] = "/"
  85. >>> print(C)
  86. Set-Cookie: oreo=doublestuff; Path=/
  87. Each dictionary element has a 'value' attribute, which gives you
  88. back the value associated with the key.
  89. >>> C = cookies.SimpleCookie()
  90. >>> C["twix"] = "none for you"
  91. >>> C["twix"].value
  92. 'none for you'
  93. The SimpleCookie expects that all values should be standard strings.
  94. Just to be sure, SimpleCookie invokes the str() builtin to convert
  95. the value to a string, when the values are set dictionary-style.
  96. >>> C = cookies.SimpleCookie()
  97. >>> C["number"] = 7
  98. >>> C["string"] = "seven"
  99. >>> C["number"].value
  100. '7'
  101. >>> C["string"].value
  102. 'seven'
  103. >>> C.output()
  104. 'Set-Cookie: number=7\r\nSet-Cookie: string=seven'
  105. Finis.
  106. """
  107. #
  108. # Import our required modules
  109. #
  110. import re
  111. import string
# Public names exported by a star-import of this module.
__all__ = ["CookieError", "BaseCookie", "SimpleCookie"]

# Pre-bound ``str.join`` methods: each takes an iterable of strings and joins
# it with the empty string, "; " or a single space respectively.
_nulljoin = ''.join
_semispacejoin = '; '.join
_spacejoin = ' '.join
  116. def _warn_deprecated_setter(setter):
  117. import warnings
  118. msg = ('The .%s setter is deprecated. The attribute will be read-only in '
  119. 'future releases. Please use the set() method instead.' % setter)
  120. warnings.warn(msg, DeprecationWarning, stacklevel=3)
  121. #
  122. # Define an exception visible to External modules
  123. #
  124. class CookieError(Exception):
  125. pass
  126. # These quoting routines conform to the RFC2109 specification, which in
  127. # turn references the character definitions from RFC2068. They provide
  128. # a two-way quoting algorithm. Any non-text character is translated
  129. # into a 4 character sequence: a backslash followed by the
  130. # three-digit octal equivalent of the character. Any '\' or '"' is
  131. # quoted with a preceding '\' slash.
  132. # Because of the way browsers really handle cookies (as opposed to what
  133. # the RFC says) we also encode "," and ";".
  134. #
  135. # These are taken from RFC2068 and RFC2109.
  136. # _LegalChars is the list of chars which don't require "'s
  137. # _Translator hash-table for fast quoting
  138. #
  139. _LegalChars = string.ascii_letters + string.digits + "!#$%&'*+-.^_`|~:"
  140. _UnescapedChars = _LegalChars + ' ()/<=>?@[]{}'
  141. _Translator = {n: '\\%03o' % n
  142. for n in set(range(256)) - set(map(ord, _UnescapedChars))}
  143. _Translator.update({
  144. ord('"'): '\\"',
  145. ord('\\'): '\\\\',
  146. })
  147. _is_legal_key = re.compile('[%s]+' % re.escape(_LegalChars)).fullmatch
  148. def _quote(str):
  149. r"""Quote a string for use in a cookie header.
  150. If the string does not need to be double-quoted, then just return the
  151. string. Otherwise, surround the string in doublequotes and quote
  152. (with a \) special characters.
  153. """
  154. if str is None or _is_legal_key(str):
  155. return str
  156. else:
  157. return '"' + str.translate(_Translator) + '"'
  158. _OctalPatt = re.compile(r"\\[0-3][0-7][0-7]")
  159. _QuotePatt = re.compile(r"[\\].")
  160. def _unquote(str):
  161. # If there aren't any doublequotes,
  162. # then there can't be any special characters. See RFC 2109.
  163. if str is None or len(str) < 2:
  164. return str
  165. if str[0] != '"' or str[-1] != '"':
  166. return str
  167. # We have to assume that we must decode this string.
  168. # Down to work.
  169. # Remove the "s
  170. str = str[1:-1]
  171. # Check for special sequences. Examples:
  172. # \012 --> \n
  173. # \" --> "
  174. #
  175. i = 0
  176. n = len(str)
  177. res = []
  178. while 0 <= i < n:
  179. o_match = _OctalPatt.search(str, i)
  180. q_match = _QuotePatt.search(str, i)
  181. if not o_match and not q_match: # Neither matched
  182. res.append(str[i:])
  183. break
  184. # else:
  185. j = k = -1
  186. if o_match:
  187. j = o_match.start(0)
  188. if q_match:
  189. k = q_match.start(0)
  190. if q_match and (not o_match or k < j): # QuotePatt matched
  191. res.append(str[i:k])
  192. res.append(str[k+1])
  193. i = k + 2
  194. else: # OctalPatt matched
  195. res.append(str[i:j])
  196. res.append(chr(int(str[j+1:j+4], 8)))
  197. i = j + 4
  198. return _nulljoin(res)
  199. # The _getdate() routine is used to set the expiration time in the cookie's HTTP
  200. # header. By default, _getdate() returns the current time in the appropriate
  201. # "expires" format for a Set-Cookie header. The one optional argument is an
  202. # offset from now, in seconds. For example, an offset of -3600 means "one hour
  203. # ago". The offset may be a floating point number.
  204. #
  205. _weekdayname = ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun']
  206. _monthname = [None,
  207. 'Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun',
  208. 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec']
  209. def _getdate(future=0, weekdayname=_weekdayname, monthname=_monthname):
  210. from time import gmtime, time
  211. now = time()
  212. year, month, day, hh, mm, ss, wd, y, z = gmtime(now + future)
  213. return "%s, %02d %3s %4d %02d:%02d:%02d GMT" % \
  214. (weekdayname[wd], day, monthname[month], year, hh, mm, ss)
  215. class Morsel(dict):
  216. """A class to hold ONE (key, value) pair.
  217. In a cookie, each such pair may have several attributes, so this class is
  218. used to keep the attributes associated with the appropriate key,value pair.
  219. This class also includes a coded_value attribute, which is used to hold
  220. the network representation of the value. This is most useful when Python
  221. objects are pickled for network transit.
  222. """
  223. # RFC 2109 lists these attributes as reserved:
  224. # path comment domain
  225. # max-age secure version
  226. #
  227. # For historical reasons, these attributes are also reserved:
  228. # expires
  229. #
  230. # This is an extension from Microsoft:
  231. # httponly
  232. #
  233. # This dictionary provides a mapping from the lowercase
  234. # variant on the left to the appropriate traditional
  235. # formatting on the right.
  236. _reserved = {
  237. "expires" : "expires",
  238. "path" : "Path",
  239. "comment" : "Comment",
  240. "domain" : "Domain",
  241. "max-age" : "Max-Age",
  242. "secure" : "Secure",
  243. "httponly" : "HttpOnly",
  244. "version" : "Version",
  245. }
  246. _flags = {'secure', 'httponly'}
  247. def __init__(self):
  248. # Set defaults
  249. self._key = self._value = self._coded_value = None
  250. # Set default attributes
  251. for key in self._reserved:
  252. dict.__setitem__(self, key, "")
  253. @property
  254. def key(self):
  255. return self._key
  256. @key.setter
  257. def key(self, key):
  258. _warn_deprecated_setter('key')
  259. self._key = key
  260. @property
  261. def value(self):
  262. return self._value
  263. @value.setter
  264. def value(self, value):
  265. _warn_deprecated_setter('value')
  266. self._value = value
  267. @property
  268. def coded_value(self):
  269. return self._coded_value
  270. @coded_value.setter
  271. def coded_value(self, coded_value):
  272. _warn_deprecated_setter('coded_value')
  273. self._coded_value = coded_value
  274. def __setitem__(self, K, V):
  275. K = K.lower()
  276. if not K in self._reserved:
  277. raise CookieError("Invalid attribute %r" % (K,))
  278. dict.__setitem__(self, K, V)
  279. def setdefault(self, key, val=None):
  280. key = key.lower()
  281. if key not in self._reserved:
  282. raise CookieError("Invalid attribute %r" % (key,))
  283. return dict.setdefault(self, key, val)
  284. def __eq__(self, morsel):
  285. if not isinstance(morsel, Morsel):
  286. return NotImplemented
  287. return (dict.__eq__(self, morsel) and
  288. self._value == morsel._value and
  289. self._key == morsel._key and
  290. self._coded_value == morsel._coded_value)
  291. __ne__ = object.__ne__
  292. def copy(self):
  293. morsel = Morsel()
  294. dict.update(morsel, self)
  295. morsel.__dict__.update(self.__dict__)
  296. return morsel
  297. def update(self, values):
  298. data = {}
  299. for key, val in dict(values).items():
  300. key = key.lower()
  301. if key not in self._reserved:
  302. raise CookieError("Invalid attribute %r" % (key,))
  303. data[key] = val
  304. dict.update(self, data)
  305. def isReservedKey(self, K):
  306. return K.lower() in self._reserved
  307. def set(self, key, val, coded_val, LegalChars=_LegalChars):
  308. if LegalChars != _LegalChars:
  309. import warnings
  310. warnings.warn(
  311. 'LegalChars parameter is deprecated, ignored and will '
  312. 'be removed in future versions.', DeprecationWarning,
  313. stacklevel=2)
  314. if key.lower() in self._reserved:
  315. raise CookieError('Attempt to set a reserved key %r' % (key,))
  316. if not _is_legal_key(key):
  317. raise CookieError('Illegal key %r' % (key,))
  318. # It's a good key, so save it.
  319. self._key = key
  320. self._value = val
  321. self._coded_value = coded_val
  322. def __getstate__(self):
  323. return {
  324. 'key': self._key,
  325. 'value': self._value,
  326. 'coded_value': self._coded_value,
  327. }
  328. def __setstate__(self, state):
  329. self._key = state['key']
  330. self._value = state['value']
  331. self._coded_value = state['coded_value']
  332. def output(self, attrs=None, header="Set-Cookie:"):
  333. return "%s %s" % (header, self.OutputString(attrs))
  334. __str__ = output
  335. def __repr__(self):
  336. return '<%s: %s>' % (self.__class__.__name__, self.OutputString())
  337. def js_output(self, attrs=None):
  338. # Print javascript
  339. return """
  340. <script type="text/javascript">
  341. <!-- begin hiding
  342. document.cookie = \"%s\";
  343. // end hiding -->
  344. </script>
  345. """ % (self.OutputString(attrs).replace('"', r'\"'))
  346. def OutputString(self, attrs=None):
  347. # Build up our result
  348. #
  349. result = []
  350. append = result.append
  351. # First, the key=value pair
  352. append("%s=%s" % (self.key, self.coded_value))
  353. # Now add any defined attributes
  354. if attrs is None:
  355. attrs = self._reserved
  356. items = sorted(self.items())
  357. for key, value in items:
  358. if value == "":
  359. continue
  360. if key not in attrs:
  361. continue
  362. if key == "expires" and isinstance(value, int):
  363. append("%s=%s" % (self._reserved[key], _getdate(value)))
  364. elif key == "max-age" and isinstance(value, int):
  365. append("%s=%d" % (self._reserved[key], value))
  366. elif key in self._flags:
  367. if value:
  368. append(str(self._reserved[key]))
  369. else:
  370. append("%s=%s" % (self._reserved[key], value))
  371. # Return the result
  372. return _semispacejoin(result)
  373. #
  374. # Pattern for finding cookie
  375. #
  376. # This used to be strict parsing based on the RFC2109 and RFC2068
  377. # specifications. I have since discovered that MSIE 3.0x doesn't
  378. # follow the character rules outlined in those specs. As a
  379. # result, the parsing rules here are less strict.
  380. #
  381. _LegalKeyChars = r"\w\d!#%&'~_`><@,:/\$\*\+\-\.\^\|\)\(\?\}\{\="
  382. _LegalValueChars = _LegalKeyChars + '\[\]'
  383. _CookiePattern = re.compile(r"""
  384. (?x) # This is a verbose pattern
  385. \s* # Optional whitespace at start of cookie
  386. (?P<key> # Start of group 'key'
  387. [""" + _LegalKeyChars + r"""]+? # Any word of at least one letter
  388. ) # End of group 'key'
  389. ( # Optional group: there may not be a value.
  390. \s*=\s* # Equal Sign
  391. (?P<val> # Start of group 'val'
  392. "(?:[^\\"]|\\.)*" # Any doublequoted string
  393. | # or
  394. \w{3},\s[\w\d\s-]{9,11}\s[\d:]{8}\sGMT # Special case for "expires" attr
  395. | # or
  396. [""" + _LegalValueChars + r"""]* # Any word or empty string
  397. ) # End of group 'val'
  398. )? # End of optional value group
  399. \s* # Any number of spaces.
  400. (\s+|;|$) # Ending either at space, semicolon, or EOS.
  401. """, re.ASCII) # May be removed if safe.
  402. # At long last, here is the cookie class. Using this class is almost just like
  403. # using a dictionary. See this module's docstring for example usage.
  404. #
  405. class BaseCookie(dict):
  406. """A container class for a set of Morsels."""
  407. def value_decode(self, val):
  408. """real_value, coded_value = value_decode(STRING)
  409. Called prior to setting a cookie's value from the network
  410. representation. The VALUE is the value read from HTTP
  411. header.
  412. Override this function to modify the behavior of cookies.
  413. """
  414. return val, val
  415. def value_encode(self, val):
  416. """real_value, coded_value = value_encode(VALUE)
  417. Called prior to setting a cookie's value from the dictionary
  418. representation. The VALUE is the value being assigned.
  419. Override this function to modify the behavior of cookies.
  420. """
  421. strval = str(val)
  422. return strval, strval
  423. def __init__(self, input=None):
  424. if input:
  425. self.load(input)
  426. def __set(self, key, real_value, coded_value):
  427. """Private method for setting a cookie's value"""
  428. M = self.get(key, Morsel())
  429. M.set(key, real_value, coded_value)
  430. dict.__setitem__(self, key, M)
  431. def __setitem__(self, key, value):
  432. """Dictionary style assignment."""
  433. if isinstance(value, Morsel):
  434. # allow assignment of constructed Morsels (e.g. for pickling)
  435. dict.__setitem__(self, key, value)
  436. else:
  437. rval, cval = self.value_encode(value)
  438. self.__set(key, rval, cval)
  439. def output(self, attrs=None, header="Set-Cookie:", sep="\015\012"):
  440. """Return a string suitable for HTTP."""
  441. result = []
  442. items = sorted(self.items())
  443. for key, value in items:
  444. result.append(value.output(attrs, header))
  445. return sep.join(result)
  446. __str__ = output
  447. def __repr__(self):
  448. l = []
  449. items = sorted(self.items())
  450. for key, value in items:
  451. l.append('%s=%s' % (key, repr(value.value)))
  452. return '<%s: %s>' % (self.__class__.__name__, _spacejoin(l))
  453. def js_output(self, attrs=None):
  454. """Return a string suitable for JavaScript."""
  455. result = []
  456. items = sorted(self.items())
  457. for key, value in items:
  458. result.append(value.js_output(attrs))
  459. return _nulljoin(result)
  460. def load(self, rawdata):
  461. """Load cookies from a string (presumably HTTP_COOKIE) or
  462. from a dictionary. Loading cookies from a dictionary 'd'
  463. is equivalent to calling:
  464. map(Cookie.__setitem__, d.keys(), d.values())
  465. """
  466. if isinstance(rawdata, str):
  467. self.__parse_string(rawdata)
  468. else:
  469. # self.update() wouldn't call our custom __setitem__
  470. for key, value in rawdata.items():
  471. self[key] = value
  472. return
  473. def __parse_string(self, str, patt=_CookiePattern):
  474. i = 0 # Our starting point
  475. n = len(str) # Length of string
  476. parsed_items = [] # Parsed (type, key, value) triples
  477. morsel_seen = False # A key=value pair was previously encountered
  478. TYPE_ATTRIBUTE = 1
  479. TYPE_KEYVALUE = 2
  480. # We first parse the whole cookie string and reject it if it's
  481. # syntactically invalid (this helps avoid some classes of injection
  482. # attacks).
  483. while 0 <= i < n:
  484. # Start looking for a cookie
  485. match = patt.match(str, i)
  486. if not match:
  487. # No more cookies
  488. break
  489. key, value = match.group("key"), match.group("val")
  490. i = match.end(0)
  491. if key[0] == "$":
  492. if not morsel_seen:
  493. # We ignore attributes which pertain to the cookie
  494. # mechanism as a whole, such as "$Version".
  495. # See RFC 2965. (Does anyone care?)
  496. continue
  497. parsed_items.append((TYPE_ATTRIBUTE, key[1:], value))
  498. elif key.lower() in Morsel._reserved:
  499. if not morsel_seen:
  500. # Invalid cookie string
  501. return
  502. if value is None:
  503. if key.lower() in Morsel._flags:
  504. parsed_items.append((TYPE_ATTRIBUTE, key, True))
  505. else:
  506. # Invalid cookie string
  507. return
  508. else:
  509. parsed_items.append((TYPE_ATTRIBUTE, key, _unquote(value)))
  510. elif value is not None:
  511. parsed_items.append((TYPE_KEYVALUE, key, self.value_decode(value)))
  512. morsel_seen = True
  513. else:
  514. # Invalid cookie string
  515. return
  516. # The cookie string is valid, apply it.
  517. M = None # current morsel
  518. for tp, key, value in parsed_items:
  519. if tp == TYPE_ATTRIBUTE:
  520. assert M is not None
  521. M[key] = value
  522. else:
  523. assert tp == TYPE_KEYVALUE
  524. rval, cval = value
  525. self.__set(key, rval, cval)
  526. M = self[key]
  527. class SimpleCookie(BaseCookie):
  528. """
  529. SimpleCookie supports strings as cookie values. When setting
  530. the value using the dictionary assignment notation, SimpleCookie
  531. calls the builtin str() to convert the value to a string. Values
  532. received from HTTP are kept as strings.
  533. """
  534. def value_decode(self, val):
  535. return _unquote(val), val
  536. def value_encode(self, val):
  537. strval = str(val)
  538. return strval, _quote(strval)