summaryrefslogtreecommitdiff
path: root/Windows/dateutil/test/test_parser.py
diff options
context:
space:
mode:
Diffstat (limited to 'Windows/dateutil/test/test_parser.py')
-rw-r--r--Windows/dateutil/test/test_parser.py856
1 files changed, 0 insertions, 856 deletions
diff --git a/Windows/dateutil/test/test_parser.py b/Windows/dateutil/test/test_parser.py
deleted file mode 100644
index dcaa7cc0..00000000
--- a/Windows/dateutil/test/test_parser.py
+++ /dev/null
@@ -1,856 +0,0 @@
-# -*- coding: utf-8 -*-
-from __future__ import unicode_literals
-
-import itertools
-from datetime import datetime, timedelta
-import unittest
-import sys
-
-from dateutil import tz
-from dateutil.tz import tzoffset
-from dateutil.parser import parse, parserinfo
-from dateutil.parser import UnknownTimezoneWarning
-
-from ._common import TZEnvContext
-
-from six import assertRaisesRegex, PY3
-from io import StringIO
-
-import pytest
-
-# Platform info
-IS_WIN = sys.platform.startswith('win')
-
-try:
- datetime.now().strftime('%-d')
- PLATFORM_HAS_DASH_D = True
-except ValueError:
- PLATFORM_HAS_DASH_D = False
-
-# Parser test cases using no keyword arguments. Format: (parsable_text, expected_datetime, assertion_message)
-PARSER_TEST_CASES = [
- ("Thu Sep 25 10:36:28 2003", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
- ("Thu Sep 25 2003", datetime(2003, 9, 25), "date command format strip"),
- ("2003-09-25T10:49:41", datetime(2003, 9, 25, 10, 49, 41), "iso format strip"),
- ("2003-09-25T10:49", datetime(2003, 9, 25, 10, 49), "iso format strip"),
- ("2003-09-25T10", datetime(2003, 9, 25, 10), "iso format strip"),
- ("2003-09-25", datetime(2003, 9, 25), "iso format strip"),
- ("20030925T104941", datetime(2003, 9, 25, 10, 49, 41), "iso stripped format strip"),
- ("20030925T1049", datetime(2003, 9, 25, 10, 49, 0), "iso stripped format strip"),
- ("20030925T10", datetime(2003, 9, 25, 10), "iso stripped format strip"),
- ("20030925", datetime(2003, 9, 25), "iso stripped format strip"),
- ("2003-09-25 10:49:41,502", datetime(2003, 9, 25, 10, 49, 41, 502000), "python logger format"),
- ("199709020908", datetime(1997, 9, 2, 9, 8), "no separator"),
- ("19970902090807", datetime(1997, 9, 2, 9, 8, 7), "no separator"),
- ("2003-09-25", datetime(2003, 9, 25), "date with dash"),
- ("09-25-2003", datetime(2003, 9, 25), "date with dash"),
- ("25-09-2003", datetime(2003, 9, 25), "date with dash"),
- ("10-09-2003", datetime(2003, 10, 9), "date with dash"),
- ("10-09-03", datetime(2003, 10, 9), "date with dash"),
- ("2003.09.25", datetime(2003, 9, 25), "date with dot"),
- ("09.25.2003", datetime(2003, 9, 25), "date with dot"),
- ("25.09.2003", datetime(2003, 9, 25), "date with dot"),
- ("10.09.2003", datetime(2003, 10, 9), "date with dot"),
- ("10.09.03", datetime(2003, 10, 9), "date with dot"),
- ("2003/09/25", datetime(2003, 9, 25), "date with slash"),
- ("09/25/2003", datetime(2003, 9, 25), "date with slash"),
- ("25/09/2003", datetime(2003, 9, 25), "date with slash"),
- ("10/09/2003", datetime(2003, 10, 9), "date with slash"),
- ("10/09/03", datetime(2003, 10, 9), "date with slash"),
- ("2003 09 25", datetime(2003, 9, 25), "date with space"),
- ("09 25 2003", datetime(2003, 9, 25), "date with space"),
- ("25 09 2003", datetime(2003, 9, 25), "date with space"),
- ("10 09 2003", datetime(2003, 10, 9), "date with space"),
- ("10 09 03", datetime(2003, 10, 9), "date with space"),
- ("25 09 03", datetime(2003, 9, 25), "date with space"),
- ("03 25 Sep", datetime(2003, 9, 25), "strangely ordered date"),
- ("25 03 Sep", datetime(2025, 9, 3), "strangely ordered date"),
- (" July 4 , 1976 12:01:02 am ", datetime(1976, 7, 4, 0, 1, 2), "extra space"),
- ("Wed, July 10, '96", datetime(1996, 7, 10, 0, 0), "random format"),
- ("1996.July.10 AD 12:08 PM", datetime(1996, 7, 10, 12, 8), "random format"),
- ("July 4, 1976", datetime(1976, 7, 4), "random format"),
- ("7 4 1976", datetime(1976, 7, 4), "random format"),
- ("4 jul 1976", datetime(1976, 7, 4), "random format"),
- ("7-4-76", datetime(1976, 7, 4), "random format"),
- ("19760704", datetime(1976, 7, 4), "random format"),
- ("0:01:02 on July 4, 1976", datetime(1976, 7, 4, 0, 1, 2), "random format"),
- ("0:01:02 on July 4, 1976", datetime(1976, 7, 4, 0, 1, 2), "random format"),
- ("July 4, 1976 12:01:02 am", datetime(1976, 7, 4, 0, 1, 2), "random format"),
- ("Mon Jan 2 04:24:27 1995", datetime(1995, 1, 2, 4, 24, 27), "random format"),
- ("04.04.95 00:22", datetime(1995, 4, 4, 0, 22), "random format"),
- ("Jan 1 1999 11:23:34.578", datetime(1999, 1, 1, 11, 23, 34, 578000), "random format"),
- ("950404 122212", datetime(1995, 4, 4, 12, 22, 12), "random format"),
- ("3rd of May 2001", datetime(2001, 5, 3), "random format"),
- ("5th of March 2001", datetime(2001, 3, 5), "random format"),
- ("1st of May 2003", datetime(2003, 5, 1), "random format"),
- ('0099-01-01T00:00:00', datetime(99, 1, 1, 0, 0), "99 ad"),
- ('0031-01-01T00:00:00', datetime(31, 1, 1, 0, 0), "31 ad"),
- ("20080227T21:26:01.123456789", datetime(2008, 2, 27, 21, 26, 1, 123456), "high precision seconds"),
- ('13NOV2017', datetime(2017, 11, 13), "dBY (See GH360)"),
- ('0003-03-04', datetime(3, 3, 4), "pre 12 year same month (See GH PR #293)"),
- ('December.0031.30', datetime(31, 12, 30), "BYd corner case (GH#687)")
-]
-
-
-@pytest.mark.parametrize("parsable_text,expected_datetime,assertion_message", PARSER_TEST_CASES)
-def test_parser(parsable_text, expected_datetime, assertion_message):
- assert parse(parsable_text) == expected_datetime, assertion_message
-
-
-# Parser test cases using datetime(2003, 9, 25) as a default.
-# Format: (parsable_text, expected_datetime, assertion_message)
-PARSER_DEFAULT_TEST_CASES = [
- ("Thu Sep 25 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
- ("Thu Sep 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
- ("Thu 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
- ("Sep 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
- ("10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
- ("10:36", datetime(2003, 9, 25, 10, 36), "date command format strip"),
- ("Sep 2003", datetime(2003, 9, 25), "date command format strip"),
- ("Sep", datetime(2003, 9, 25), "date command format strip"),
- ("2003", datetime(2003, 9, 25), "date command format strip"),
- ("10h36m28.5s", datetime(2003, 9, 25, 10, 36, 28, 500000), "hour with letters"),
- ("10h36m28s", datetime(2003, 9, 25, 10, 36, 28), "hour with letters strip"),
- ("10h36m", datetime(2003, 9, 25, 10, 36), "hour with letters strip"),
- ("10h", datetime(2003, 9, 25, 10), "hour with letters strip"),
- ("10 h 36", datetime(2003, 9, 25, 10, 36), "hour with letters strip"),
- ("10 h 36.5", datetime(2003, 9, 25, 10, 36, 30), "hour with letter strip"),
- ("36 m 5", datetime(2003, 9, 25, 0, 36, 5), "hour with letters spaces"),
- ("36 m 5 s", datetime(2003, 9, 25, 0, 36, 5), "minute with letters spaces"),
- ("36 m 05", datetime(2003, 9, 25, 0, 36, 5), "minute with letters spaces"),
- ("36 m 05 s", datetime(2003, 9, 25, 0, 36, 5), "minutes with letters spaces"),
- ("10h am", datetime(2003, 9, 25, 10), "hour am pm"),
- ("10h pm", datetime(2003, 9, 25, 22), "hour am pm"),
- ("10am", datetime(2003, 9, 25, 10), "hour am pm"),
- ("10pm", datetime(2003, 9, 25, 22), "hour am pm"),
- ("10:00 am", datetime(2003, 9, 25, 10), "hour am pm"),
- ("10:00 pm", datetime(2003, 9, 25, 22), "hour am pm"),
- ("10:00am", datetime(2003, 9, 25, 10), "hour am pm"),
- ("10:00pm", datetime(2003, 9, 25, 22), "hour am pm"),
- ("10:00a.m", datetime(2003, 9, 25, 10), "hour am pm"),
- ("10:00p.m", datetime(2003, 9, 25, 22), "hour am pm"),
- ("10:00a.m.", datetime(2003, 9, 25, 10), "hour am pm"),
- ("10:00p.m.", datetime(2003, 9, 25, 22), "hour am pm"),
- ("Wed", datetime(2003, 10, 1), "weekday alone"),
- ("Wednesday", datetime(2003, 10, 1), "long weekday"),
- ("October", datetime(2003, 10, 25), "long month"),
- ("31-Dec-00", datetime(2000, 12, 31), "zero year"),
- ("0:01:02", datetime(2003, 9, 25, 0, 1, 2), "random format"),
- ("12h 01m02s am", datetime(2003, 9, 25, 0, 1, 2), "random format"),
- ("12:08 PM", datetime(2003, 9, 25, 12, 8), "random format"),
- ("01h02m03", datetime(2003, 9, 25, 1, 2, 3), "random format"),
- ("01h02", datetime(2003, 9, 25, 1, 2), "random format"),
- ("01h02s", datetime(2003, 9, 25, 1, 0, 2), "random format"),
- ("01m02", datetime(2003, 9, 25, 0, 1, 2), "random format"),
- ("01m02h", datetime(2003, 9, 25, 2, 1), "random format"),
- ("2004 10 Apr 11h30m", datetime(2004, 4, 10, 11, 30), "random format")
-]
-
-
-@pytest.mark.parametrize("parsable_text,expected_datetime,assertion_message", PARSER_DEFAULT_TEST_CASES)
-def test_parser_default(parsable_text, expected_datetime, assertion_message):
- assert parse(parsable_text, default=datetime(2003, 9, 25)) == expected_datetime, assertion_message
-
-
-class TestFormat(unittest.TestCase):
-
- def test_ybd(self):
- # If we have a 4-digit year, a non-numeric month (abbreviated or not),
- # and a day (1 or 2 digits), then there is no ambiguity as to which
- # token is a year/month/day. This holds regardless of what order the
- # terms are in and for each of the separators below.
-
- seps = ['-', ' ', '/', '.']
-
- year_tokens = ['%Y']
- month_tokens = ['%b', '%B']
- day_tokens = ['%d']
- if PLATFORM_HAS_DASH_D:
- day_tokens.append('%-d')
-
- prods = itertools.product(year_tokens, month_tokens, day_tokens)
- perms = [y for x in prods for y in itertools.permutations(x)]
- unambig_fmts = [sep.join(perm) for sep in seps for perm in perms]
-
- actual = datetime(2003, 9, 25)
-
- for fmt in unambig_fmts:
- dstr = actual.strftime(fmt)
- res = parse(dstr)
- self.assertEqual(res, actual)
-
-
-class TestInputFormats(object):
- def test_empty_string_invalid(self):
- with pytest.raises(ValueError):
- parse('')
-
- def test_none_invalid(self):
- with pytest.raises(TypeError):
- parse(None)
-
- def test_int_invalid(self):
- with pytest.raises(TypeError):
- parse(13)
-
- def test_duck_typing(self):
- # We want to support arbitrary classes that implement the stream
- # interface.
-
- class StringPassThrough(object):
- def __init__(self, stream):
- self.stream = stream
-
- def read(self, *args, **kwargs):
- return self.stream.read(*args, **kwargs)
-
- dstr = StringPassThrough(StringIO('2014 January 19'))
-
- res = parse(dstr)
- expected = datetime(2014, 1, 19)
- assert res == expected
-
- def test_parse_stream(self):
- dstr = StringIO('2014 January 19')
-
- res = parse(dstr)
- expected = datetime(2014, 1, 19)
- assert res == expected
-
- def test_parse_str(self):
- # Parser should be able to handle bytestring and unicode
- uni_str = '2014-05-01 08:00:00'
- bytes_str = uni_str.encode()
-
- res = parse(bytes_str)
- expected = parse(uni_str)
- assert res == expected
-
- def test_parse_bytes(self):
- res = parse(b'2014 January 19')
- expected = datetime(2014, 1, 19)
- assert res == expected
-
- def test_parse_bytearray(self):
- # GH#417
- res = parse(bytearray(b'2014 January 19'))
- expected = datetime(2014, 1, 19)
- assert res == expected
-
-
-class ParserTest(unittest.TestCase):
-
- def setUp(self):
- self.tzinfos = {"BRST": -10800}
- self.brsttz = tzoffset("BRST", -10800)
- self.default = datetime(2003, 9, 25)
-
- # Parser should be able to handle bytestring and unicode
- self.uni_str = '2014-05-01 08:00:00'
- self.str_str = self.uni_str.encode()
-
- def testParserParseStr(self):
- from dateutil.parser import parser
-
- self.assertEqual(parser().parse(self.str_str),
- parser().parse(self.uni_str))
-
- def testParseUnicodeWords(self):
-
- class rus_parserinfo(parserinfo):
- MONTHS = [("янв", "Январь"),
- ("фев", "Февраль"),
- ("мар", "Март"),
- ("апр", "Апрель"),
- ("май", "Май"),
- ("июн", "Июнь"),
- ("июл", "Июль"),
- ("авг", "Август"),
- ("сен", "Сентябрь"),
- ("окт", "Октябрь"),
- ("ноя", "Ноябрь"),
- ("дек", "Декабрь")]
-
- self.assertEqual(parse('10 Сентябрь 2015 10:20',
- parserinfo=rus_parserinfo()),
- datetime(2015, 9, 10, 10, 20))
-
- def testParseWithNulls(self):
- # This relies on the from __future__ import unicode_literals, because
- # explicitly specifying a unicode literal is a syntax error in Py 3.2
- # May want to switch to u'...' if we ever drop Python 3.2 support.
- pstring = '\x00\x00August 29, 1924'
-
- self.assertEqual(parse(pstring),
- datetime(1924, 8, 29))
-
- def testDateCommandFormat(self):
- self.assertEqual(parse("Thu Sep 25 10:36:28 BRST 2003",
- tzinfos=self.tzinfos),
- datetime(2003, 9, 25, 10, 36, 28,
- tzinfo=self.brsttz))
-
- def testDateCommandFormatUnicode(self):
- self.assertEqual(parse("Thu Sep 25 10:36:28 BRST 2003",
- tzinfos=self.tzinfos),
- datetime(2003, 9, 25, 10, 36, 28,
- tzinfo=self.brsttz))
-
- def testDateCommandFormatReversed(self):
- self.assertEqual(parse("2003 10:36:28 BRST 25 Sep Thu",
- tzinfos=self.tzinfos),
- datetime(2003, 9, 25, 10, 36, 28,
- tzinfo=self.brsttz))
-
- def testDateCommandFormatWithLong(self):
- if not PY3:
- self.assertEqual(parse("Thu Sep 25 10:36:28 BRST 2003",
- tzinfos={"BRST": long(-10800)}),
- datetime(2003, 9, 25, 10, 36, 28,
- tzinfo=self.brsttz))
-
- def testDateCommandFormatIgnoreTz(self):
- self.assertEqual(parse("Thu Sep 25 10:36:28 BRST 2003",
- ignoretz=True),
- datetime(2003, 9, 25, 10, 36, 28))
-
- def testDateRCommandFormat(self):
- self.assertEqual(parse("Thu, 25 Sep 2003 10:49:41 -0300"),
- datetime(2003, 9, 25, 10, 49, 41,
- tzinfo=self.brsttz))
-
- def testISOFormat(self):
- self.assertEqual(parse("2003-09-25T10:49:41.5-03:00"),
- datetime(2003, 9, 25, 10, 49, 41, 500000,
- tzinfo=self.brsttz))
-
- def testISOFormatStrip1(self):
- self.assertEqual(parse("2003-09-25T10:49:41-03:00"),
- datetime(2003, 9, 25, 10, 49, 41,
- tzinfo=self.brsttz))
-
- def testISOFormatStrip2(self):
- self.assertEqual(parse("2003-09-25T10:49:41+03:00"),
- datetime(2003, 9, 25, 10, 49, 41,
- tzinfo=tzoffset(None, 10800)))
-
- def testISOStrippedFormat(self):
- self.assertEqual(parse("20030925T104941.5-0300"),
- datetime(2003, 9, 25, 10, 49, 41, 500000,
- tzinfo=self.brsttz))
-
- def testISOStrippedFormatStrip1(self):
- self.assertEqual(parse("20030925T104941-0300"),
- datetime(2003, 9, 25, 10, 49, 41,
- tzinfo=self.brsttz))
-
- def testISOStrippedFormatStrip2(self):
- self.assertEqual(parse("20030925T104941+0300"),
- datetime(2003, 9, 25, 10, 49, 41,
- tzinfo=tzoffset(None, 10800)))
-
- def testDateWithDash8(self):
- self.assertEqual(parse("10-09-2003", dayfirst=True),
- datetime(2003, 9, 10))
-
- def testDateWithDash11(self):
- self.assertEqual(parse("10-09-03", yearfirst=True),
- datetime(2010, 9, 3))
-
- def testDateWithDot8(self):
- self.assertEqual(parse("10.09.2003", dayfirst=True),
- datetime(2003, 9, 10))
-
- def testDateWithDot11(self):
- self.assertEqual(parse("10.09.03", yearfirst=True),
- datetime(2010, 9, 3))
-
- def testDateWithSlash8(self):
- self.assertEqual(parse("10/09/2003", dayfirst=True),
- datetime(2003, 9, 10))
-
- def testDateWithSlash11(self):
- self.assertEqual(parse("10/09/03", yearfirst=True),
- datetime(2010, 9, 3))
-
- def testDateWithSpace8(self):
- self.assertEqual(parse("10 09 2003", dayfirst=True),
- datetime(2003, 9, 10))
-
- def testDateWithSpace11(self):
- self.assertEqual(parse("10 09 03", yearfirst=True),
- datetime(2010, 9, 3))
-
- def testAMPMNoHour(self):
- with self.assertRaises(ValueError):
- parse("AM")
-
- with self.assertRaises(ValueError):
- parse("Jan 20, 2015 PM")
-
- def testAMPMRange(self):
- with self.assertRaises(ValueError):
- parse("13:44 AM")
-
- with self.assertRaises(ValueError):
- parse("January 25, 1921 23:13 PM")
-
- def testPertain(self):
- self.assertEqual(parse("Sep 03", default=self.default),
- datetime(2003, 9, 3))
- self.assertEqual(parse("Sep of 03", default=self.default),
- datetime(2003, 9, 25))
-
- def testFuzzy(self):
- s = "Today is 25 of September of 2003, exactly " \
- "at 10:49:41 with timezone -03:00."
- self.assertEqual(parse(s, fuzzy=True),
- datetime(2003, 9, 25, 10, 49, 41,
- tzinfo=self.brsttz))
-
- def testFuzzyWithTokens(self):
- s1 = "Today is 25 of September of 2003, exactly " \
- "at 10:49:41 with timezone -03:00."
- self.assertEqual(parse(s1, fuzzy_with_tokens=True),
- (datetime(2003, 9, 25, 10, 49, 41,
- tzinfo=self.brsttz),
- ('Today is ', 'of ', ', exactly at ',
- ' with timezone ', '.')))
-
- s2 = "http://biz.yahoo.com/ipo/p/600221.html"
- self.assertEqual(parse(s2, fuzzy_with_tokens=True),
- (datetime(2060, 2, 21, 0, 0, 0),
- ('http://biz.yahoo.com/ipo/p/', '.html')))
-
- def testFuzzyAMPMProblem(self):
- # Sometimes fuzzy parsing results in AM/PM flag being set without
- # hours - if it's fuzzy it should ignore that.
- s1 = "I have a meeting on March 1, 1974."
- s2 = "On June 8th, 2020, I am going to be the first man on Mars"
-
- # Also don't want any erroneous AM or PMs changing the parsed time
- s3 = "Meet me at the AM/PM on Sunset at 3:00 AM on December 3rd, 2003"
- s4 = "Meet me at 3:00AM on December 3rd, 2003 at the AM/PM on Sunset"
-
- self.assertEqual(parse(s1, fuzzy=True), datetime(1974, 3, 1))
- self.assertEqual(parse(s2, fuzzy=True), datetime(2020, 6, 8))
- self.assertEqual(parse(s3, fuzzy=True), datetime(2003, 12, 3, 3))
- self.assertEqual(parse(s4, fuzzy=True), datetime(2003, 12, 3, 3))
-
- def testFuzzyIgnoreAMPM(self):
- s1 = "Jan 29, 1945 14:45 AM I going to see you there?"
- with pytest.warns(UnknownTimezoneWarning):
- res = parse(s1, fuzzy=True)
- self.assertEqual(res, datetime(1945, 1, 29, 14, 45))
-
- def testRandomFormat2(self):
- self.assertEqual(parse("1996.07.10 AD at 15:08:56 PDT",
- ignoretz=True),
- datetime(1996, 7, 10, 15, 8, 56))
-
- def testRandomFormat4(self):
- self.assertEqual(parse("Tuesday, April 12, 1952 AD 3:30:42pm PST",
- ignoretz=True),
- datetime(1952, 4, 12, 15, 30, 42))
-
- def testRandomFormat5(self):
- self.assertEqual(parse("November 5, 1994, 8:15:30 am EST",
- ignoretz=True),
- datetime(1994, 11, 5, 8, 15, 30))
-
- def testRandomFormat6(self):
- self.assertEqual(parse("1994-11-05T08:15:30-05:00",
- ignoretz=True),
- datetime(1994, 11, 5, 8, 15, 30))
-
- def testRandomFormat7(self):
- self.assertEqual(parse("1994-11-05T08:15:30Z",
- ignoretz=True),
- datetime(1994, 11, 5, 8, 15, 30))
-
- def testRandomFormat17(self):
- self.assertEqual(parse("1976-07-04T00:01:02Z", ignoretz=True),
- datetime(1976, 7, 4, 0, 1, 2))
-
- def testRandomFormat18(self):
- self.assertEqual(parse("1986-07-05T08:15:30z",
- ignoretz=True),
- datetime(1986, 7, 5, 8, 15, 30))
-
- def testRandomFormat20(self):
- self.assertEqual(parse("Tue Apr 4 00:22:12 PDT 1995", ignoretz=True),
- datetime(1995, 4, 4, 0, 22, 12))
-
- def testRandomFormat24(self):
- self.assertEqual(parse("0:00 PM, PST", default=self.default,
- ignoretz=True),
- datetime(2003, 9, 25, 12, 0))
-
- def testRandomFormat26(self):
- with pytest.warns(UnknownTimezoneWarning):
- res = parse("5:50 A.M. on June 13, 1990")
-
- self.assertEqual(res, datetime(1990, 6, 13, 5, 50))
-
- def testInvalidDay(self):
- with self.assertRaises(ValueError):
- parse("Feb 30, 2007")
-
- def testUnspecifiedDayFallback(self):
- # Test that for an unspecified day, the fallback behavior is correct.
- self.assertEqual(parse("April 2009", default=datetime(2010, 1, 31)),
- datetime(2009, 4, 30))
-
- def testUnspecifiedDayFallbackFebNoLeapYear(self):
- self.assertEqual(parse("Feb 2007", default=datetime(2010, 1, 31)),
- datetime(2007, 2, 28))
-
- def testUnspecifiedDayFallbackFebLeapYear(self):
- self.assertEqual(parse("Feb 2008", default=datetime(2010, 1, 31)),
- datetime(2008, 2, 29))
-
- def testTzinfoDictionaryCouldReturnNone(self):
- self.assertEqual(parse('2017-02-03 12:40 BRST', tzinfos={"BRST": None}),
- datetime(2017, 2, 3, 12, 40))
-
- def testTzinfosCallableCouldReturnNone(self):
- self.assertEqual(parse('2017-02-03 12:40 BRST', tzinfos=lambda *args: None),
- datetime(2017, 2, 3, 12, 40))
-
- def testErrorType01(self):
- self.assertRaises(ValueError,
- parse, 'shouldfail')
-
- def testCorrectErrorOnFuzzyWithTokens(self):
- assertRaisesRegex(self, ValueError, 'Unknown string format',
- parse, '04/04/32/423', fuzzy_with_tokens=True)
- assertRaisesRegex(self, ValueError, 'Unknown string format',
- parse, '04/04/04 +32423', fuzzy_with_tokens=True)
- assertRaisesRegex(self, ValueError, 'Unknown string format',
- parse, '04/04/0d4', fuzzy_with_tokens=True)
-
- def testIncreasingCTime(self):
- # This test will check 200 different years, every month, every day,
- # every hour, every minute, every second, and every weekday, using
- # a delta of more or less 1 year, 1 month, 1 day, 1 minute and
- # 1 second.
- delta = timedelta(days=365+31+1, seconds=1+60+60*60)
- dt = datetime(1900, 1, 1, 0, 0, 0, 0)
- for i in range(200):
- self.assertEqual(parse(dt.ctime()), dt)
- dt += delta
-
- def testIncreasingISOFormat(self):
- delta = timedelta(days=365+31+1, seconds=1+60+60*60)
- dt = datetime(1900, 1, 1, 0, 0, 0, 0)
- for i in range(200):
- self.assertEqual(parse(dt.isoformat()), dt)
- dt += delta
-
- def testMicrosecondsPrecisionError(self):
- # Skip found out that sad precision problem. :-(
- dt1 = parse("00:11:25.01")
- dt2 = parse("00:12:10.01")
- self.assertEqual(dt1.microsecond, 10000)
- self.assertEqual(dt2.microsecond, 10000)
-
- def testMicrosecondPrecisionErrorReturns(self):
- # One more precision issue, discovered by Eric Brown. This should
- # be the last one, as we're no longer using floating points.
- for ms in [100001, 100000, 99999, 99998,
- 10001, 10000, 9999, 9998,
- 1001, 1000, 999, 998,
- 101, 100, 99, 98]:
- dt = datetime(2008, 2, 27, 21, 26, 1, ms)
- self.assertEqual(parse(dt.isoformat()), dt)
-
- def testCustomParserInfo(self):
- # Custom parser info wasn't working, as Michael Elsdörfer discovered.
- from dateutil.parser import parserinfo, parser
-
- class myparserinfo(parserinfo):
- MONTHS = parserinfo.MONTHS[:]
- MONTHS[0] = ("Foo", "Foo")
- myparser = parser(myparserinfo())
- dt = myparser.parse("01/Foo/2007")
- self.assertEqual(dt, datetime(2007, 1, 1))
-
- def testCustomParserShortDaynames(self):
- # Horacio Hoyos discovered that day names shorter than 3 characters,
- # for example two letter German day name abbreviations, don't work:
- # https://github.com/dateutil/dateutil/issues/343
- from dateutil.parser import parserinfo, parser
-
- class GermanParserInfo(parserinfo):
- WEEKDAYS = [("Mo", "Montag"),
- ("Di", "Dienstag"),
- ("Mi", "Mittwoch"),
- ("Do", "Donnerstag"),
- ("Fr", "Freitag"),
- ("Sa", "Samstag"),
- ("So", "Sonntag")]
-
- myparser = parser(GermanParserInfo())
- dt = myparser.parse("Sa 21. Jan 2017")
- self.assertEqual(dt, datetime(2017, 1, 21))
-
- def testNoYearFirstNoDayFirst(self):
- dtstr = '090107'
-
- # Should be MMDDYY
- self.assertEqual(parse(dtstr),
- datetime(2007, 9, 1))
-
- self.assertEqual(parse(dtstr, yearfirst=False, dayfirst=False),
- datetime(2007, 9, 1))
-
- def testYearFirst(self):
- dtstr = '090107'
-
- # Should be MMDDYY
- self.assertEqual(parse(dtstr, yearfirst=True),
- datetime(2009, 1, 7))
-
- self.assertEqual(parse(dtstr, yearfirst=True, dayfirst=False),
- datetime(2009, 1, 7))
-
- def testDayFirst(self):
- dtstr = '090107'
-
- # Should be DDMMYY
- self.assertEqual(parse(dtstr, dayfirst=True),
- datetime(2007, 1, 9))
-
- self.assertEqual(parse(dtstr, yearfirst=False, dayfirst=True),
- datetime(2007, 1, 9))
-
- def testDayFirstYearFirst(self):
- dtstr = '090107'
- # Should be YYDDMM
- self.assertEqual(parse(dtstr, yearfirst=True, dayfirst=True),
- datetime(2009, 7, 1))
-
- def testUnambiguousYearFirst(self):
- dtstr = '2015 09 25'
- self.assertEqual(parse(dtstr, yearfirst=True),
- datetime(2015, 9, 25))
-
- def testUnambiguousDayFirst(self):
- dtstr = '2015 09 25'
- self.assertEqual(parse(dtstr, dayfirst=True),
- datetime(2015, 9, 25))
-
- def testUnambiguousDayFirstYearFirst(self):
- dtstr = '2015 09 25'
- self.assertEqual(parse(dtstr, dayfirst=True, yearfirst=True),
- datetime(2015, 9, 25))
-
- def test_mstridx(self):
- # See GH408
- dtstr = '2015-15-May'
- self.assertEqual(parse(dtstr),
- datetime(2015, 5, 15))
-
- def test_idx_check(self):
- dtstr = '2017-07-17 06:15:'
- # Pre-PR, the trailing colon will cause an IndexError at 824-825
- # when checking `i < len_l` and then accessing `l[i+1]`
- res = parse(dtstr, fuzzy=True)
- self.assertEqual(res, datetime(2017, 7, 17, 6, 15))
-
- def test_hmBY(self):
- # See GH#483
- dtstr = '02:17NOV2017'
- res = parse(dtstr, default=self.default)
- self.assertEqual(res, datetime(2017, 11, self.default.day, 2, 17))
-
- def test_validate_hour(self):
- # See GH353
- invalid = "201A-01-01T23:58:39.239769+03:00"
- with self.assertRaises(ValueError):
- parse(invalid)
-
- def test_era_trailing_year(self):
- dstr = 'AD2001'
- res = parse(dstr)
- assert res.year == 2001, res
-
-
-class TestParseUnimplementedCases(object):
- @pytest.mark.xfail
- def test_somewhat_ambiguous_string(self):
- # Ref: github issue #487
- # The parser is choosing the wrong part for hour
- # causing datetime to raise an exception.
- dtstr = '1237 PM BRST Mon Oct 30 2017'
- res = parse(dtstr, tzinfo=self.tzinfos)
- assert res == datetime(2017, 10, 30, 12, 37, tzinfo=self.tzinfos)
-
- @pytest.mark.xfail
- def test_YmdH_M_S(self):
- # found in nasdaq's ftp data
- dstr = '1991041310:19:24'
- expected = datetime(1991, 4, 13, 10, 19, 24)
- res = parse(dstr)
- assert res == expected, (res, expected)
-
- @pytest.mark.xfail
- def test_first_century(self):
- dstr = '0031 Nov 03'
- expected = datetime(31, 11, 3)
- res = parse(dstr)
- assert res == expected, res
-
- @pytest.mark.xfail
- def test_era_trailing_year_with_dots(self):
- dstr = 'A.D.2001'
- res = parse(dstr)
- assert res.year == 2001, res
-
- @pytest.mark.xfail
- def test_ad_nospace(self):
- expected = datetime(6, 5, 19)
- for dstr in [' 6AD May 19', ' 06AD May 19',
- ' 006AD May 19', ' 0006AD May 19']:
- res = parse(dstr)
- assert res == expected, (dstr, res)
-
- @pytest.mark.xfail
- def test_four_letter_day(self):
- dstr = 'Frid Dec 30, 2016'
- expected = datetime(2016, 12, 30)
- res = parse(dstr)
- assert res == expected
-
- @pytest.mark.xfail
- def test_non_date_number(self):
- dstr = '1,700'
- with pytest.raises(ValueError):
- parse(dstr)
-
- @pytest.mark.xfail
- def test_on_era(self):
- # This could be classified as an "eras" test, but the relevant part
- # about this is the ` on `
- dstr = '2:15 PM on January 2nd 1973 A.D.'
- expected = datetime(1973, 1, 2, 14, 15)
- res = parse(dstr)
- assert res == expected
-
- @pytest.mark.xfail
- def test_extraneous_year(self):
- # This was found in the wild at insidertrading.org
- dstr = "2011 MARTIN CHILDREN'S IRREVOCABLE TRUST u/a/d NOVEMBER 7, 2012"
- res = parse(dstr, fuzzy_with_tokens=True)
- expected = datetime(2012, 11, 7)
- assert res == expected
-
- @pytest.mark.xfail
- def test_extraneous_year_tokens(self):
- # This was found in the wild at insidertrading.org
- # Unlike in the case above, identifying the first "2012" as the year
- # would not be a problem, but infering that the latter 2012 is hhmm
- # is a problem.
- dstr = "2012 MARTIN CHILDREN'S IRREVOCABLE TRUST u/a/d NOVEMBER 7, 2012"
- expected = datetime(2012, 11, 7)
- (res, tokens) = parse(dstr, fuzzy_with_tokens=True)
- assert res == expected
- assert tokens == ("2012 MARTIN CHILDREN'S IRREVOCABLE TRUST u/a/d ",)
-
- @pytest.mark.xfail
- def test_extraneous_year2(self):
- # This was found in the wild at insidertrading.org
- dstr = ("Berylson Amy Smith 1998 Grantor Retained Annuity Trust "
- "u/d/t November 2, 1998 f/b/o Jennifer L Berylson")
- res = parse(dstr, fuzzy_with_tokens=True)
- expected = datetime(1998, 11, 2)
- assert res == expected
-
- @pytest.mark.xfail
- def test_extraneous_year3(self):
- # This was found in the wild at insidertrading.org
- dstr = "SMITH R & WEISS D 94 CHILD TR FBO M W SMITH UDT 12/1/1994"
- res = parse(dstr, fuzzy_with_tokens=True)
- expected = datetime(1994, 12, 1)
- assert res == expected
-
- @pytest.mark.xfail
- def test_unambiguous_YYYYMM(self):
- # 171206 can be parsed as YYMMDD. However, 201712 cannot be parsed
- # as instance of YYMMDD and parser could fallback to YYYYMM format.
- dstr = "201712"
- res = parse(dstr)
- expected = datetime(2017, 12, 1)
- assert res == expected
-
-
-@pytest.mark.skipif(IS_WIN, reason='Windows does not use TZ var')
-def test_parse_unambiguous_nonexistent_local():
- # When dates are specified "EST" even when they should be "EDT" in the
- # local time zone, we should still assign the local time zone
- with TZEnvContext('EST+5EDT,M3.2.0/2,M11.1.0/2'):
- dt_exp = datetime(2011, 8, 1, 12, 30, tzinfo=tz.tzlocal())
- dt = parse('2011-08-01T12:30 EST')
-
- assert dt.tzname() == 'EDT'
- assert dt == dt_exp
-
-
-@pytest.mark.skipif(IS_WIN, reason='Windows does not use TZ var')
-def test_tzlocal_in_gmt():
- # GH #318
- with TZEnvContext('GMT0BST,M3.5.0,M10.5.0'):
- # This is an imaginary datetime in tz.tzlocal() but should still
- # parse using the GMT-as-alias-for-UTC rule
- dt = parse('2004-05-01T12:00 GMT')
- dt_exp = datetime(2004, 5, 1, 12, tzinfo=tz.tzutc())
-
- assert dt == dt_exp
-
-
-@pytest.mark.skipif(IS_WIN, reason='Windows does not use TZ var')
-def test_tzlocal_parse_fold():
- # One manifestion of GH #318
- with TZEnvContext('EST+5EDT,M3.2.0/2,M11.1.0/2'):
- dt_exp = datetime(2011, 11, 6, 1, 30, tzinfo=tz.tzlocal())
- dt_exp = tz.enfold(dt_exp, fold=1)
- dt = parse('2011-11-06T01:30 EST')
-
- # Because this is ambiguous, kuntil `tz.tzlocal() is tz.tzlocal()`
- # we'll just check the attributes we care about rather than
- # dt == dt_exp
- assert dt.tzname() == dt_exp.tzname()
- assert dt.replace(tzinfo=None) == dt_exp.replace(tzinfo=None)
- assert getattr(dt, 'fold') == getattr(dt_exp, 'fold')
- assert dt.astimezone(tz.tzutc()) == dt_exp.astimezone(tz.tzutc())
-
-
-def test_parse_tzinfos_fold():
- NYC = tz.gettz('America/New_York')
- tzinfos = {'EST': NYC, 'EDT': NYC}
-
- dt_exp = tz.enfold(datetime(2011, 11, 6, 1, 30, tzinfo=NYC), fold=1)
- dt = parse('2011-11-06T01:30 EST', tzinfos=tzinfos)
-
- assert dt == dt_exp
- assert dt.tzinfo is dt_exp.tzinfo
- assert getattr(dt, 'fold') == getattr(dt_exp, 'fold')
- assert dt.astimezone(tz.tzutc()) == dt_exp.astimezone(tz.tzutc())
-
-
-@pytest.mark.parametrize('dtstr,dt', [
- ('5.6h', datetime(2003, 9, 25, 5, 36)),
- ('5.6m', datetime(2003, 9, 25, 0, 5, 36)),
- # '5.6s' never had a rounding problem, test added for completeness
- ('5.6s', datetime(2003, 9, 25, 0, 0, 5, 600000))
-])
-def test_rounding_floatlike_strings(dtstr, dt):
- assert parse(dtstr, default=datetime(2003, 9, 25)) == dt
-
-
-@pytest.mark.parametrize('value', ['1: test', 'Nan'])
-def test_decimal_error(value):
- # GH 632, GH 662 - decimal.Decimal raises some non-ValueError exception when
- # constructed with an invalid value
- with pytest.raises(ValueError):
- parse(value)