2018-10-31 16:08:29 +00:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
import itertools
|
|
|
|
from datetime import datetime, timedelta
|
|
|
|
import unittest
|
|
|
|
import sys
|
2018-10-31 16:08:29 +00:00
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
from dateutil import tz
|
2018-10-31 16:08:29 +00:00
|
|
|
from dateutil.tz import tzoffset
|
2022-01-24 04:07:52 +00:00
|
|
|
from dateutil.parser import parse, parserinfo
|
|
|
|
from dateutil.parser import ParserError
|
|
|
|
from dateutil.parser import UnknownTimezoneWarning
|
|
|
|
|
|
|
|
from ._common import TZEnvContext
|
|
|
|
|
|
|
|
from six import assertRaisesRegex, PY2
|
|
|
|
from io import StringIO
|
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
|
|
|
# Platform info
|
|
|
|
IS_WIN = sys.platform.startswith('win')
|
|
|
|
|
|
|
|
PLATFORM_HAS_DASH_D = False
|
|
|
|
try:
|
|
|
|
if datetime.now().strftime('%-d'):
|
|
|
|
PLATFORM_HAS_DASH_D = True
|
|
|
|
except ValueError:
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.fixture(params=[True, False])
|
|
|
|
def fuzzy(request):
|
|
|
|
"""Fixture to pass fuzzy=True or fuzzy=False to parse"""
|
|
|
|
return request.param
|
|
|
|
|
|
|
|
|
|
|
|
# Parser test cases using no keyword arguments. Format: (parsable_text, expected_datetime, assertion_message)
|
|
|
|
PARSER_TEST_CASES = [
|
|
|
|
("Thu Sep 25 10:36:28 2003", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
|
|
|
|
("Thu Sep 25 2003", datetime(2003, 9, 25), "date command format strip"),
|
|
|
|
("2003-09-25T10:49:41", datetime(2003, 9, 25, 10, 49, 41), "iso format strip"),
|
|
|
|
("2003-09-25T10:49", datetime(2003, 9, 25, 10, 49), "iso format strip"),
|
|
|
|
("2003-09-25T10", datetime(2003, 9, 25, 10), "iso format strip"),
|
|
|
|
("2003-09-25", datetime(2003, 9, 25), "iso format strip"),
|
|
|
|
("20030925T104941", datetime(2003, 9, 25, 10, 49, 41), "iso stripped format strip"),
|
|
|
|
("20030925T1049", datetime(2003, 9, 25, 10, 49, 0), "iso stripped format strip"),
|
|
|
|
("20030925T10", datetime(2003, 9, 25, 10), "iso stripped format strip"),
|
|
|
|
("20030925", datetime(2003, 9, 25), "iso stripped format strip"),
|
|
|
|
("2003-09-25 10:49:41,502", datetime(2003, 9, 25, 10, 49, 41, 502000), "python logger format"),
|
|
|
|
("199709020908", datetime(1997, 9, 2, 9, 8), "no separator"),
|
|
|
|
("19970902090807", datetime(1997, 9, 2, 9, 8, 7), "no separator"),
|
|
|
|
("09-25-2003", datetime(2003, 9, 25), "date with dash"),
|
|
|
|
("25-09-2003", datetime(2003, 9, 25), "date with dash"),
|
|
|
|
("10-09-2003", datetime(2003, 10, 9), "date with dash"),
|
|
|
|
("10-09-03", datetime(2003, 10, 9), "date with dash"),
|
|
|
|
("2003.09.25", datetime(2003, 9, 25), "date with dot"),
|
|
|
|
("09.25.2003", datetime(2003, 9, 25), "date with dot"),
|
|
|
|
("25.09.2003", datetime(2003, 9, 25), "date with dot"),
|
|
|
|
("10.09.2003", datetime(2003, 10, 9), "date with dot"),
|
|
|
|
("10.09.03", datetime(2003, 10, 9), "date with dot"),
|
|
|
|
("2003/09/25", datetime(2003, 9, 25), "date with slash"),
|
|
|
|
("09/25/2003", datetime(2003, 9, 25), "date with slash"),
|
|
|
|
("25/09/2003", datetime(2003, 9, 25), "date with slash"),
|
|
|
|
("10/09/2003", datetime(2003, 10, 9), "date with slash"),
|
|
|
|
("10/09/03", datetime(2003, 10, 9), "date with slash"),
|
|
|
|
("2003 09 25", datetime(2003, 9, 25), "date with space"),
|
|
|
|
("09 25 2003", datetime(2003, 9, 25), "date with space"),
|
|
|
|
("25 09 2003", datetime(2003, 9, 25), "date with space"),
|
|
|
|
("10 09 2003", datetime(2003, 10, 9), "date with space"),
|
|
|
|
("10 09 03", datetime(2003, 10, 9), "date with space"),
|
|
|
|
("25 09 03", datetime(2003, 9, 25), "date with space"),
|
|
|
|
("03 25 Sep", datetime(2003, 9, 25), "strangely ordered date"),
|
|
|
|
("25 03 Sep", datetime(2025, 9, 3), "strangely ordered date"),
|
|
|
|
(" July 4 , 1976 12:01:02 am ", datetime(1976, 7, 4, 0, 1, 2), "extra space"),
|
|
|
|
("Wed, July 10, '96", datetime(1996, 7, 10, 0, 0), "random format"),
|
|
|
|
("1996.July.10 AD 12:08 PM", datetime(1996, 7, 10, 12, 8), "random format"),
|
|
|
|
("July 4, 1976", datetime(1976, 7, 4), "random format"),
|
|
|
|
("7 4 1976", datetime(1976, 7, 4), "random format"),
|
|
|
|
("4 jul 1976", datetime(1976, 7, 4), "random format"),
|
|
|
|
("4 Jul 1976", datetime(1976, 7, 4), "'%-d %b %Y' format"),
|
|
|
|
("7-4-76", datetime(1976, 7, 4), "random format"),
|
|
|
|
("19760704", datetime(1976, 7, 4), "random format"),
|
|
|
|
("0:01:02 on July 4, 1976", datetime(1976, 7, 4, 0, 1, 2), "random format"),
|
|
|
|
("July 4, 1976 12:01:02 am", datetime(1976, 7, 4, 0, 1, 2), "random format"),
|
|
|
|
("Mon Jan 2 04:24:27 1995", datetime(1995, 1, 2, 4, 24, 27), "random format"),
|
|
|
|
("04.04.95 00:22", datetime(1995, 4, 4, 0, 22), "random format"),
|
|
|
|
("Jan 1 1999 11:23:34.578", datetime(1999, 1, 1, 11, 23, 34, 578000), "random format"),
|
|
|
|
("950404 122212", datetime(1995, 4, 4, 12, 22, 12), "random format"),
|
|
|
|
("3rd of May 2001", datetime(2001, 5, 3), "random format"),
|
|
|
|
("5th of March 2001", datetime(2001, 3, 5), "random format"),
|
|
|
|
("1st of May 2003", datetime(2003, 5, 1), "random format"),
|
|
|
|
('0099-01-01T00:00:00', datetime(99, 1, 1, 0, 0), "99 ad"),
|
|
|
|
('0031-01-01T00:00:00', datetime(31, 1, 1, 0, 0), "31 ad"),
|
|
|
|
("20080227T21:26:01.123456789", datetime(2008, 2, 27, 21, 26, 1, 123456), "high precision seconds"),
|
|
|
|
('13NOV2017', datetime(2017, 11, 13), "dBY (See GH360)"),
|
|
|
|
('0003-03-04', datetime(3, 3, 4), "pre 12 year same month (See GH PR #293)"),
|
|
|
|
('December.0031.30', datetime(31, 12, 30), "BYd corner case (GH#687)"),
|
|
|
|
|
|
|
|
# Cases with legacy h/m/s format, candidates for deprecation (GH#886)
|
|
|
|
("2016-12-21 04.2h", datetime(2016, 12, 21, 4, 12), "Fractional Hours"),
|
|
|
|
]
|
|
|
|
# Check that we don't have any duplicates
|
|
|
|
assert len(set([x[0] for x in PARSER_TEST_CASES])) == len(PARSER_TEST_CASES)
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize("parsable_text,expected_datetime,assertion_message", PARSER_TEST_CASES)
|
|
|
|
def test_parser(parsable_text, expected_datetime, assertion_message):
|
|
|
|
assert parse(parsable_text) == expected_datetime, assertion_message
|
|
|
|
|
|
|
|
|
|
|
|
# Parser test cases using datetime(2003, 9, 25) as a default.
|
|
|
|
# Format: (parsable_text, expected_datetime, assertion_message)
|
|
|
|
PARSER_DEFAULT_TEST_CASES = [
|
|
|
|
("Thu Sep 25 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
|
|
|
|
("Thu Sep 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
|
|
|
|
("Thu 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
|
|
|
|
("Sep 10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
|
|
|
|
("10:36:28", datetime(2003, 9, 25, 10, 36, 28), "date command format strip"),
|
|
|
|
("10:36", datetime(2003, 9, 25, 10, 36), "date command format strip"),
|
|
|
|
("Sep 2003", datetime(2003, 9, 25), "date command format strip"),
|
|
|
|
("Sep", datetime(2003, 9, 25), "date command format strip"),
|
|
|
|
("2003", datetime(2003, 9, 25), "date command format strip"),
|
|
|
|
("10h36m28.5s", datetime(2003, 9, 25, 10, 36, 28, 500000), "hour with letters"),
|
|
|
|
("10h36m28s", datetime(2003, 9, 25, 10, 36, 28), "hour with letters strip"),
|
|
|
|
("10h36m", datetime(2003, 9, 25, 10, 36), "hour with letters strip"),
|
|
|
|
("10h", datetime(2003, 9, 25, 10), "hour with letters strip"),
|
|
|
|
("10 h 36", datetime(2003, 9, 25, 10, 36), "hour with letters strip"),
|
|
|
|
("10 h 36.5", datetime(2003, 9, 25, 10, 36, 30), "hour with letter strip"),
|
|
|
|
("36 m 5", datetime(2003, 9, 25, 0, 36, 5), "hour with letters spaces"),
|
|
|
|
("36 m 5 s", datetime(2003, 9, 25, 0, 36, 5), "minute with letters spaces"),
|
|
|
|
("36 m 05", datetime(2003, 9, 25, 0, 36, 5), "minute with letters spaces"),
|
|
|
|
("36 m 05 s", datetime(2003, 9, 25, 0, 36, 5), "minutes with letters spaces"),
|
|
|
|
("10h am", datetime(2003, 9, 25, 10), "hour am pm"),
|
|
|
|
("10h pm", datetime(2003, 9, 25, 22), "hour am pm"),
|
|
|
|
("10am", datetime(2003, 9, 25, 10), "hour am pm"),
|
|
|
|
("10pm", datetime(2003, 9, 25, 22), "hour am pm"),
|
|
|
|
("10:00 am", datetime(2003, 9, 25, 10), "hour am pm"),
|
|
|
|
("10:00 pm", datetime(2003, 9, 25, 22), "hour am pm"),
|
|
|
|
("10:00am", datetime(2003, 9, 25, 10), "hour am pm"),
|
|
|
|
("10:00pm", datetime(2003, 9, 25, 22), "hour am pm"),
|
|
|
|
("10:00a.m", datetime(2003, 9, 25, 10), "hour am pm"),
|
|
|
|
("10:00p.m", datetime(2003, 9, 25, 22), "hour am pm"),
|
|
|
|
("10:00a.m.", datetime(2003, 9, 25, 10), "hour am pm"),
|
|
|
|
("10:00p.m.", datetime(2003, 9, 25, 22), "hour am pm"),
|
|
|
|
("Wed", datetime(2003, 10, 1), "weekday alone"),
|
|
|
|
("Wednesday", datetime(2003, 10, 1), "long weekday"),
|
|
|
|
("October", datetime(2003, 10, 25), "long month"),
|
|
|
|
("31-Dec-00", datetime(2000, 12, 31), "zero year"),
|
|
|
|
("0:01:02", datetime(2003, 9, 25, 0, 1, 2), "random format"),
|
|
|
|
("12h 01m02s am", datetime(2003, 9, 25, 0, 1, 2), "random format"),
|
|
|
|
("12:08 PM", datetime(2003, 9, 25, 12, 8), "random format"),
|
|
|
|
("01h02m03", datetime(2003, 9, 25, 1, 2, 3), "random format"),
|
|
|
|
("01h02", datetime(2003, 9, 25, 1, 2), "random format"),
|
|
|
|
("01h02s", datetime(2003, 9, 25, 1, 0, 2), "random format"),
|
|
|
|
("01m02", datetime(2003, 9, 25, 0, 1, 2), "random format"),
|
|
|
|
("01m02h", datetime(2003, 9, 25, 2, 1), "random format"),
|
|
|
|
("2004 10 Apr 11h30m", datetime(2004, 4, 10, 11, 30), "random format")
|
|
|
|
]
|
|
|
|
# Check that we don't have any duplicates
|
|
|
|
assert len(set([x[0] for x in PARSER_DEFAULT_TEST_CASES])) == len(PARSER_DEFAULT_TEST_CASES)
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize("parsable_text,expected_datetime,assertion_message", PARSER_DEFAULT_TEST_CASES)
|
|
|
|
def test_parser_default(parsable_text, expected_datetime, assertion_message):
|
|
|
|
assert parse(parsable_text, default=datetime(2003, 9, 25)) == expected_datetime, assertion_message
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize('sep', ['-', '.', '/', ' '])
|
|
|
|
def test_parse_dayfirst(sep):
|
|
|
|
expected = datetime(2003, 9, 10)
|
|
|
|
fmt = sep.join(['%d', '%m', '%Y'])
|
|
|
|
dstr = expected.strftime(fmt)
|
|
|
|
result = parse(dstr, dayfirst=True)
|
|
|
|
assert result == expected
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize('sep', ['-', '.', '/', ' '])
|
|
|
|
def test_parse_yearfirst(sep):
|
|
|
|
expected = datetime(2010, 9, 3)
|
|
|
|
fmt = sep.join(['%Y', '%m', '%d'])
|
|
|
|
dstr = expected.strftime(fmt)
|
|
|
|
result = parse(dstr, yearfirst=True)
|
|
|
|
assert result == expected
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize('dstr,expected', [
|
|
|
|
("Thu Sep 25 10:36:28 BRST 2003", datetime(2003, 9, 25, 10, 36, 28)),
|
|
|
|
("1996.07.10 AD at 15:08:56 PDT", datetime(1996, 7, 10, 15, 8, 56)),
|
|
|
|
("Tuesday, April 12, 1952 AD 3:30:42pm PST",
|
|
|
|
datetime(1952, 4, 12, 15, 30, 42)),
|
|
|
|
("November 5, 1994, 8:15:30 am EST", datetime(1994, 11, 5, 8, 15, 30)),
|
|
|
|
("1994-11-05T08:15:30-05:00", datetime(1994, 11, 5, 8, 15, 30)),
|
|
|
|
("1994-11-05T08:15:30Z", datetime(1994, 11, 5, 8, 15, 30)),
|
|
|
|
("1976-07-04T00:01:02Z", datetime(1976, 7, 4, 0, 1, 2)),
|
|
|
|
("1986-07-05T08:15:30z", datetime(1986, 7, 5, 8, 15, 30)),
|
|
|
|
("Tue Apr 4 00:22:12 PDT 1995", datetime(1995, 4, 4, 0, 22, 12)),
|
|
|
|
])
|
|
|
|
def test_parse_ignoretz(dstr, expected):
|
|
|
|
result = parse(dstr, ignoretz=True)
|
|
|
|
assert result == expected
|
|
|
|
|
|
|
|
|
|
|
|
_brsttz = tzoffset("BRST", -10800)
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize('dstr,expected', [
|
|
|
|
("20030925T104941-0300",
|
|
|
|
datetime(2003, 9, 25, 10, 49, 41, tzinfo=_brsttz)),
|
|
|
|
("Thu, 25 Sep 2003 10:49:41 -0300",
|
|
|
|
datetime(2003, 9, 25, 10, 49, 41, tzinfo=_brsttz)),
|
|
|
|
("2003-09-25T10:49:41.5-03:00",
|
|
|
|
datetime(2003, 9, 25, 10, 49, 41, 500000, tzinfo=_brsttz)),
|
|
|
|
("2003-09-25T10:49:41-03:00",
|
|
|
|
datetime(2003, 9, 25, 10, 49, 41, tzinfo=_brsttz)),
|
|
|
|
("20030925T104941.5-0300",
|
|
|
|
datetime(2003, 9, 25, 10, 49, 41, 500000, tzinfo=_brsttz)),
|
|
|
|
])
|
|
|
|
def test_parse_with_tzoffset(dstr, expected):
|
|
|
|
# In these cases, we are _not_ passing a tzinfos arg
|
|
|
|
result = parse(dstr)
|
|
|
|
assert result == expected
|
|
|
|
|
|
|
|
|
|
|
|
class TestFormat(object):
|
|
|
|
|
|
|
|
def test_ybd(self):
|
|
|
|
# If we have a 4-digit year, a non-numeric month (abbreviated or not),
|
|
|
|
# and a day (1 or 2 digits), then there is no ambiguity as to which
|
|
|
|
# token is a year/month/day. This holds regardless of what order the
|
|
|
|
# terms are in and for each of the separators below.
|
|
|
|
|
|
|
|
seps = ['-', ' ', '/', '.']
|
|
|
|
|
|
|
|
year_tokens = ['%Y']
|
|
|
|
month_tokens = ['%b', '%B']
|
|
|
|
day_tokens = ['%d']
|
|
|
|
if PLATFORM_HAS_DASH_D:
|
|
|
|
day_tokens.append('%-d')
|
|
|
|
|
|
|
|
prods = itertools.product(year_tokens, month_tokens, day_tokens)
|
|
|
|
perms = [y for x in prods for y in itertools.permutations(x)]
|
|
|
|
unambig_fmts = [sep.join(perm) for sep in seps for perm in perms]
|
|
|
|
|
|
|
|
actual = datetime(2003, 9, 25)
|
|
|
|
|
|
|
|
for fmt in unambig_fmts:
|
|
|
|
dstr = actual.strftime(fmt)
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res == actual
|
|
|
|
|
|
|
|
# TODO: some redundancy with PARSER_TEST_CASES cases
|
|
|
|
@pytest.mark.parametrize("fmt,dstr", [
|
|
|
|
("%a %b %d %Y", "Thu Sep 25 2003"),
|
|
|
|
("%b %d %Y", "Sep 25 2003"),
|
|
|
|
("%Y-%m-%d", "2003-09-25"),
|
|
|
|
("%Y%m%d", "20030925"),
|
|
|
|
("%Y-%b-%d", "2003-Sep-25"),
|
|
|
|
("%d-%b-%Y", "25-Sep-2003"),
|
|
|
|
("%b-%d-%Y", "Sep-25-2003"),
|
|
|
|
("%m-%d-%Y", "09-25-2003"),
|
|
|
|
("%d-%m-%Y", "25-09-2003"),
|
|
|
|
("%Y.%m.%d", "2003.09.25"),
|
|
|
|
("%Y.%b.%d", "2003.Sep.25"),
|
|
|
|
("%d.%b.%Y", "25.Sep.2003"),
|
|
|
|
("%b.%d.%Y", "Sep.25.2003"),
|
|
|
|
("%m.%d.%Y", "09.25.2003"),
|
|
|
|
("%d.%m.%Y", "25.09.2003"),
|
|
|
|
("%Y/%m/%d", "2003/09/25"),
|
|
|
|
("%Y/%b/%d", "2003/Sep/25"),
|
|
|
|
("%d/%b/%Y", "25/Sep/2003"),
|
|
|
|
("%b/%d/%Y", "Sep/25/2003"),
|
|
|
|
("%m/%d/%Y", "09/25/2003"),
|
|
|
|
("%d/%m/%Y", "25/09/2003"),
|
|
|
|
("%Y %m %d", "2003 09 25"),
|
|
|
|
("%Y %b %d", "2003 Sep 25"),
|
|
|
|
("%d %b %Y", "25 Sep 2003"),
|
|
|
|
("%m %d %Y", "09 25 2003"),
|
|
|
|
("%d %m %Y", "25 09 2003"),
|
|
|
|
("%y %d %b", "03 25 Sep",),
|
|
|
|
])
|
|
|
|
def test_strftime_formats_2003Sep25(self, fmt, dstr):
|
|
|
|
expected = datetime(2003, 9, 25)
|
|
|
|
|
|
|
|
# First check that the format strings behave as expected
|
|
|
|
# (not strictly necessary, but nice to have)
|
|
|
|
assert expected.strftime(fmt) == dstr
|
|
|
|
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
|
|
|
|
class TestInputTypes(object):
|
|
|
|
def test_empty_string_invalid(self):
|
|
|
|
with pytest.raises(ParserError):
|
2018-10-31 16:08:29 +00:00
|
|
|
parse('')
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
def test_none_invalid(self):
|
|
|
|
with pytest.raises(TypeError):
|
2018-10-31 16:08:29 +00:00
|
|
|
parse(None)
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
def test_int_invalid(self):
|
|
|
|
with pytest.raises(TypeError):
|
2018-10-31 16:08:29 +00:00
|
|
|
parse(13)
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
def test_duck_typing(self):
|
2018-10-31 16:08:29 +00:00
|
|
|
# We want to support arbitrary classes that implement the stream
|
|
|
|
# interface.
|
|
|
|
|
|
|
|
class StringPassThrough(object):
|
|
|
|
def __init__(self, stream):
|
|
|
|
self.stream = stream
|
|
|
|
|
|
|
|
def read(self, *args, **kwargs):
|
|
|
|
return self.stream.read(*args, **kwargs)
|
|
|
|
|
|
|
|
dstr = StringPassThrough(StringIO('2014 January 19'))
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
res = parse(dstr)
|
|
|
|
expected = datetime(2014, 1, 19)
|
|
|
|
assert res == expected
|
2018-10-31 16:08:29 +00:00
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
def test_parse_stream(self):
|
2018-10-31 16:08:29 +00:00
|
|
|
dstr = StringIO('2014 January 19')
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
res = parse(dstr)
|
|
|
|
expected = datetime(2014, 1, 19)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
def test_parse_str(self):
|
|
|
|
# Parser should be able to handle bytestring and unicode
|
|
|
|
uni_str = '2014-05-01 08:00:00'
|
|
|
|
bytes_str = uni_str.encode()
|
|
|
|
|
|
|
|
res = parse(bytes_str)
|
|
|
|
expected = parse(uni_str)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
def test_parse_bytes(self):
|
|
|
|
res = parse(b'2014 January 19')
|
|
|
|
expected = datetime(2014, 1, 19)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
def test_parse_bytearray(self):
|
|
|
|
# GH#417
|
|
|
|
res = parse(bytearray(b'2014 January 19'))
|
|
|
|
expected = datetime(2014, 1, 19)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
|
|
|
|
class TestTzinfoInputTypes(object):
|
|
|
|
def assert_equal_same_tz(self, dt1, dt2):
|
|
|
|
assert dt1 == dt2
|
|
|
|
assert dt1.tzinfo is dt2.tzinfo
|
|
|
|
|
|
|
|
def test_tzinfo_dict_could_return_none(self):
|
|
|
|
dstr = "2017-02-03 12:40 BRST"
|
|
|
|
result = parse(dstr, tzinfos={"BRST": None})
|
|
|
|
expected = datetime(2017, 2, 3, 12, 40)
|
|
|
|
self.assert_equal_same_tz(result, expected)
|
|
|
|
|
|
|
|
def test_tzinfos_callable_could_return_none(self):
|
|
|
|
dstr = "2017-02-03 12:40 BRST"
|
|
|
|
result = parse(dstr, tzinfos=lambda *args: None)
|
|
|
|
expected = datetime(2017, 2, 3, 12, 40)
|
|
|
|
self.assert_equal_same_tz(result, expected)
|
|
|
|
|
|
|
|
def test_invalid_tzinfo_input(self):
|
|
|
|
dstr = "2014 January 19 09:00 UTC"
|
|
|
|
# Pass an absurd tzinfos object
|
|
|
|
tzinfos = {"UTC": ValueError}
|
|
|
|
with pytest.raises(TypeError):
|
|
|
|
parse(dstr, tzinfos=tzinfos)
|
|
|
|
|
|
|
|
def test_valid_tzinfo_tzinfo_input(self):
|
|
|
|
dstr = "2014 January 19 09:00 UTC"
|
|
|
|
tzinfos = {"UTC": tz.UTC}
|
|
|
|
expected = datetime(2014, 1, 19, 9, tzinfo=tz.UTC)
|
|
|
|
res = parse(dstr, tzinfos=tzinfos)
|
|
|
|
self.assert_equal_same_tz(res, expected)
|
|
|
|
|
|
|
|
def test_valid_tzinfo_unicode_input(self):
|
|
|
|
dstr = "2014 January 19 09:00 UTC"
|
|
|
|
tzinfos = {u"UTC": u"UTC+0"}
|
|
|
|
expected = datetime(2014, 1, 19, 9, tzinfo=tz.tzstr("UTC+0"))
|
|
|
|
res = parse(dstr, tzinfos=tzinfos)
|
|
|
|
self.assert_equal_same_tz(res, expected)
|
|
|
|
|
|
|
|
def test_valid_tzinfo_callable_input(self):
|
|
|
|
dstr = "2014 January 19 09:00 UTC"
|
|
|
|
|
|
|
|
def tzinfos(*args, **kwargs):
|
|
|
|
return u"UTC+0"
|
|
|
|
|
|
|
|
expected = datetime(2014, 1, 19, 9, tzinfo=tz.tzstr("UTC+0"))
|
|
|
|
res = parse(dstr, tzinfos=tzinfos)
|
|
|
|
self.assert_equal_same_tz(res, expected)
|
|
|
|
|
|
|
|
def test_valid_tzinfo_int_input(self):
|
|
|
|
dstr = "2014 January 19 09:00 UTC"
|
|
|
|
tzinfos = {u"UTC": -28800}
|
|
|
|
expected = datetime(2014, 1, 19, 9, tzinfo=tz.tzoffset(u"UTC", -28800))
|
|
|
|
res = parse(dstr, tzinfos=tzinfos)
|
|
|
|
self.assert_equal_same_tz(res, expected)
|
|
|
|
|
|
|
|
|
|
|
|
class ParserTest(unittest.TestCase):
|
|
|
|
|
|
|
|
@classmethod
|
|
|
|
def setup_class(cls):
|
|
|
|
cls.tzinfos = {"BRST": -10800}
|
|
|
|
cls.brsttz = tzoffset("BRST", -10800)
|
|
|
|
cls.default = datetime(2003, 9, 25)
|
2018-10-31 16:08:29 +00:00
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
# Parser should be able to handle bytestring and unicode
|
|
|
|
cls.uni_str = '2014-05-01 08:00:00'
|
|
|
|
cls.str_str = cls.uni_str.encode()
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testParserParseStr(self):
|
|
|
|
from dateutil.parser import parser
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
assert parser().parse(self.str_str) == parser().parse(self.uni_str)
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testParseUnicodeWords(self):
|
|
|
|
|
|
|
|
class rus_parserinfo(parserinfo):
|
|
|
|
MONTHS = [("янв", "Январь"),
|
|
|
|
("фев", "Февраль"),
|
|
|
|
("мар", "Март"),
|
|
|
|
("апр", "Апрель"),
|
|
|
|
("май", "Май"),
|
|
|
|
("июн", "Июнь"),
|
|
|
|
("июл", "Июль"),
|
|
|
|
("авг", "Август"),
|
|
|
|
("сен", "Сентябрь"),
|
|
|
|
("окт", "Октябрь"),
|
|
|
|
("ноя", "Ноябрь"),
|
|
|
|
("дек", "Декабрь")]
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
expected = datetime(2015, 9, 10, 10, 20)
|
|
|
|
res = parse('10 Сентябрь 2015 10:20', parserinfo=rus_parserinfo())
|
|
|
|
assert res == expected
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testParseWithNulls(self):
|
|
|
|
# This relies on the from __future__ import unicode_literals, because
|
|
|
|
# explicitly specifying a unicode literal is a syntax error in Py 3.2
|
|
|
|
# May want to switch to u'...' if we ever drop Python 3.2 support.
|
|
|
|
pstring = '\x00\x00August 29, 1924'
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
assert parse(pstring) == datetime(1924, 8, 29)
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testDateCommandFormat(self):
|
|
|
|
self.assertEqual(parse("Thu Sep 25 10:36:28 BRST 2003",
|
|
|
|
tzinfos=self.tzinfos),
|
|
|
|
datetime(2003, 9, 25, 10, 36, 28,
|
|
|
|
tzinfo=self.brsttz))
|
|
|
|
|
|
|
|
def testDateCommandFormatReversed(self):
|
|
|
|
self.assertEqual(parse("2003 10:36:28 BRST 25 Sep Thu",
|
|
|
|
tzinfos=self.tzinfos),
|
|
|
|
datetime(2003, 9, 25, 10, 36, 28,
|
|
|
|
tzinfo=self.brsttz))
|
|
|
|
|
|
|
|
def testDateCommandFormatWithLong(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
if PY2:
|
2018-10-31 16:08:29 +00:00
|
|
|
self.assertEqual(parse("Thu Sep 25 10:36:28 BRST 2003",
|
|
|
|
tzinfos={"BRST": long(-10800)}),
|
|
|
|
datetime(2003, 9, 25, 10, 36, 28,
|
|
|
|
tzinfo=self.brsttz))
|
|
|
|
|
|
|
|
def testISOFormatStrip2(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
self.assertEqual(parse("2003-09-25T10:49:41+03:00"),
|
2018-10-31 16:08:29 +00:00
|
|
|
datetime(2003, 9, 25, 10, 49, 41,
|
2022-01-24 04:07:52 +00:00
|
|
|
tzinfo=tzoffset(None, 10800)))
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testISOStrippedFormatStrip2(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
self.assertEqual(parse("20030925T104941+0300"),
|
|
|
|
datetime(2003, 9, 25, 10, 49, 41,
|
|
|
|
tzinfo=tzoffset(None, 10800)))
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testAMPMNoHour(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
with pytest.raises(ParserError):
|
2018-10-31 16:08:29 +00:00
|
|
|
parse("AM")
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
with pytest.raises(ParserError):
|
2018-10-31 16:08:29 +00:00
|
|
|
parse("Jan 20, 2015 PM")
|
|
|
|
|
|
|
|
def testAMPMRange(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
with pytest.raises(ParserError):
|
2018-10-31 16:08:29 +00:00
|
|
|
parse("13:44 AM")
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
with pytest.raises(ParserError):
|
2018-10-31 16:08:29 +00:00
|
|
|
parse("January 25, 1921 23:13 PM")
|
|
|
|
|
|
|
|
def testPertain(self):
|
|
|
|
self.assertEqual(parse("Sep 03", default=self.default),
|
|
|
|
datetime(2003, 9, 3))
|
|
|
|
self.assertEqual(parse("Sep of 03", default=self.default),
|
|
|
|
datetime(2003, 9, 25))
|
|
|
|
|
|
|
|
def testFuzzy(self):
|
|
|
|
s = "Today is 25 of September of 2003, exactly " \
|
|
|
|
"at 10:49:41 with timezone -03:00."
|
|
|
|
self.assertEqual(parse(s, fuzzy=True),
|
|
|
|
datetime(2003, 9, 25, 10, 49, 41,
|
|
|
|
tzinfo=self.brsttz))
|
|
|
|
|
|
|
|
def testFuzzyWithTokens(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
s1 = "Today is 25 of September of 2003, exactly " \
|
2018-10-31 16:08:29 +00:00
|
|
|
"at 10:49:41 with timezone -03:00."
|
2022-01-24 04:07:52 +00:00
|
|
|
self.assertEqual(parse(s1, fuzzy_with_tokens=True),
|
2018-10-31 16:08:29 +00:00
|
|
|
(datetime(2003, 9, 25, 10, 49, 41,
|
|
|
|
tzinfo=self.brsttz),
|
|
|
|
('Today is ', 'of ', ', exactly at ',
|
|
|
|
' with timezone ', '.')))
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
s2 = "http://biz.yahoo.com/ipo/p/600221.html"
|
|
|
|
self.assertEqual(parse(s2, fuzzy_with_tokens=True),
|
|
|
|
(datetime(2060, 2, 21, 0, 0, 0),
|
|
|
|
('http://biz.yahoo.com/ipo/p/', '.html')))
|
|
|
|
|
2018-10-31 16:08:29 +00:00
|
|
|
def testFuzzyAMPMProblem(self):
|
|
|
|
# Sometimes fuzzy parsing results in AM/PM flag being set without
|
|
|
|
# hours - if it's fuzzy it should ignore that.
|
|
|
|
s1 = "I have a meeting on March 1, 1974."
|
|
|
|
s2 = "On June 8th, 2020, I am going to be the first man on Mars"
|
|
|
|
|
|
|
|
# Also don't want any erroneous AM or PMs changing the parsed time
|
|
|
|
s3 = "Meet me at the AM/PM on Sunset at 3:00 AM on December 3rd, 2003"
|
|
|
|
s4 = "Meet me at 3:00AM on December 3rd, 2003 at the AM/PM on Sunset"
|
|
|
|
|
|
|
|
self.assertEqual(parse(s1, fuzzy=True), datetime(1974, 3, 1))
|
|
|
|
self.assertEqual(parse(s2, fuzzy=True), datetime(2020, 6, 8))
|
|
|
|
self.assertEqual(parse(s3, fuzzy=True), datetime(2003, 12, 3, 3))
|
|
|
|
self.assertEqual(parse(s4, fuzzy=True), datetime(2003, 12, 3, 3))
|
|
|
|
|
|
|
|
def testFuzzyIgnoreAMPM(self):
|
|
|
|
s1 = "Jan 29, 1945 14:45 AM I going to see you there?"
|
2022-01-24 04:07:52 +00:00
|
|
|
with pytest.warns(UnknownTimezoneWarning):
|
|
|
|
res = parse(s1, fuzzy=True)
|
|
|
|
self.assertEqual(res, datetime(1945, 1, 29, 14, 45))
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testRandomFormat24(self):
|
|
|
|
self.assertEqual(parse("0:00 PM, PST", default=self.default,
|
|
|
|
ignoretz=True),
|
|
|
|
datetime(2003, 9, 25, 12, 0))
|
|
|
|
|
|
|
|
def testRandomFormat26(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
with pytest.warns(UnknownTimezoneWarning):
|
|
|
|
res = parse("5:50 A.M. on June 13, 1990")
|
2018-10-31 16:08:29 +00:00
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
self.assertEqual(res, datetime(1990, 6, 13, 5, 50))
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testUnspecifiedDayFallback(self):
|
|
|
|
# Test that for an unspecified day, the fallback behavior is correct.
|
|
|
|
self.assertEqual(parse("April 2009", default=datetime(2010, 1, 31)),
|
|
|
|
datetime(2009, 4, 30))
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
def testUnspecifiedDayFallbackFebNoLeapYear(self):
|
2018-10-31 16:08:29 +00:00
|
|
|
self.assertEqual(parse("Feb 2007", default=datetime(2010, 1, 31)),
|
|
|
|
datetime(2007, 2, 28))
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
def testUnspecifiedDayFallbackFebLeapYear(self):
|
2018-10-31 16:08:29 +00:00
|
|
|
self.assertEqual(parse("Feb 2008", default=datetime(2010, 1, 31)),
|
|
|
|
datetime(2008, 2, 29))
|
|
|
|
|
|
|
|
def testErrorType01(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse('shouldfail')
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testCorrectErrorOnFuzzyWithTokens(self):
|
2022-01-24 04:07:52 +00:00
|
|
|
assertRaisesRegex(self, ParserError, 'Unknown string format',
|
2018-10-31 16:08:29 +00:00
|
|
|
parse, '04/04/32/423', fuzzy_with_tokens=True)
|
2022-01-24 04:07:52 +00:00
|
|
|
assertRaisesRegex(self, ParserError, 'Unknown string format',
|
2018-10-31 16:08:29 +00:00
|
|
|
parse, '04/04/04 +32423', fuzzy_with_tokens=True)
|
2022-01-24 04:07:52 +00:00
|
|
|
assertRaisesRegex(self, ParserError, 'Unknown string format',
|
2018-10-31 16:08:29 +00:00
|
|
|
parse, '04/04/0d4', fuzzy_with_tokens=True)
|
|
|
|
|
|
|
|
def testIncreasingCTime(self):
|
|
|
|
# This test will check 200 different years, every month, every day,
|
|
|
|
# every hour, every minute, every second, and every weekday, using
|
|
|
|
# a delta of more or less 1 year, 1 month, 1 day, 1 minute and
|
|
|
|
# 1 second.
|
|
|
|
delta = timedelta(days=365+31+1, seconds=1+60+60*60)
|
|
|
|
dt = datetime(1900, 1, 1, 0, 0, 0, 0)
|
|
|
|
for i in range(200):
|
2022-01-24 04:07:52 +00:00
|
|
|
assert parse(dt.ctime()) == dt
|
2018-10-31 16:08:29 +00:00
|
|
|
dt += delta
|
|
|
|
|
|
|
|
def testIncreasingISOFormat(self):
|
|
|
|
delta = timedelta(days=365+31+1, seconds=1+60+60*60)
|
|
|
|
dt = datetime(1900, 1, 1, 0, 0, 0, 0)
|
|
|
|
for i in range(200):
|
2022-01-24 04:07:52 +00:00
|
|
|
assert parse(dt.isoformat()) == dt
|
2018-10-31 16:08:29 +00:00
|
|
|
dt += delta
|
|
|
|
|
|
|
|
def testMicrosecondsPrecisionError(self):
|
|
|
|
# Skip found out that sad precision problem. :-(
|
|
|
|
dt1 = parse("00:11:25.01")
|
|
|
|
dt2 = parse("00:12:10.01")
|
2022-01-24 04:07:52 +00:00
|
|
|
assert dt1.microsecond == 10000
|
|
|
|
assert dt2.microsecond == 10000
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testMicrosecondPrecisionErrorReturns(self):
|
|
|
|
# One more precision issue, discovered by Eric Brown. This should
|
|
|
|
# be the last one, as we're no longer using floating points.
|
|
|
|
for ms in [100001, 100000, 99999, 99998,
|
|
|
|
10001, 10000, 9999, 9998,
|
|
|
|
1001, 1000, 999, 998,
|
|
|
|
101, 100, 99, 98]:
|
|
|
|
dt = datetime(2008, 2, 27, 21, 26, 1, ms)
|
2022-01-24 04:07:52 +00:00
|
|
|
assert parse(dt.isoformat()) == dt
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testCustomParserInfo(self):
|
|
|
|
# Custom parser info wasn't working, as Michael Elsdörfer discovered.
|
|
|
|
from dateutil.parser import parserinfo, parser
|
|
|
|
|
|
|
|
class myparserinfo(parserinfo):
|
|
|
|
MONTHS = parserinfo.MONTHS[:]
|
|
|
|
MONTHS[0] = ("Foo", "Foo")
|
|
|
|
myparser = parser(myparserinfo())
|
|
|
|
dt = myparser.parse("01/Foo/2007")
|
2022-01-24 04:07:52 +00:00
|
|
|
assert dt == datetime(2007, 1, 1)
|
|
|
|
|
|
|
|
def testCustomParserShortDaynames(self):
|
|
|
|
# Horacio Hoyos discovered that day names shorter than 3 characters,
|
|
|
|
# for example two letter German day name abbreviations, don't work:
|
|
|
|
# https://github.com/dateutil/dateutil/issues/343
|
|
|
|
from dateutil.parser import parserinfo, parser
|
|
|
|
|
|
|
|
class GermanParserInfo(parserinfo):
|
|
|
|
WEEKDAYS = [("Mo", "Montag"),
|
|
|
|
("Di", "Dienstag"),
|
|
|
|
("Mi", "Mittwoch"),
|
|
|
|
("Do", "Donnerstag"),
|
|
|
|
("Fr", "Freitag"),
|
|
|
|
("Sa", "Samstag"),
|
|
|
|
("So", "Sonntag")]
|
|
|
|
|
|
|
|
myparser = parser(GermanParserInfo())
|
|
|
|
dt = myparser.parse("Sa 21. Jan 2017")
|
|
|
|
self.assertEqual(dt, datetime(2017, 1, 21))
|
2018-10-31 16:08:29 +00:00
|
|
|
|
|
|
|
def testNoYearFirstNoDayFirst(self):
|
|
|
|
dtstr = '090107'
|
|
|
|
|
|
|
|
# Should be MMDDYY
|
|
|
|
self.assertEqual(parse(dtstr),
|
|
|
|
datetime(2007, 9, 1))
|
|
|
|
|
|
|
|
self.assertEqual(parse(dtstr, yearfirst=False, dayfirst=False),
|
|
|
|
datetime(2007, 9, 1))
|
|
|
|
|
|
|
|
def testYearFirst(self):
|
|
|
|
dtstr = '090107'
|
|
|
|
|
|
|
|
# Should be MMDDYY
|
|
|
|
self.assertEqual(parse(dtstr, yearfirst=True),
|
|
|
|
datetime(2009, 1, 7))
|
|
|
|
|
|
|
|
self.assertEqual(parse(dtstr, yearfirst=True, dayfirst=False),
|
|
|
|
datetime(2009, 1, 7))
|
|
|
|
|
|
|
|
def testDayFirst(self):
|
|
|
|
dtstr = '090107'
|
|
|
|
|
|
|
|
# Should be DDMMYY
|
|
|
|
self.assertEqual(parse(dtstr, dayfirst=True),
|
|
|
|
datetime(2007, 1, 9))
|
|
|
|
|
|
|
|
self.assertEqual(parse(dtstr, yearfirst=False, dayfirst=True),
|
|
|
|
datetime(2007, 1, 9))
|
|
|
|
|
|
|
|
def testDayFirstYearFirst(self):
|
|
|
|
dtstr = '090107'
|
|
|
|
# Should be YYDDMM
|
|
|
|
self.assertEqual(parse(dtstr, yearfirst=True, dayfirst=True),
|
|
|
|
datetime(2009, 7, 1))
|
|
|
|
|
|
|
|
def testUnambiguousYearFirst(self):
|
|
|
|
dtstr = '2015 09 25'
|
|
|
|
self.assertEqual(parse(dtstr, yearfirst=True),
|
|
|
|
datetime(2015, 9, 25))
|
|
|
|
|
|
|
|
def testUnambiguousDayFirst(self):
|
|
|
|
dtstr = '2015 09 25'
|
2022-01-24 04:07:52 +00:00
|
|
|
self.assertEqual(parse(dtstr, dayfirst=True),
|
2018-10-31 16:08:29 +00:00
|
|
|
datetime(2015, 9, 25))
|
|
|
|
|
|
|
|
def testUnambiguousDayFirstYearFirst(self):
|
|
|
|
dtstr = '2015 09 25'
|
|
|
|
self.assertEqual(parse(dtstr, dayfirst=True, yearfirst=True),
|
|
|
|
datetime(2015, 9, 25))
|
|
|
|
|
2022-01-24 04:07:52 +00:00
|
|
|
def test_mstridx(self):
|
|
|
|
# See GH408
|
|
|
|
dtstr = '2015-15-May'
|
|
|
|
self.assertEqual(parse(dtstr),
|
|
|
|
datetime(2015, 5, 15))
|
|
|
|
|
|
|
|
def test_idx_check(self):
|
|
|
|
dtstr = '2017-07-17 06:15:'
|
|
|
|
# Pre-PR, the trailing colon will cause an IndexError at 824-825
|
|
|
|
# when checking `i < len_l` and then accessing `l[i+1]`
|
|
|
|
res = parse(dtstr, fuzzy=True)
|
|
|
|
assert res == datetime(2017, 7, 17, 6, 15)
|
|
|
|
|
|
|
|
def test_hmBY(self):
|
|
|
|
# See GH#483
|
|
|
|
dtstr = '02:17NOV2017'
|
|
|
|
res = parse(dtstr, default=self.default)
|
|
|
|
assert res == datetime(2017, 11, self.default.day, 2, 17)
|
|
|
|
|
|
|
|
def test_validate_hour(self):
|
|
|
|
# See GH353
|
|
|
|
invalid = "201A-01-01T23:58:39.239769+03:00"
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse(invalid)
|
|
|
|
|
|
|
|
def test_era_trailing_year(self):
|
|
|
|
dstr = 'AD2001'
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res.year == 2001, res
|
|
|
|
|
|
|
|
def test_includes_timestr(self):
|
|
|
|
timestr = "2020-13-97T44:61:83"
|
|
|
|
|
|
|
|
try:
|
|
|
|
parse(timestr)
|
|
|
|
except ParserError as e:
|
|
|
|
assert e.args[1] == timestr
|
|
|
|
else:
|
|
|
|
pytest.fail("Failed to raise ParserError")
|
|
|
|
|
|
|
|
|
|
|
|
class TestOutOfBounds(object):
|
|
|
|
|
|
|
|
def test_no_year_zero(self):
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse("0000 Jun 20")
|
|
|
|
|
|
|
|
def test_out_of_bound_day(self):
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse("Feb 30, 2007")
|
|
|
|
|
|
|
|
def test_illegal_month_error(self):
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse("0-100")
|
|
|
|
|
|
|
|
def test_day_sanity(self, fuzzy):
|
|
|
|
dstr = "2014-15-25"
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse(dstr, fuzzy=fuzzy)
|
|
|
|
|
|
|
|
def test_minute_sanity(self, fuzzy):
|
|
|
|
dstr = "2014-02-28 22:64"
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse(dstr, fuzzy=fuzzy)
|
|
|
|
|
|
|
|
def test_hour_sanity(self, fuzzy):
|
|
|
|
dstr = "2014-02-28 25:16 PM"
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse(dstr, fuzzy=fuzzy)
|
|
|
|
|
|
|
|
def test_second_sanity(self, fuzzy):
|
|
|
|
dstr = "2014-02-28 22:14:64"
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse(dstr, fuzzy=fuzzy)
|
|
|
|
|
|
|
|
|
|
|
|
class TestParseUnimplementedCases(object):
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_somewhat_ambiguous_string(self):
|
|
|
|
# Ref: github issue #487
|
|
|
|
# The parser is choosing the wrong part for hour
|
|
|
|
# causing datetime to raise an exception.
|
|
|
|
dtstr = '1237 PM BRST Mon Oct 30 2017'
|
|
|
|
res = parse(dtstr, tzinfo=self.tzinfos)
|
|
|
|
assert res == datetime(2017, 10, 30, 12, 37, tzinfo=self.tzinfos)
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_YmdH_M_S(self):
|
|
|
|
# found in nasdaq's ftp data
|
|
|
|
dstr = '1991041310:19:24'
|
|
|
|
expected = datetime(1991, 4, 13, 10, 19, 24)
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res == expected, (res, expected)
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_first_century(self):
|
|
|
|
dstr = '0031 Nov 03'
|
|
|
|
expected = datetime(31, 11, 3)
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res == expected, res
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_era_trailing_year_with_dots(self):
|
|
|
|
dstr = 'A.D.2001'
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res.year == 2001, res
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_ad_nospace(self):
|
|
|
|
expected = datetime(6, 5, 19)
|
|
|
|
for dstr in [' 6AD May 19', ' 06AD May 19',
|
|
|
|
' 006AD May 19', ' 0006AD May 19']:
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res == expected, (dstr, res)
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_four_letter_day(self):
|
|
|
|
dstr = 'Frid Dec 30, 2016'
|
|
|
|
expected = datetime(2016, 12, 30)
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_non_date_number(self):
|
|
|
|
dstr = '1,700'
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse(dstr)
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_on_era(self):
|
|
|
|
# This could be classified as an "eras" test, but the relevant part
|
|
|
|
# about this is the ` on `
|
|
|
|
dstr = '2:15 PM on January 2nd 1973 A.D.'
|
|
|
|
expected = datetime(1973, 1, 2, 14, 15)
|
|
|
|
res = parse(dstr)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_extraneous_year(self):
|
|
|
|
# This was found in the wild at insidertrading.org
|
|
|
|
dstr = "2011 MARTIN CHILDREN'S IRREVOCABLE TRUST u/a/d NOVEMBER 7, 2012"
|
|
|
|
res = parse(dstr, fuzzy_with_tokens=True)
|
|
|
|
expected = datetime(2012, 11, 7)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_extraneous_year_tokens(self):
|
|
|
|
# This was found in the wild at insidertrading.org
|
|
|
|
# Unlike in the case above, identifying the first "2012" as the year
|
|
|
|
# would not be a problem, but inferring that the latter 2012 is hhmm
|
|
|
|
# is a problem.
|
|
|
|
dstr = "2012 MARTIN CHILDREN'S IRREVOCABLE TRUST u/a/d NOVEMBER 7, 2012"
|
|
|
|
expected = datetime(2012, 11, 7)
|
|
|
|
(res, tokens) = parse(dstr, fuzzy_with_tokens=True)
|
|
|
|
assert res == expected
|
|
|
|
assert tokens == ("2012 MARTIN CHILDREN'S IRREVOCABLE TRUST u/a/d ",)
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_extraneous_year2(self):
|
|
|
|
# This was found in the wild at insidertrading.org
|
|
|
|
dstr = ("Berylson Amy Smith 1998 Grantor Retained Annuity Trust "
|
|
|
|
"u/d/t November 2, 1998 f/b/o Jennifer L Berylson")
|
|
|
|
res = parse(dstr, fuzzy_with_tokens=True)
|
|
|
|
expected = datetime(1998, 11, 2)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_extraneous_year3(self):
|
|
|
|
# This was found in the wild at insidertrading.org
|
|
|
|
dstr = "SMITH R & WEISS D 94 CHILD TR FBO M W SMITH UDT 12/1/1994"
|
|
|
|
res = parse(dstr, fuzzy_with_tokens=True)
|
|
|
|
expected = datetime(1994, 12, 1)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_unambiguous_YYYYMM(self):
|
|
|
|
# 171206 can be parsed as YYMMDD. However, 201712 cannot be parsed
|
|
|
|
# as instance of YYMMDD and parser could fallback to YYYYMM format.
|
|
|
|
dstr = "201712"
|
|
|
|
res = parse(dstr)
|
|
|
|
expected = datetime(2017, 12, 1)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
@pytest.mark.xfail
|
|
|
|
def test_extraneous_numerical_content(self):
|
|
|
|
# ref: https://github.com/dateutil/dateutil/issues/1029
|
|
|
|
# parser interprets price and percentage as parts of the date
|
|
|
|
dstr = "£14.99 (25% off, until April 20)"
|
|
|
|
res = parse(dstr, fuzzy=True, default=datetime(2000, 1, 1))
|
|
|
|
expected = datetime(2000, 4, 20)
|
|
|
|
assert res == expected
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.skipif(IS_WIN, reason="Windows does not use TZ var")
|
|
|
|
class TestTZVar(object):
|
|
|
|
def test_parse_unambiguous_nonexistent_local(self):
|
|
|
|
# When dates are specified "EST" even when they should be "EDT" in the
|
|
|
|
# local time zone, we should still assign the local time zone
|
|
|
|
with TZEnvContext('EST+5EDT,M3.2.0/2,M11.1.0/2'):
|
|
|
|
dt_exp = datetime(2011, 8, 1, 12, 30, tzinfo=tz.tzlocal())
|
|
|
|
dt = parse('2011-08-01T12:30 EST')
|
|
|
|
|
|
|
|
assert dt.tzname() == 'EDT'
|
|
|
|
assert dt == dt_exp
|
|
|
|
|
|
|
|
def test_tzlocal_in_gmt(self):
|
|
|
|
# GH #318
|
|
|
|
with TZEnvContext('GMT0BST,M3.5.0,M10.5.0'):
|
|
|
|
# This is an imaginary datetime in tz.tzlocal() but should still
|
|
|
|
# parse using the GMT-as-alias-for-UTC rule
|
|
|
|
dt = parse('2004-05-01T12:00 GMT')
|
|
|
|
dt_exp = datetime(2004, 5, 1, 12, tzinfo=tz.UTC)
|
|
|
|
|
|
|
|
assert dt == dt_exp
|
|
|
|
|
|
|
|
def test_tzlocal_parse_fold(self):
|
|
|
|
# One manifestion of GH #318
|
|
|
|
with TZEnvContext('EST+5EDT,M3.2.0/2,M11.1.0/2'):
|
|
|
|
dt_exp = datetime(2011, 11, 6, 1, 30, tzinfo=tz.tzlocal())
|
|
|
|
dt_exp = tz.enfold(dt_exp, fold=1)
|
|
|
|
dt = parse('2011-11-06T01:30 EST')
|
|
|
|
|
|
|
|
# Because this is ambiguous, until `tz.tzlocal() is tz.tzlocal()`
|
|
|
|
# we'll just check the attributes we care about rather than
|
|
|
|
# dt == dt_exp
|
|
|
|
assert dt.tzname() == dt_exp.tzname()
|
|
|
|
assert dt.replace(tzinfo=None) == dt_exp.replace(tzinfo=None)
|
|
|
|
assert getattr(dt, 'fold') == getattr(dt_exp, 'fold')
|
|
|
|
assert dt.astimezone(tz.UTC) == dt_exp.astimezone(tz.UTC)
|
|
|
|
|
|
|
|
|
|
|
|
def test_parse_tzinfos_fold():
|
|
|
|
NYC = tz.gettz('America/New_York')
|
|
|
|
tzinfos = {'EST': NYC, 'EDT': NYC}
|
|
|
|
|
|
|
|
dt_exp = tz.enfold(datetime(2011, 11, 6, 1, 30, tzinfo=NYC), fold=1)
|
|
|
|
dt = parse('2011-11-06T01:30 EST', tzinfos=tzinfos)
|
|
|
|
|
|
|
|
assert dt == dt_exp
|
|
|
|
assert dt.tzinfo is dt_exp.tzinfo
|
|
|
|
assert getattr(dt, 'fold') == getattr(dt_exp, 'fold')
|
|
|
|
assert dt.astimezone(tz.UTC) == dt_exp.astimezone(tz.UTC)
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize('dtstr,dt', [
|
|
|
|
('5.6h', datetime(2003, 9, 25, 5, 36)),
|
|
|
|
('5.6m', datetime(2003, 9, 25, 0, 5, 36)),
|
|
|
|
# '5.6s' never had a rounding problem, test added for completeness
|
|
|
|
('5.6s', datetime(2003, 9, 25, 0, 0, 5, 600000))
|
|
|
|
])
|
|
|
|
def test_rounding_floatlike_strings(dtstr, dt):
|
|
|
|
assert parse(dtstr, default=datetime(2003, 9, 25)) == dt
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.parametrize('value', ['1: test', 'Nan'])
|
|
|
|
def test_decimal_error(value):
|
|
|
|
# GH 632, GH 662 - decimal.Decimal raises some non-ParserError exception
|
|
|
|
# when constructed with an invalid value
|
|
|
|
with pytest.raises(ParserError):
|
|
|
|
parse(value)
|
|
|
|
|
|
|
|
def test_parsererror_repr():
|
|
|
|
# GH 991 — the __repr__ was not properly indented and so was never defined.
|
|
|
|
# This tests the current behavior of the ParserError __repr__, but the
|
|
|
|
# precise format is not guaranteed to be stable and may change even in
|
|
|
|
# minor versions. This test exists to avoid regressions.
|
|
|
|
s = repr(ParserError("Problem with string: %s", "2019-01-01"))
|
|
|
|
|
|
|
|
assert s == "ParserError('Problem with string: %s', '2019-01-01')"
|