chrono_english/
lib.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
//! ## Parsing English Dates
//!
//! I've always admired the ability of the GNU `date` command to
//! convert "English" expressions to dates and times with `date -d expr`.
//! `chrono-english` does similar expressions, although with extensions, so
//! that for instance you can specify both the day and the time "next friday 8pm".
//! No attempt at full natural language parsing is made - only a limited set of
//! patterns is supported.
//!
//! ## Supported Formats
//!
//! `chrono-english` does _absolute_ dates:  ISO-like dates "2018-04-01" and the month name forms
//! "1 April 2018" and "April 1, 2018". (There's no ambiguity so both of these forms are fine)
//!
//! The informal "01/04/18" or American form "04/01/18" is supported.
//! There is a `Dialect` enum to specify what kind of date English you would like to speak.
//! Both short and long years are accepted in this form; short dates pivot between 1940 and 2040.
//!
//! Then there are are _relative_ dates like 'April 1' and '9/11' (this
//! if using `Dialect::Us`). The current year is assumed, but this can be modified by 'next'
//! and 'last'. For instance, it is now the 13th of March, 2018: 'April 1' and 'next April 1'
//! are in 2018; 'last April 1' is in 2017.
//!
//! Another relative form is simply a month name
//! like 'apr' or 'April' (case-insensitive, only first three letters significant) where the
//! day is assumed to be the 1st.
//!
//! A week-day works in the same way: 'friday' means this
//! coming Friday, relative to today. 'last Friday' is unambiguous,
//! but 'next Friday' has different meanings; in the US it means the same as 'Friday'
//! but otherwise it means the Friday of next week (plus 7 days)
//!
//! Date and time can be specified also by a number of time units. So "2 days", "3 hours".
//! Again, first three letters, but 'd','m' and 'y' are understood (so "3h"). We make
//! a distinction between _second_ intervals (seconds,minutes,hours,days,weeks) and _month_
//! intervals (months,years).  Month intervals always give us the same date, if possible
//! But adding a month to "30 Jan" will give "28 Feb" or "29 Feb" depending if a leap year.
//!
//! Finally, dates may be followed by time. Either 'formal' like 18:03, with optional
//! second (like 18:03:40) or 'informal' like 6.03pm. So one gets "next friday 8pm' and so
//! forth.
//!
//! ## API
//!
//! There are two entry points: `parse_date_string` and `parse_duration`. The
//! first is given the date string, a `DateTime` from which relative dates and
//! times operate, and a dialect (either `Dialect::Uk` or `Dialect::Us`
//! currently.) The base time also specifies the desired timezone.
//!
//! ```ignore
//! extern crate chrono_english;
//! extern crate chrono;
//! use chrono_english::{parse_date_string,Dialect};
//!
//! use chrono::prelude::*;
//!
//! let date_time = parse_date_string("next friday 8pm", Local::now(), Dialect::Uk)?;
//! println!("{}",date_time.format("%c"));
//! ```
//!
//! There is a little command-line program `parse-date` in the `examples` folder which can be used to play
//! with these expressions.
//!
//! The other function, `parse_duration`, lets you access just the relative part
//! of a string like 'two days ago' or '12 hours'. If successful, returns an
//! `Interval`, which is a number of seconds, days, or months.
//!
//! ```
//! use chrono_english::{parse_duration,Interval};
//!
//! assert_eq!(parse_duration("15m ago").unwrap(), Interval::Seconds(-15 * 60));
//! ```
//!

extern crate chrono;
extern crate scanlex;
use chrono::prelude::*;

mod errors;
mod parser;
mod types;
use errors::*;
use types::*;

pub use errors::{DateError, DateResult};
pub use types::Interval;

#[derive(Clone, Copy, Debug)]
pub enum Dialect {
    Uk,
    Us,
}

pub fn parse_date_string<Tz: TimeZone>(
    s: &str,
    now: DateTime<Tz>,
    dialect: Dialect,
) -> DateResult<DateTime<Tz>>
where
    Tz::Offset: Copy,
{
    let mut dp = parser::DateParser::new(s);
    if let Dialect::Us = dialect {
        dp = dp.american_date();
    }
    let d = dp.parse()?;

    // we may have explicit hour:minute:sec
    let tspec = match d.time {
        Some(tspec) => tspec,
        None => TimeSpec::new_empty(),
    };
    if tspec.offset.is_some() {
        //   return DateTime::fix()::parse_from_rfc3339(s);
    }
    let date_time = if let Some(dspec) = d.date {
        dspec
            .to_date_time(now, tspec, dp.american)
            .or_err("bad date")?
    } else {
        // no date, time set for today's date
        tspec.to_date_time(now.date()).or_err("bad time")?
    };
    Ok(date_time)
}

pub fn parse_duration(s: &str) -> DateResult<Interval> {
    let mut dp = parser::DateParser::new(s);
    let d = dp.parse()?;

    if d.time.is_some() {
        return date_result("unexpected time component");
    }

    // shouldn't happen, but.
    if d.date.is_none() {
        return date_result("could not parse date");
    }

    match d.date.unwrap() {
        DateSpec::Absolute(_) => date_result("unexpected absolute date"),
        DateSpec::FromName(_) => date_result("unexpected date component"),
        DateSpec::Relative(skip) => Ok(skip.to_interval()),
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    const FMT_ISO: &str = "%+";

    fn display(t: DateResult<DateTime<Utc>>) -> String {
        t.unwrap().format(FMT_ISO).to_string()
    }

    #[test]
    fn basics() {
        let base = parse_date_string("2018-03-21 11:00", Utc::now(), Dialect::Uk).unwrap();

        // Day of week - relative to today. May have a time part
        assert_eq!(
            display(parse_date_string("friday", base, Dialect::Uk)),
            "2018-03-23T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("friday 10:30", base, Dialect::Uk)),
            "2018-03-23T10:30:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("friday 8pm", base, Dialect::Uk)),
            "2018-03-23T20:00:00+00:00"
        );

        // The day of week is the _next_ day after today, so "Tuesday" is the next Tuesday after Wednesday
        assert_eq!(
            display(parse_date_string("tues", base, Dialect::Uk)),
            "2018-03-27T00:00:00+00:00"
        );

        // The expression 'next Monday' is ambiguous; in the US it means the day following (same as 'Monday')
        // (This is how the `date` command interprets it)
        assert_eq!(
            display(parse_date_string("next mon", base, Dialect::Us)),
            "2018-03-26T00:00:00+00:00"
        );
        // but otherwise it means the day in the next week..
        assert_eq!(
            display(parse_date_string("next mon", base, Dialect::Uk)),
            "2018-04-02T00:00:00+00:00"
        );

        assert_eq!(
            display(parse_date_string("last fri 9.30", base, Dialect::Uk)),
            "2018-03-16T09:30:00+00:00"
        );

        // date expressed as month, day - relative to today. May have a time part
        assert_eq!(
            display(parse_date_string("9/11", base, Dialect::Us)),
            "2018-09-11T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("last 9/11", base, Dialect::Us)),
            "2017-09-11T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("last 9/11 9am", base, Dialect::Us)),
            "2017-09-11T09:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("April 1 8.30pm", base, Dialect::Uk)),
            "2018-04-01T20:30:00+00:00"
        );

        // advance by time unit from today
        // without explicit time, use base time - otherwise override
        assert_eq!(
            display(parse_date_string("2d", base, Dialect::Uk)),
            "2018-03-23T11:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("2d 03:00", base, Dialect::Uk)),
            "2018-03-23T03:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("3 weeks", base, Dialect::Uk)),
            "2018-04-11T11:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("3h", base, Dialect::Uk)),
            "2018-03-21T14:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("6 months", base, Dialect::Uk)),
            "2018-09-21T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("6 months ago", base, Dialect::Uk)),
            "2017-09-21T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("3 hours ago", base, Dialect::Uk)),
            "2018-03-21T08:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string(" -3h", base, Dialect::Uk)),
            "2018-03-21T08:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string(" -3 month", base, Dialect::Uk)),
            "2017-12-21T00:00:00+00:00"
        );

        // absolute date with year, month, day - formal ISO and informal UK or US
        assert_eq!(
            display(parse_date_string("2017-06-30", base, Dialect::Uk)),
            "2017-06-30T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("30/06/17", base, Dialect::Uk)),
            "2017-06-30T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("06/30/17", base, Dialect::Us)),
            "2017-06-30T00:00:00+00:00"
        );

        // may be followed by time part, formal and informal
        assert_eq!(
            display(parse_date_string("2017-06-30 08:20:30", base, Dialect::Uk)),
            "2017-06-30T08:20:30+00:00"
        );
        assert_eq!(
            display(parse_date_string(
                "2017-06-30 08:20:30 +02:00",
                base,
                Dialect::Uk
            )),
            "2017-06-30T06:20:30+00:00"
        );
        assert_eq!(
            display(parse_date_string(
                "2017-06-30 08:20:30 +0200",
                base,
                Dialect::Uk
            )),
            "2017-06-30T06:20:30+00:00"
        );
        assert_eq!(
            display(parse_date_string("2017-06-30T08:20:30Z", base, Dialect::Uk)),
            "2017-06-30T08:20:30+00:00"
        );
        assert_eq!(
            display(parse_date_string("2017-06-30T08:20:30", base, Dialect::Uk)),
            "2017-06-30T08:20:30+00:00"
        );
        assert_eq!(
            display(parse_date_string("2017-06-30 8.20", base, Dialect::Uk)),
            "2017-06-30T08:20:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("2017-06-30 8.30pm", base, Dialect::Uk)),
            "2017-06-30T20:30:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("2017-06-30 8:30pm", base, Dialect::Uk)),
            "2017-06-30T20:30:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("2017-06-30 2am", base, Dialect::Uk)),
            "2017-06-30T02:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("30 June 2018", base, Dialect::Uk)),
            "2018-06-30T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("June 30, 2018", base, Dialect::Uk)),
            "2018-06-30T00:00:00+00:00"
        );
        assert_eq!(
            display(parse_date_string("June   30,    2018", base, Dialect::Uk)),
            "2018-06-30T00:00:00+00:00"
        );
    }

    fn get_err(r: DateResult<Interval>) -> String {
        r.err().unwrap().to_string()
    }

    #[test]
    fn durations() {
        assert_eq!(parse_duration("6h").unwrap(), Interval::Seconds(6 * 3600));
        assert_eq!(
            parse_duration("4 hours ago").unwrap(),
            Interval::Seconds(-4 * 3600)
        );
        assert_eq!(parse_duration("5 min").unwrap(), Interval::Seconds(5 * 60));
        assert_eq!(parse_duration("10m").unwrap(), Interval::Seconds(10 * 60));
        assert_eq!(
            parse_duration("15m ago").unwrap(),
            Interval::Seconds(-15 * 60)
        );

        assert_eq!(parse_duration("1 day").unwrap(), Interval::Days(1));
        assert_eq!(parse_duration("2 days ago").unwrap(), Interval::Days(-2));
        assert_eq!(parse_duration("3 weeks").unwrap(), Interval::Days(21));
        assert_eq!(parse_duration("2 weeks ago").unwrap(), Interval::Days(-14));

        assert_eq!(parse_duration("1 month").unwrap(), Interval::Months(1));
        assert_eq!(parse_duration("6 months").unwrap(), Interval::Months(6));
        assert_eq!(parse_duration("8 years").unwrap(), Interval::Months(12 * 8));

        // errors
        assert_eq!(
            get_err(parse_duration("2020-01-01")),
            "unexpected absolute date"
        );
        assert_eq!(
            get_err(parse_duration("2 days 15:00")),
            "unexpected time component"
        );
        assert_eq!(
            get_err(parse_duration("tuesday")),
            "unexpected date component"
        );
        assert_eq!(
            get_err(parse_duration("bananas")),
            "expected week day or month name"
        );
    }
}