sclass EnglishDateParser > DateStructures { replace P with ParsedWithTokens. bool assumeFuture = true; // e.g. for "tuesday" [not used] LS tok; int maxTokens = 3; L
> longestParses(S s) { ret pwt_topDogs(pwt_filterByType SomeDate(allParses(s))); } SomeDate parse(S s) { ret getVar(first(longestParses(s))); } ItIt
allParses(S s) { // tokenize, initialize tok = javaTok(s); new L
out;
L > initials = concatMap(codeTokens, lai -> pwt_followingTokens(1, maxTokens, lai));
// find numbers
L > numbers = pwt_transform(number(), initials);
// find ordinals (1st, 2nd, ...)
new L > ordinals;
for (P > years = pwt_filter isYear(numbers);
out.addAll(years);
L > months = pwt_filter isMonthNr(numbers);
L > dayOfMonths = pwt_filter isDayOfMonth(numbers);
L > weekdays = concatMap parseWeekday(codeTokens);
out.addAll(weekdays);
// month names
L > monthNames = concatMap parseMonthName(codeTokens);
out.addAll(monthNames);
// month name + year, e.g. "February 2020"
out.addAll(pwt_combine(monthNames, years, (month, year) -> new Month(month.month, new Year(year))));
// month name + ordinal, e.g. "March 4th"
out.addAll(pwt_combine(monthNames, ordinals, (month, ord) -> new Day(ord, month)));
// yesterday, today, tomorrow
// "next > parseFixedToken(S token, ListAndIndex > parseFixedToken_before(S token, ListAndIndex > parseOneOfFixedTokens(Set > parseWeekday(ListAndIndex > parseMonthName(ListAndIndex ord : parseToTheRight(fixedToken("st", "nd", "rd", "th"), number))
ordinals.add(pwt_combine(number, ord));
//print(+ordinals);
// "in in : print("in", parseToTheLeft(fixedToken("in"), number)))
for (P days : parseToTheRight(fixedToken("day", "days"), number))
out.add(pwt_combine(new TodayPlus(number!), in, days));
// " daysFromNow : parseToTheRight(fixedToken("day from now", "days from now"), number))
out.add(pwt_combine(new TodayPlus(number!), number, daysFromNow));
L next : parseToTheLeft(fixedToken("next"), weekday))
out.add(pwt_combine(new Weekday(weekday->weekday, new CurrentWeekPlus(1)), next, weekday));
for (P slash : parseToTheRight(fixedToken("/"), year))
for (P slash2 : parseToTheRight(fixedToken("/"), month))
for (P number() {
ret s -> isInteger(s) ? parseInt(s) : null;
}
bool isYear(int n) {
ret between(n, 1900, 2100);
}
bool isMonthNr(int n) {
ret between(n, 1, 12);
}
bool isDayOfMonth(int n) {
ret between(n, 1, 31);
}
IF1 fixedToken(S... tokens) { ret fixedToken(litciset(tokens)); }
IF1 fixedToken(Set set) { ret t -> contains(set, t) ? t : null; }
ItIt toParse) {
ret filterI(pwt_followingTokens(1, maxTokens, toParse), p -> eqic(p!, token));
}
ItIt toParse) {
ret filterI(pwt_precedingTokens(1, maxTokens, toParse), p -> eqic(p!, token));
}
ItIt tokens, ListAndIndex toParse) {
ret filterI(pwt_followingTokens(1, maxTokens, toParse), p -> contains(tokens, p!));
}
ItIt toParse) {
ret pwt_mapI(s -> new Weekday(parseEnglishWeekday(s)), parseOneOfFixedTokens(englishWeekdays_ciSet(), toParse));
}
ItIt toParse) {
ret pwt_mapI(s -> new Month(parseEnglishMonthName(s)), parseOneOfFixedTokens(englishMonthNames_ciSet(), toParse));
}
L