2005-09-15 09:58:31 -04:00
|
|
|
/* Parser of HTTP date */
|
|
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
|
|
#include "config.h"
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
|
|
|
|
|
|
|
#ifdef HAVE_SYS_TIME_H
|
|
|
|
#include <sys/time.h>
|
|
|
|
#endif
|
|
|
|
#include <time.h>
|
|
|
|
|
|
|
|
#include "elinks.h"
|
|
|
|
|
|
|
|
#include "protocol/date.h"
|
|
|
|
#include "util/conv.h"
|
|
|
|
#include "util/time.h"
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Sun, 06 Nov 1994 08:49:37 GMT ; RFC 822, updated by RFC 1123
|
|
|
|
* Sunday, 06-Nov-94 08:49:37 GMT ; RFC 850, obsoleted by RFC 1036
|
|
|
|
* Sun Nov 6 08:49:37 1994 ; ANSI C's asctime() format
|
|
|
|
*/
|
|
|
|
|
|
|
|
int
|
2021-01-02 10:20:27 -05:00
|
|
|
parse_year(const char **date_p, char *end)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
2021-01-02 10:20:27 -05:00
|
|
|
const char *date = *date_p;
|
2005-09-15 09:58:31 -04:00
|
|
|
int year;
|
|
|
|
|
|
|
|
if ((end && date + 1 >= end)
|
|
|
|
|| !isdigit(date[0])
|
|
|
|
|| !isdigit(date[1]))
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
year = (date[0] - '0') * 10 + date[1] - '0';
|
|
|
|
|
|
|
|
if ((!end || date + 3 < end)
|
|
|
|
&& isdigit(date[2])
|
|
|
|
&& isdigit(date[3])) {
|
|
|
|
/* Four digits date */
|
|
|
|
year = year * 10 + date[2] - '0';
|
|
|
|
year = year * 10 + date[3] - '0' - 1900;
|
|
|
|
date += 4;
|
|
|
|
|
|
|
|
} else if (year < 70) {
|
|
|
|
/* Assuming the epoch starting at 1.1.1970 so it's already next
|
|
|
|
* century. --wget */
|
|
|
|
year += 100;
|
|
|
|
date += 2;
|
|
|
|
}
|
|
|
|
|
|
|
|
*date_p = date;
|
|
|
|
return year;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
2021-01-02 10:20:27 -05:00
|
|
|
parse_month(const char **buf, char *end)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
2021-01-02 10:20:27 -05:00
|
|
|
const char *month = *buf;
|
2005-09-15 09:58:31 -04:00
|
|
|
int monthnum;
|
|
|
|
|
|
|
|
/* Check that the buffer has atleast 3 chars. */
|
|
|
|
if ((end && month + 2 > end)
|
|
|
|
|| !month[0] || !month[1] || !month[2])
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
monthnum = month2num(month);
|
|
|
|
|
|
|
|
if (monthnum != -1)
|
|
|
|
*buf += 3;
|
|
|
|
|
|
|
|
return monthnum;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/* Return day number. */
|
|
|
|
int
|
2021-01-02 10:20:27 -05:00
|
|
|
parse_day(const char **date_p, char *end)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
2021-01-02 10:20:27 -05:00
|
|
|
const char *date = *date_p;
|
2005-09-15 09:58:31 -04:00
|
|
|
int day;
|
|
|
|
|
|
|
|
if ((end && date >= end) || !isdigit(*date))
|
|
|
|
return 32;
|
|
|
|
day = *date++ - '0';
|
|
|
|
|
|
|
|
if ((!end || date < end) && isdigit(*date)) {
|
|
|
|
day = day * 10 + *date++ - '0';
|
|
|
|
}
|
|
|
|
|
|
|
|
*date_p = date;
|
|
|
|
return day;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
2021-01-02 10:20:27 -05:00
|
|
|
parse_time(const char **time, struct tm *tm, char *end)
|
2005-09-15 09:58:31 -04:00
|
|
|
{
|
|
|
|
unsigned char h1, h2, m1, m2;
|
2021-01-02 10:20:27 -05:00
|
|
|
const char *date = *time;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
#define check_time(tm) \
|
|
|
|
((tm)->tm_hour <= 23 && (tm)->tm_min <= 59 && (tm)->tm_sec <= 59)
|
|
|
|
|
|
|
|
/* Eat HH:MM */
|
|
|
|
if (end && date + 5 > end)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
h1 = *date++; if (!isdigit(h1)) return 0;
|
|
|
|
h2 = *date++; if (!isdigit(h2)) return 0;
|
|
|
|
|
|
|
|
if (*date++ != ':') return 0;
|
|
|
|
|
|
|
|
m1 = *date++; if (!isdigit(m1)) return 0;
|
|
|
|
m2 = *date++; if (!isdigit(m2)) return 0;
|
|
|
|
|
|
|
|
tm->tm_hour = (h1 - '0') * 10 + h2 - '0';
|
|
|
|
tm->tm_min = (m1 - '0') * 10 + m2 - '0';
|
2008-02-27 06:24:58 -05:00
|
|
|
tm->tm_sec = 0;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
/* Eat :SS or [PA]M or nothing */
|
|
|
|
if (end && date + 2 >= end) {
|
|
|
|
*time = date;
|
|
|
|
return check_time(tm);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (*date == ':') {
|
|
|
|
unsigned char s1, s2;
|
|
|
|
|
|
|
|
date++;
|
|
|
|
|
|
|
|
if (end && date + 2 >= end)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
s1 = *date++; if (!isdigit(s1)) return 0;
|
|
|
|
s2 = *date++; if (!isdigit(s2)) return 0;
|
|
|
|
|
|
|
|
tm->tm_sec = (s1 - '0') * 10 + s2 - '0';
|
|
|
|
|
|
|
|
} else if (*date == 'A' || *date == 'P') {
|
|
|
|
/* Adjust hour from AM/PM. The sequence goes 11:00AM, 12:00PM,
|
|
|
|
* 01:00PM ... 11:00PM, 12:00AM, 01:00AM. --wget */
|
|
|
|
if (tm->tm_hour == 12)
|
|
|
|
tm->tm_hour = 0;
|
|
|
|
|
|
|
|
if (*date++ == 'P')
|
|
|
|
tm->tm_hour += 12;
|
|
|
|
|
|
|
|
if (*date++ != 'M')
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
*time = date;
|
|
|
|
|
|
|
|
return check_time(tm);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static time_t
|
|
|
|
my_timegm(struct tm *tm)
|
|
|
|
{
|
|
|
|
time_t t = 0;
|
|
|
|
|
|
|
|
/* Okay, the next part of the code is somehow problematic. Now, we use
|
|
|
|
* own code for calculating the number of seconds from 1.1.1970,
|
|
|
|
* brought here by SC from w3m. I don't like it a lot, but it's 100%
|
|
|
|
* portable, it's faster and it's shorter. --pasky */
|
|
|
|
#if 0
|
|
|
|
#ifdef HAVE_TIMEGM
|
|
|
|
t = timegm(tm);
|
|
|
|
#else
|
|
|
|
/* Since mktime thinks we have localtime, we need a wrapper
|
|
|
|
* to handle GMT. */
|
|
|
|
/* FIXME: It was reported that it doesn't work somewhere :/. */
|
|
|
|
{
|
2021-01-02 10:20:27 -05:00
|
|
|
char *tz = getenv("TZ");
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
if (tz && *tz) {
|
|
|
|
/* Temporary disable timezone in-place. */
|
|
|
|
unsigned char tmp = *tz;
|
|
|
|
|
|
|
|
*tz = '\0';
|
|
|
|
tzset();
|
|
|
|
|
|
|
|
t = mktime(tm);
|
|
|
|
|
|
|
|
*tz = tmp;
|
|
|
|
tzset();
|
|
|
|
|
|
|
|
} else {
|
|
|
|
/* Already GMT, cool! */
|
|
|
|
t = mktime(tm);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
#else
|
|
|
|
/* Following code was borrowed from w3m, and its developers probably
|
|
|
|
* borrowed it from somewhere else as well, altough they didn't bother
|
|
|
|
* to mention that. */ /* Actually, same code appears to be in lynx as
|
|
|
|
* well.. oh well. :) */
|
|
|
|
/* See README.timegm for explanation about how this works. */
|
|
|
|
tm->tm_mon -= 2;
|
|
|
|
if (tm->tm_mon < 0) {
|
|
|
|
tm->tm_mon += 12;
|
|
|
|
tm->tm_year--;
|
|
|
|
}
|
|
|
|
tm->tm_mon *= 153; tm->tm_mon += 2;
|
|
|
|
tm->tm_year -= 68;
|
|
|
|
|
2007-01-13 08:38:02 -05:00
|
|
|
/* Bug 924: Assumes all years divisible by 4 are leap years,
|
|
|
|
* even though e.g. 2100 is not. */
|
2005-09-15 09:58:31 -04:00
|
|
|
tm->tm_mday += tm->tm_year * 1461 / 4;
|
|
|
|
tm->tm_mday += ((tm->tm_mon / 5) - 672);
|
|
|
|
|
|
|
|
t = ((tm->tm_mday * 60 * 60 * 24) +
|
|
|
|
(tm->tm_hour * 60 * 60) +
|
|
|
|
(tm->tm_min * 60) +
|
|
|
|
tm->tm_sec);
|
|
|
|
#endif
|
|
|
|
|
|
|
|
if (t == (time_t) -1) return 0;
|
|
|
|
|
|
|
|
return t;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
time_t
|
2021-01-02 10:20:27 -05:00
|
|
|
parse_date(char **date_pos, char *end,
|
2005-09-15 09:58:31 -04:00
|
|
|
int update_pos, int skip_week_day)
|
|
|
|
{
|
|
|
|
#define skip_time_sep(date, end) \
|
|
|
|
do { \
|
2021-01-02 10:20:27 -05:00
|
|
|
const char *start = (date); \
|
2005-09-15 09:58:31 -04:00
|
|
|
while ((!(end) || (date) < (end)) \
|
|
|
|
&& (*(date) == ' ' || *(date) == '-')) \
|
|
|
|
(date)++; \
|
|
|
|
if (date == start) return 0; \
|
|
|
|
} while (0)
|
|
|
|
|
|
|
|
struct tm tm;
|
2021-01-02 10:20:27 -05:00
|
|
|
const char *date = (const char *) *date_pos;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
if (!date) return 0;
|
|
|
|
|
|
|
|
if (skip_week_day) {
|
|
|
|
/* Skip day-of-week */
|
|
|
|
for (; (!end || date < end) && *date != ' '; date++)
|
|
|
|
if (!*date) return 0;
|
|
|
|
|
|
|
|
/* As pasky said who cares if we allow '-'s here? */
|
|
|
|
skip_time_sep(date, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (isdigit(*date)) {
|
|
|
|
/* RFC 1036 / RFC 1123 */
|
|
|
|
|
|
|
|
/* Eat day */
|
|
|
|
|
|
|
|
/* date++; */
|
|
|
|
tm.tm_mday = parse_day(&date, end);
|
|
|
|
if (tm.tm_mday > 31) return 0;
|
|
|
|
|
|
|
|
skip_time_sep(date, end);
|
|
|
|
|
|
|
|
/* Eat month */
|
|
|
|
|
|
|
|
tm.tm_mon = parse_month(&date, end);
|
|
|
|
if (tm.tm_mon < 0) return 0;
|
|
|
|
|
|
|
|
skip_time_sep(date, end);
|
|
|
|
|
|
|
|
/* Eat year */
|
|
|
|
|
|
|
|
tm.tm_year = parse_year(&date, end);
|
|
|
|
if (tm.tm_year < 0) return 0;
|
|
|
|
|
|
|
|
skip_time_sep(date, end);
|
|
|
|
|
|
|
|
/* Eat time */
|
|
|
|
|
|
|
|
if (!parse_time(&date, &tm, end)) return 0;
|
|
|
|
|
|
|
|
} else {
|
|
|
|
/* ANSI C's asctime() format */
|
|
|
|
|
|
|
|
/* Eat month */
|
|
|
|
|
|
|
|
tm.tm_mon = parse_month(&date, end);
|
|
|
|
if (tm.tm_mon < 0) return 0;
|
|
|
|
|
|
|
|
/* I know, we shouldn't allow '-', but who cares ;). --pasky */
|
|
|
|
skip_time_sep(date, end);
|
|
|
|
|
|
|
|
/* Eat day */
|
|
|
|
|
|
|
|
tm.tm_mday = parse_day(&date, end);
|
|
|
|
if (tm.tm_mday > 31) return 0;
|
|
|
|
|
|
|
|
skip_time_sep(date, end);
|
|
|
|
|
|
|
|
/* Eat time */
|
|
|
|
|
|
|
|
if (!parse_time(&date, &tm, end)) return 0;
|
|
|
|
|
|
|
|
skip_time_sep(date, end);
|
|
|
|
|
|
|
|
/* Eat year */
|
|
|
|
|
|
|
|
tm.tm_year = parse_year(&date, end);
|
|
|
|
if (tm.tm_year < 0) return 0;
|
|
|
|
}
|
|
|
|
#undef skip_time_sep
|
|
|
|
|
|
|
|
if (update_pos)
|
2021-01-02 10:20:27 -05:00
|
|
|
*date_pos = (char *) date;
|
2005-09-15 09:58:31 -04:00
|
|
|
|
|
|
|
return (time_t) my_timegm(&tm);
|
|
|
|
}
|