[net.sources] date <-> day-number software sought

wendt@bocklin.UUCP (06/28/85)

I'm looking for software capable of converting mm/dd/yy dates into
day numbers and back.  Has to work at least back to 1900 and forward
to 2100.  Has anybody got a biorythm program in C that I could
canabilize?  Reply here and thank you:

Alan Wendt
arizona!wendt

nrh@inmet.UUCP (07/03/85)

Here are two routines, jday.c and jdate.c that have served
me pretty well.  They are translations from ALGOL in Collected
Algorithms of CACM.
/*
** Takes a date, and returns a Julian day. A Julian day is the number of
** days since some base date  (in the very distant past).
** Handy for getting date of x number of days after a given Julian date
** (use jdate to get that from the Gregorian date).
** Author: Robert G. Tantzen, translator: Nat Howard
** Translated from the algol original in Collected Algorithms of CACM
** (This and jdate are algorithm 199).
*/
long
jday(mon, day, year)
int mon, day, year;
{
	long m = mon, d = day, y = year;
	long c, ya, j;

	if(m > 2) m -= 3;
	else {
		m += 9;
		--y;
	}
	c = y/100L;
	ya = y - (100L * c);
	j = (146097L * c) /4L + (1461L * ya) / 4L + (153L * m + 2L)/5L + d + 1721119L;
	return(j);
}
/* Julian date converter. Takes a julian date (the number of days since
** some distant epoch or other), and returns an int pointer to static space.
** ip[0] = month;
** ip[1] = day of month;
** ip[2] = year (actual year, like 1977, not 77 unless it was  77 a.d.);
** ip[3] = day of week (0->Sunday to 6->Saturday)
** These are Gregorian.
** Copied from Algorithm 199 in Collected algorithms of the CACM
** Author: Robert G. Tantzen, Translator: Nat Howard
*/
int *
jdate(j)
long j;
{
	static int ret[4];

	long d, m, y;

	ret[3] = (j + 1L)%7L;
	j -= 1721119L;
	y = (4L * j - 1L)/146097L;
	j = 4L * j - 1L - 146097L * y;
	d = j/4L;
	j = (4L * d + 3L)/1461L;
	d = 4L * d + 3L - 1461L * j;
	d = (d + 4L)/4L;
	m = (5L * d - 3L)/153L;
	d = 5L * d - 3 - 153L * m;
	d = (d + 5L) / 5L;
	y = 100L * y + j;
	if(m < 10) 
		m += 3;
	else {
		m -= 9;
		++y;
	}
	ret[0] =  m;
	ret[1] = d;
	ret[2] = y;
	return(ret);
}

root@bu-cs.UUCP (Barry Shein) (07/06/85)

Here's a string->tm converter that I wrote quite some time ago
that takes several forms of date input and heuristically tries
to figure out what it might be, more or less inspired by TOPS-20
(handles more date formats I think.)

This is what date(1) should have been built out of!

It's just one file, the comments should be enough to figure out
what is going on (very simple to interface, probably hairy to
modify tho.) Put it into a file called gdate.c

	-Barry Shein, Boston University

----------------shear here------------------
#include <stdio.h>
#include <ctype.h>
/*
 *	in 4.2bsd they moved time.h to <sys/time.h>
 */
#define BSD42
#ifdef BSD42
#include <sys/time.h>
#else
#include <time.h>
#endif
#define MAXTOK 20
/*
 * routines to turn a date from various formats to other formats
 *
 *	Primary interesting routine is gdate() which eats a date
 *	string of several common formats (see comment) and
 *	fills in a standard UNIX tm structure.
 **	Barry Shein, Boston University
 *	if you compile it -DDEBUG (with DEBUG defined) it will
 *	pull in a main() routine to run standalone for testing.
 */
#define AMBIG  -1	/* ambiguous month */
#define FALSE  -2	/* bad syntax	   */
char *months[] = {
	"january", "february", "march", "april", "may", "june", "july",
	"august", "september", "october", "november", "december", 0
} ;
char *dow[] = {
	"sunday", "monday", "tuesday", "wednesday", "thursday",
	"friday", "saturday", 0
} ;
/*
 *	known time-zone name list
 */
char *tz[] = 
{
	"adt", "ast", "edt", "est", "cdt", "cst", "mst", "mdt",
	"pdt", "pst", "gmt",
	0
} ;
char mdays[] = {
	31, 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31
} ;
lcase(c) register char c ;
{
	return(isupper(c) ? tolower(c) : c) ;
}
/*
 *  get a digit string from sp into bp (buffer) returning new sp
 */
char *
dstring(bp,sp) register char *sp, *bp  ;
{
	register int i = 0 ;
	while(isdigit(*sp))
		if(i++ == MAXTOK) break ;
		else *bp++ = *sp++ ;
	*bp = '\0' ;
	return(sp) ;
}
/*
 *  skip white space returning updated ptr
 */
char *
skipw(sp) register char *sp ;
{
	while(isspace(*sp) || *sp == '-') ++sp ;
	return(sp) ;
}
/*
 *  return how many chars of s1 prefix s2
 */
prefix(s1,s2) register char *s1, *s2 ;
{
	register int i = 0  ;

	for(; *s1 == *s2 ; s1++,s2++,i++)
		if(*s2 == '\0') break ;
	return(*s1 == '\0' ? i : 0) ;
}
/*
 *  look up str in list for non-ambiguous (prefix) match
 */
find(sp,lp) register char *sp, **lp ;
{
	int i,j,ambig = 0 ;
	register int k ;
	int ret  = FALSE ;

	for(i = 0,k = 0 ; *lp ; lp++,k++)
		if((j  = prefix(sp,*lp)) > i)
		{
			ambig = 0 ;
			i = j ;
			ret = k + 1 ;
		}
		else if(j && (i == j)) ++ambig ;
	return(ambig ? AMBIG : ret) ;
}
/*
 * like find but demands exact match
 */
lookup(sp,lp) register char *sp, **lp ;
{
	int i = 0 ;

	for(i=0 ; *lp ; lp++,i++)
		if(strcmp(sp,*lp) == 0) return(i+1) ;
	return(0) ;
}
/*
 * extract a token
 */
char *
extract(bp,sp) register char *bp, *sp ;
{
	register int i = 0 ;

	sp = skipw(sp) ;
	for(; isalnum(*sp); sp++)
		if(i++ == MAXTOK) break ;
		else *bp++ = lcase(*sp) ;
	*bp = '\0' ;
	return(sp) ;
}
/*
 *  fill up an area with a value (eg. zeros)
 */
fill(cp,c,n) register char *cp, c ; register int n ;
{
	while(n--) *cp++ = c ;
}

char *gdate(), *gtime() ;
long totime() ;
#if DEBUG
/*
 *  test driver
 *	translates first arg from command line (argv[1])
 *	and dumps out structure built.
 */
usage(sp) char *sp ;
{
	fprintf(stderr,"Usage: %s date\n",sp) ;
	exit(1) ;
}
main(argc,argv) int argc ; char **argv ;
{
	char *cp ;
	struct tm tm ;
	long t,t2 ;

	if(argc != 2) usage(*argv) ;
	if((cp = gdate(*++argv,&tm)) != NULL)
		printf("error: %s (%s)\n",*argv,cp) ;
	printf("year : %d month: %d day: %d\n",
		tm.tm_year,tm.tm_mon,tm.tm_mday);
	printf("day of month: %d hour: %d minute: %d second: %d\n",
		tm.tm_mday,tm.tm_hour,tm.tm_min,tm.tm_sec) ;
	printf("day of year: %d day of week: %d dst: %d\n",
		tm.tm_yday, tm.tm_wday, tm.tm_isdst) ;
	time(&t) ;
	t2 = totime(&tm) ;
	printf("%D %D %D\n",t,t2,t2-t) ;
	exit(0) ;
}
#endif	/* DEBUG */
/*
 *	gdate(date_str_ptr,time_buf_ptr)
 *	(see CTIME(3) in UPM for second arg format)
 *	takes many reasonable date strings and translates to
 *	the time-buf structure (integers)
 *
 *	formats (eg.):
 *		oct 19, 1983
 *		OcT 19, 1983 12:43
 *		oCt 19, 1983 12:43:33
 *		oct 19 1983 ...
 *		19 oct 83 ....
 *		10/19/83 12:43:33
 *		19-OCT-83 12:43:00 (DEC style)
 *		Wed Oct 19 12:43 EST 83 (UNIX style)
 *		oct. 19, 83 1:44 pm est
 *		831019124333	(see date(1))
 *	some variations on those themes also.
 *
 *	BUGS: probably a few (maybe some in the eye of the beholder)
 *		does not set dst flag (unless 'EDT' is in string)
 */
char *
gdate(sp,tp) register char *sp ; register struct tm *tp ;
{
	char buf[MAXTOK] ;

	fill(tp,'\0',sizeof *tp) ;
	sp = skipw(sp) ;
	if(isdigit(*sp))	/* either '7/12/83' or '12 jul 83' */
	{
		if(isdigit(sp[1]) && isdigit(sp[2])) /* UNIX yymmddhhmmss */
		{
			buf[2] = '\0' ;
			strncpy(buf,sp,2) ;
			tp->tm_year = atoi(buf) ;
			strncpy(buf,sp += 2,2) ;
			tp->tm_mon = atoi(buf) ;
			sp += 2 ;
			if(!isdigit(*sp)) goto badday ;
			strncpy(buf,sp,2) ;
			tp->tm_mday = atoi(buf) ;
			sp += 2 ;
			if(!isdigit(*sp)) goto check ;
			strncpy(buf,sp,2) ;
			tp->tm_hour ;
			sp += 2 ;
			if(!isdigit(*sp)) goto check ;
			strncpy(buf,sp,2) ;
			tp->tm_min = atoi(buf) ;
			sp += 2 ;
			if(!isdigit(*sp)) goto check ;
			strncpy(buf,sp,2) ;
			tp->tm_min = atoi(buf) ;
			goto check ;
		}
		sp = dstring(buf,sp) ;
		sp = skipw(sp) ;
		if(*sp == '/')	/* must be '7/12/83' */
		{
			if((tp->tm_mon = atoi(buf)) < 1 || (tp->tm_mon > 12))
			{
				tp->tm_mon = FALSE ;
				goto badmon ;
			}
			sp = skipw(++sp) ;
			if(!isdigit(*sp)) goto badday ;
			sp = dstring(buf,sp) ;
			tp->tm_mday = atoi(buf) ;

			sp = skipw(sp) ;
			if(*sp != '/') goto badyr ;
			sp = skipw(++sp) ;
			if(!isdigit(*sp)) goto badyr ;
			sp = dstring(buf,sp) ;
			tp->tm_year = atoi(buf) ;

			sp = gtime(sp,tp) ;
		}
		else
		{
			/*
			 * must be '12 jul 83'
			 */
			tp->tm_mday = atoi(buf) ;

			sp = extract(buf,sp) ;
			if((tp->tm_mon = find(buf,months)) < 1) goto badmon ;

			if(*sp == '.') ++sp ;
			sp = skipw(sp) ;

			if(!isdigit(*sp)) goto badyr ;
			sp = dstring(buf,sp) ;
			tp->tm_year = atoi(buf) ;

			sp = gtime(sp,tp) ;
		}
	}
	else
	{
		int flag = 0 ;	/* used to indicate looking for UNIX style */

		/*
		 * either 'jul 12 83' or (UNIX) Wed jul 12 18:33 EST 1983
		 */
		sp = extract(buf,sp) ;
		if(find(buf,dow) > 0)
		{
			sp = extract(buf,sp) ;
			++flag ;
		}

		if((tp->tm_mon = find(buf,months)) < 1) goto badmon ;

		if(*sp == '.') ++sp ;
		sp = skipw(sp) ;

		if(!isdigit(*sp)) goto badday ;
		sp = dstring(buf,sp) ;
		tp->tm_mday = atoi(buf) ;

		sp = skipw(sp) ;
		if(*sp == ',') sp++ ;
		sp = skipw(sp) ;

		if(flag) sp = skipw(gtime(sp,tp)) ;

		if(!isdigit(*sp)) goto badyr ;
		sp = dstring(buf,sp) ;
		tp->tm_year = atoi(buf) ;

		if(!flag) sp = gtime(sp,tp) ;
	}
check:
	/*
	 * check for ridiculous numbers
	 */
	if(tp->tm_mday < 1) goto badday ;
	if(tp->tm_mday > mdays[tp->tm_mon-1])
		if(!((tp->tm_mon == 2) &&	/* check for Feb 29 */
			(tp->tm_mday == 29) && (days(tp->tm_year) == 365) ))
				goto badday ;
	if(tp->tm_year >= 1900) tp->tm_year -= 1900 ;
	if(tp->tm_hour > 23)
	{
		tp->tm_hour = FALSE ;
		return(sp) ;
	}
	if(tp->tm_min > 59)
	{
		tp->tm_hour = FALSE ;
		return(sp) ;
	}
	if(tp->tm_sec > 59)
	{
		tp->tm_sec = FALSE ;
		return(sp) ;
	}
	/*
	 *	fill in day of year, day of week (these calls must be
	 *	in this order as dowk() needs doyr()
	 */

	doyr(tp) ;
	dowk(tp) ;
	/*
	 * all done !
	 */
	return(NULL) ;
badday :
	tp->tm_mday = FALSE ;
	return(sp) ;
badmon :
	return(sp) ;
badyr :
	tp->tm_year = FALSE ;
	return(sp) ;
}
/*
 *  get  hh:mm:ss
 */
char *
gtime(sp,tp) register char *sp ; register struct tm *tp ;
{
	char buf[MAXTOK],*cp ;

	sp = skipw(sp) ;
	if(isdigit(*sp))
	{
		sp = dstring(buf,sp) ;
		tp->tm_hour = atoi(buf) ;
		sp = skipw(sp) ;
		if(*sp == ':') sp = skipw(++sp) ;
		else goto out ;
		if(isdigit(*sp))
		{
			sp = dstring(buf,sp) ;
			tp->tm_min = atoi(buf) ;
			sp = skipw(sp) ;
			if(*sp == ':') sp = skipw(++sp) ;
			else goto out ;
			if(isdigit(*sp))
			{
				sp = dstring(buf,sp) ;
				tp->tm_sec = atoi(buf) ;
			}
		}
	}
out :
	sp = skipw(sp) ;
	if(isalpha(*sp))	/* PM:AM or time zone or both */
	{
		cp = extract(buf,sp) ;
		if(strcmp(buf,"am") == 0 || strcmp(buf,"pm") == 0)
		{
			if(buf[0] == 'p' && tp->tm_hour < 12)
				tp->tm_hour += 12 ;
			sp = cp = skipw(cp) ;
			cp = extract(buf,cp) ;
		}
		if(lookup(buf,tz))
		{
			if(buf[1] == 'd') tp->tm_isdst++ ;
			sp = skipw(cp) ;
		}
	}
	return(sp) ;
}
/*
 *	Ok, you were all wondering so here it is folks...
 *	THE LEAP YEAR CALCULATION
 *	note: does not take into account 1752.
 */
days(y) register int y ;
{
	if(y < 1970) y += 1900 ;
	if(((y % 4) == 0) && ( (y % 100) || ((y % 400)==0) )) y = 366 ;
	else y = 365 ;
	return(y) ;
}
#include <sys/types.h>
#include <sys/timeb.h>
/*
 *	translate a time.h structure to seconds since 1/1/70
 *	(ie. UNIX internal time format...GMT)
 */
long
totime(tp) register struct tm *tp ;
{
	long ret = 0 ;
	int i,j ;
	struct timeb tb ;

	if(tp->tm_year < 70) return(0) ;
	for(i=1970,j=tp->tm_year+1900 ; i<j ; i++)
		ret += days(i) ;
	for(i=1 ; i < tp->tm_mon ; i++)
		ret += mdays[i-1] ;
	if((days(tp->tm_year) == 366) && (tp->tm_mon > 2)) ++ret ;
	ret += (tp->tm_mday - 1) ;
	ret *= 24 ;
	ret += tp->tm_hour ;
	ret *= 60 ;
	ftime(&tb) ;
	ret += (tp->tm_min + tb.timezone) ;
	ret *= 60 ;
	ret += tp->tm_sec ;
	return(ret) ;
}
/*
 *	return day of the week
 *	of jan 1 of given year
 */

jan1(yr)
{
	register y, d;

/*
 *	normal gregorian calendar
 *	one extra day per four years
 */

	y = yr;
	d = 4+y+(y+3)/4;

/*
 *	julian calendar
 *	regular gregorian
 *	less three days per 400
 */

	if(y > 1800) {
		d -= (y-1701)/100;
		d += (y-1601)/400;
	}

/*
 *	take care of weirdness at 1752.
 */

	if(y > 1752)
		d += 3;

	return(d%7);
}
/*
 *	given day of year and year calculate and insert day-of-week (0..6)
 */
dowk(tp) register struct tm *tp ;
{
	tp->tm_wday = (jan1(tp->tm_year+1900) + tp->tm_yday) % 7 ;
}
/*
 *	calculate day of year from year
 */
doyr(tp) register struct tm *tp ;
{
	register int i,j ;

	j = ((tp->tm_mon > 2) && (days(tp->tm_year) == 366)) ? 1 : 0 ;
	for(i=1 ; i < tp->tm_mon ; i++)
		j += mdays[i-1] ;
	tp->tm_yday = j + tp->tm_mday - 1 ;
}

honey@down.FUN (Peter Honeyman) (07/08/85)

along similar lines, here's a program (fragment) that converts a date
string to the obvious integer.  the scope of getdate() is unknown to
me, but i use this on ctime format date strings regularly.
	peter

/*
 * emitc -- convert time into an int.  compile with
 * getdate.o, which can be found with netnews source.
 */

#include <stdio.h>
#include <sys/types.h>
#include <sys/timeb.h>

main(argc, argv)
char	**argv;
{
	if (argc == 1)
		printf("%ld\n", time((time_t *) 0));
	else {
		char	buf[BUFSIZ], *bptr = buf;

		*bptr = 0;
		while (--argc) {
			strcpy(bptr, *++argv);
			bptr += strlen(bptr);
			*bptr++ = ' ';
		}
		*--bptr = 0;
		printf("%ld\n", getdate(buf, (struct timeb *) 0));
	}
	exit(0);
}