hypermess/hypermail/src/struct.c - view

File: [Public] / hypermess / hypermail / src / struct.c
Revision 1.4: download - view: text, annotated - select for diffs
Fri Oct 29 15:40:08 1999 UTC (24 years, 7 months ago) by kahan
Branches: MAIN
CVS tags: HEAD

JK: upgrading to 2b26

/* ** Copyright (C) 1994, 1995 Enterprise Integration Technologies Corp. ** VeriFone Inc./Hewlett-Packard. All Rights Reserved. ** Kevin Hughes, kev@kevcom.com 3/11/94 ** Kent Landfield, kent@landfield.com 4/6/97 ** ** This program and library is free software; you can redistribute it and/or ** modify it under the terms of the GNU (Library) General Public License ** as published by the Free Software Foundation; either version 2 ** of the License, or any later version. ** ** This program is distributed in the hope that it will be useful, ** but WITHOUT ANY WARRANTY; without even the implied warranty of ** MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ** GNU (Library) General Public License for more details. ** ** You should have received a copy of the GNU (Library) General Public License ** along with this program; if not, write to the Free Software ** Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA */ /* Define the following define to enable better date debugging */ /*#define PH_DATE_DEBUG */ int rbs = 0; int rbs_bigtime = 0; #include "hypermail.h" #include "dmatch.h" #include "setup.h" #include "struct.h" struct body *hashnumlookup(int, struct emailinfo **); /* ** Ladies and germs - the hash function. */ unsigned hash(char *s) { unsigned hashval; /* We MUST deal with NULL pointers passed to this */ if (!s) return HASHSIZE - 1; /* (Daniel) I think a high value is fun ;-) */ for (hashval = 0; *s; s++) hashval = *s + 31 * hashval; return (hashval % HASHSIZE); } /* ** The structure most of everything else depends on. ** Hashes a message - header info, pointer to a list of body lines - ** by number, message ID, date, and subject, so an article can be ** handily looked up and retrieved using any of these criteria. */ struct emailinfo *addhash(int num, char *date, char *name, char *email, char *msgid, char *subject, char *inreply, char *fromdate, char *charset, char *isodate, char *isofromdate, struct body *sp) { struct emailinfo *e; struct hashemail *h; unsigned hashval; char numstr[NUMSTRLEN]; bool fromdate_valid = 1, date_valid = 1; bool msgid_dup = 0; bool msgid_missing = 0; static int freedummy = 0; char *newmsgid; if (!msgid) { /* SEVERE ERROR, all mails MUST have a Message-ID, ignore it! */ if (set_require_msgids) { printf ("Message-ID is missing, ignoring message with subject '%s'.\n", subject ? subject : "<unknown>"); return NULL; } else { msgid_missing = 1; } } if (!msgid_missing) { h = (struct hashemail *)etable[hash(msgid)]; while (h) { if (!strcmp(h->data->msgid, msgid)) { msgid_dup = 1; break; } h = h->next; } } if (msgid_dup && set_discard_dup_msgids) { printf ("%d: Message-ID collision, '%s' already present - discarding message.\n", num, msgid); return NULL; } if (msgid_dup || msgid_missing) { /* * This is broken. It needs to be corrected so that * the original message id is a component of the * generated message-id instead of a total unrelated * dummy msg-id. Good enough for now though... */ newmsgid = emalloc(MSGDSTRLEN); do { msgid_dup = 0; sprintf(newmsgid, "%d.%4.4d@hypermail.dummy", time(NULL), freedummy); h = (struct hashemail *)etable[hash(newmsgid)]; while (h) { if (!strcmp(h->data->msgid, newmsgid)) { msgid_dup = 1; break; } h = h->next; } freedummy++; } while (msgid_dup && (freedummy < 1000)); if (!msgid_dup) { if (msgid_missing) printf("\n%d Message-ID missing, using %s instead.\n", num, newmsgid); else printf("\n%d Message-ID collision, '%s' already present - using %s instead.\n", num, msgid, newmsgid); msgid = newmsgid; } else { if (msgid_missing) printf("\n%d Message-ID missing, failed to find free id - dropping message.\n", num); else printf ("\n%d Message-ID collision, '%s' already present - failed to find free id - dropping message.\n", num, msgid); return NULL; } } e = (struct emailinfo *)emalloc(sizeof(struct emailinfo)); e->msgnum = num; e->emailaddr = strsav(email); if ((name == NULL) || (*name == '\0')) e->name = strsav(email); else e->name = strsav(name); /* fromdate may be empty (zero length string rather than NULL) * date will always have something in it - either a date or * the NODATE string "(no date)" */ if (isodate != NULL && isofromdate != NULL) { e->date = iso_to_secs(isodate); e->fromdate = iso_to_secs(isofromdate); e->fromdatestr = strsav(fromdate); e->datestr = strsav(date); } else { if (!strcmp(date, NODATE)) { date_valid = 0; } else { if ((e->date = convtoyearsecs(date)) == -1) date_valid = 0; } if (!*fromdate) { fromdate_valid = 0; } else { if ((e->fromdate = convtoyearsecs(fromdate)) == -1) fromdate_valid = 0; } if (fromdate_valid && !date_valid) { #ifdef PH_DATE_DEBUG fprintf(stderr, "%d: %s: using fromdate '%s' for both (date '%s')\n", num, msgid, fromdate, date); #endif e->fromdatestr = strsav(fromdate); e->datestr = strsav(fromdate); e->date = e->fromdate; } else if (!fromdate_valid && date_valid) { #ifdef PH_DATE_DEBUG fprintf(stderr, "%d: %s: using date '%s' for both (fromdate '%s')\n", num, msgid, date, fromdate); #endif e->fromdatestr = strsav(date); e->datestr = strsav(date); e->fromdate = e->date; } else if (!fromdate_valid && !date_valid) { #ifdef PH_DATE_DEBUG fprintf(stderr, "%d: %s: fromdate '%s' and date '%s' both bad\n", num, msgid, fromdate, date); #endif e->fromdatestr = strsav(fromdate); e->datestr = strsav(date); } else { e->fromdatestr = strsav(fromdate); e->datestr = strsav(date); #ifdef PH_DATE_DEBUG if (e->date > e->fromdate) { rbs++; if ((e->date - e->fromdate) > 4200) { /* if more than 1:10 off */ char fromdate_parsed[26]; char date_parsed[26]; strcpy(fromdate_parsed, ctime(&(e->fromdate))); strcpy(date_parsed, ctime(&(e->date))); date_parsed[24] = '\0'; fromdate_parsed[24] = '\0'; rbs_bigtime++; fprintf(stderr, "%d [%d:%d]: %s: received before sent\n %-38.38s %-30.38s\n %-38.38s %-38.38s\n", num, rbs, rbs_bigtime, msgid, fromdate, date, fromdate_parsed, date_parsed); } } #endif } } e->msgid = strsav(msgid); e->subject = strsav(subject); e->inreplyto = strsav(inreply); e->charset = strsav(charset); e->flags = 0; e->bodylist = sp; /* Added by Daniel 1999-03-19, we need this hash later to find the mail we replied to */ h = (struct hashemail *)emalloc(sizeof(struct hashemail)); hashval = hash(inreply); h->next = etable[hashval]; h->data = e; etable[hashval] = h; h = (struct hashemail *)emalloc(sizeof(struct hashemail)); hashval = hash(date); h->next = etable[hashval]; h->data = e; etable[hashval] = h; h = (struct hashemail *)emalloc(sizeof(struct hashemail)); #if 0 printf("ADD msgid %s to HASH!\n", msgid); #endif hashval = hash(msgid); h->next = etable[hashval]; h->data = e; etable[hashval] = h; h = (struct hashemail *)emalloc(sizeof(struct hashemail)); hashval = hash(subject); h->next = etable[hashval]; h->data = e; etable[hashval] = h; h = (struct hashemail *)emalloc(sizeof(struct hashemail)); sprintf(numstr, "%d", num); hashval = hash(numstr); h->next = etable[hashval]; h->data = e; etable[hashval] = h; return e; /* the actual mail struct pointer */ } /* * Given an "in-reply-to:" field and a message number, this function * retrieves information about the message that this message is a * reply to. * If all else fails but a reply is * found by comparing subjects, issubjmatch is set to 1. * * Daniel 1999-03-19. Changed return type and parameters. */ struct emailinfo *hashreplylookup(int msgnum, char *inreply, int *issubjmatch) { struct hashemail *ep; #if DEBUG_THREAD fprintf(stderr, "hashreplylookup(%d, '%s'...)\n", msgnum, inreply); #endif *issubjmatch = 0; ep = etable[hash(inreply)]; while (ep) { if ((msgnum != ep->data->msgnum) && (strcmp(inreply, ep->data->msgid) == 0)) { #if DEBUG_THREAD fprintf(stderr, "match on msgid [%d]\n", ep->data->msgnum); #endif return ep->data; } ep = ep->next; } ep = etable[hash(inreply)]; while (ep != NULL) { if ((msgnum != ep->data->msgnum) && (strstr(inreply, ep->data->datestr))) { #if DEBUG_THREAD fprintf(stderr, "match on date [%d]\n", ep->data->msgnum); #endif return ep->data; } ep = ep->next; } ep = etable[hash(inreply)]; while (ep != NULL) { if ((msgnum != ep->data->msgnum) && (strcmp(inreply, ep->data->subject) == 0)) { *issubjmatch = 1; #if DEBUG_THREAD fprintf(stderr, "match on subject [%d]\n", ep->data->msgnum); #endif return ep->data; } ep = ep->next; } return NULL; } /* * Given an "message-id:" field, this tries to retrieve information * about an article that has replied. If all else fails but a reply is * found by comparing subjects, issubjmatch is set to 1. * * Daniel 1999-03-24. New. */ struct emailinfo *hashmsgidlookup(char *msgid, int *issubjmatch) { struct hashemail *ep; *issubjmatch = 0; ep = etable[hash(msgid)]; while (ep) { if (strcmp(msgid, ep->data->inreplyto) == 0) { return ep->data; } ep = ep->next; } return NULL; } /* ** Same as the above function, but only returns the article number. */ int hashreplynumlookup(int msgnum, char *inreply, char *subject, int *maybereply) { struct hashemail *ep; #if DEBUG_THREAD > 1 fprintf(stderr, "hashreplynumlookup(%d, '%s'...)\n", msgnum, (inreply == NULL) ? "" : inreply); #endif *maybereply = 0; if ((inreply != NULL) && *inreply) { ep = etable[hash(inreply)]; while (ep) { if (strcmp(inreply, ep->data->msgid) == 0) { #if DEBUG_THREAD fprintf(stderr, "match on msgid %4d %4d\n", msgnum, ep->data->msgnum); #endif return ep->data->msgnum; } ep = ep->next; } ep = etable[hash(inreply)]; while (ep) { if ((msgnum != ep->data->msgnum) && (strstr(inreply, ep->data->datestr))) { #if DEBUG_THREAD fprintf(stderr, "match on date %4d %4d\n", msgnum, ep->data->msgnum); #endif return ep->data->msgnum; } ep = ep->next; } ep = etable[hash(inreply)]; while (ep != NULL) { if ((msgnum != ep->data->msgnum) && (strcmp(inreply, ep->data->subject) == 0)) { *maybereply = 1; #if DEBUG_THREAD fprintf(stderr, "match on subject %4d %4d\n", msgnum, ep->data->msgnum); #endif return ep->data->msgnum; } ep = ep->next; } } /* end of matching on inreply */ /* No match so far. Now try matching on the subject, removing * one instance of "re: " from the front of the subject each * time round the loop. */ { char *s, *saved_s; int lowest_so_far = 60000; /* arbitrary high number - higher than number of messages in archive */ int match = 0; s = emalloc(strlen(subject) + 1); saved_s = strcpy(s, subject); do { #if DEBUG_THREAD > 1 fprintf(stderr, "extra %s\n", s); #endif ep = etable[hash(s)]; while (ep != NULL) { if ((strcasecmp(s, ep->data->subject) == 0) && (msgnum != ep->data->msgnum)) { match = 1; if (ep->data->msgnum < lowest_so_far) lowest_so_far = ep->data->msgnum; } ep = ep->next; } s = oneunre(s); } while (s != NULL); free(saved_s); if (match) { *maybereply = 1; if (lowest_so_far < msgnum) { #if DEBUG_THREAD fprintf(stderr, "match on extra %4d %4d\n", msgnum, lowest_so_far); #endif return lowest_so_far; } else { #if DEBUG_THREAD fprintf(stderr, "match on extra %4d %4d discarded - less than %d\n", msgnum, lowest_so_far, msgnum); #endif return -1; } } } #if DEBUG_THREAD fprintf(stderr, "match NO MATCH %4d\n", msgnum); #endif return -1; } /* * From an article's number, retrieve all information associated with * that article. */ struct body *hashnumlookup(int num, struct emailinfo **emailp) { struct hashemail *ep; char numstr[NUMSTRLEN]; sprintf(numstr, "%d", num); for (ep = etable[hash(numstr)]; ep != NULL; ep = ep->next) if (ep->data && (num == ep->data->msgnum)) { /* return a mere pointer to it! */ *emailp = ep->data; return ep->data->bodylist; } return NULL; } /* ** Add a line to a linked list that makes up a boundary stack. This new one ** should be the new "active" boundary. ** ** "Adding" a NULL will retrieve the formerly used boundary pointer. */ struct boundary *bound(struct boundary *bnd, char *line) { struct boundary *newnode = NULL; if (line) { newnode = (struct boundary *)emalloc(sizeof(struct boundary)); newnode->line = strsav(line); newnode->next = NULL; newnode->prev = bnd; if (bnd) bnd->next = newnode; bnd = newnode; } else { if (bnd->prev) { /* go back to the previous */ bnd = bnd->prev; /* free the latest one */ free(bnd->next->line); free(bnd->next); } else { /* this is the last node */ free(bnd->line); free(bnd); bnd = NULL; } } return bnd; /* the new "active" boundary */ } /* ** Add a line to a linked list that makes up an article's body. */ struct body *addbody(struct body *bp, struct body **lp, /* points to the last pointer */ char *line, int flags) { struct body *tempnode; struct body *newnode = NULL; if (!(flags & BODY_CONTINUE)) { newnode = (struct body *)emalloc(sizeof(struct body)); memset(newnode, 0, sizeof(struct body)); newnode->line = strsav(line); newnode->html = (flags & BODY_HTMLIZED) ? 1 : 0; newnode->header = (flags & BODY_HEADER) ? 1 : 0; newnode->attached = (flags & BODY_ATTACHED) ? 1 : 0; newnode->next = NULL; } if (bp == NULL) { bp = newnode; *lp = bp; } else { tempnode = *lp; /* get pointer right away */ if (flags & BODY_CONTINUE) { /* this is a continuation of the previous line */ int newlen; char *newbuf; /* get the new size + 1 for the terminating zero */ newlen = strlen(tempnode->line) + strlen(line) + 1; /* extend the former memory area: */ newbuf = (char *)realloc(tempnode->line, newlen); /* if successful, continue */ if (newbuf) { /* remove LF from the first part: */ char *lf; lf = strchr(newbuf, '\n'); if (lf) *lf = 0; /* append the new part */ strcat(newbuf, line); /* point out the new buffer instead */ tempnode->line = newbuf; } } else { tempnode->next = newnode; *lp = newnode; } } return bp; } /* ** Remove the last empty lines, if any, from an article body's linked list. */ int rmlastlines(struct body *bp) { struct body *tempnode; for (tempnode = bp; tempnode->next != NULL && (tempnode->next->line)[0] != '\0'; tempnode = tempnode->next); if ((tempnode->line)[0] == '\n') { (tempnode->line)[0] = '\0'; return 1; } return 0; } /* ** If a message is a reply to another, that message's number and the number of ** the message it may be referring to is put in this list. */ struct reply *addreply(struct reply *rp, int fromnum, struct emailinfo *email, int maybereply) { struct reply *tempnode, *newnode; newnode = (struct reply *)emalloc(sizeof(struct reply)); newnode->frommsgnum = fromnum; if (email == NULL) newnode->msgnum = -1; else newnode->msgnum = email->msgnum; newnode->data = email; newnode->maybereply = maybereply; newnode->next = NULL; if (!rp) rp = newnode; else { for (tempnode = rp; tempnode->next != NULL; tempnode = tempnode->next); tempnode->next = newnode; } return rp; } /* ** Mark an article number as having been printed. */ struct printed *markasprinted(struct printed *pp, int num) { struct printed *tempnode, *newnode; newnode = (struct printed *)emalloc(sizeof(struct printed)); newnode->msgnum = num; newnode->next = NULL; if (pp == NULL) pp = newnode; else { for (tempnode = pp; tempnode->next != NULL; tempnode = tempnode->next); tempnode->next = newnode; } return pp; } /* ** Has an article already been printed? */ int wasprinted(struct printed *list, int num) { struct printed *pp; for (pp = list; pp != NULL; pp = pp->next) if (pp->msgnum == num) return 1; return 0; } /* ** Add article header information to a binary tree and sort by date, ** subject, or author. This is necessary for printing the index files. */ struct header *addheader(struct header *hp, struct emailinfo *email, int sorttype) { int isbigger; long yearsecs; isbigger = 0; if (hp == NULL) { hp = (struct header *)emalloc(sizeof(struct header)); if (!hp) return NULL; hp->data = email; if (sorttype == 2) { yearsecs = hp->data->datenum = email->fromdate; if (!firstdatenum || yearsecs < firstdatenum) firstdatenum = yearsecs; if (yearsecs > lastdatenum) lastdatenum = yearsecs; } else hp->data->datenum = 0; hp->left = hp->right = NULL; return hp; } switch (sorttype) { case 1: isbigger = (strcasecmp(email->name, hp->data->name) > 0) ? 0 : 1; break; case 0: isbigger = (strcasecmp(email->unre_subject, hp->data->unre_subject) > 0) ? 0 : 1; break; case 2: yearsecs = email->fromdate; if (set_reverse) isbigger = (yearsecs < hp->data->datenum) ? 0 : 1; else isbigger = (yearsecs >= hp->data->datenum) ? 0 : 1; if (!firstdatenum || yearsecs < firstdatenum) firstdatenum = yearsecs; if (yearsecs > lastdatenum) lastdatenum = yearsecs; break; } if (isbigger) hp->left = addheader(hp->left, email, sorttype); else hp->right = addheader(hp->right, email, sorttype); return hp; } /* ** And Now The List Addition Routines! */ void print_list(char *listname, struct hmlist *list) { struct hmlist *tlist; int set = 0; int len = 0; int line = 0; /* Daniel remade Nov 23 1998. Use a single line as far as possible */ for (tlist = list; tlist != NULL; tlist = tlist->next) { set++; if (!line++) { printf("%s = ", listname); len = strlen(listname) + 3; } else { if (len + strlen(tlist->val) > 78) { printf("\n%s = ", listname); len = strlen(listname) + 3; } else { printf(","); len++; } } printf("%s", tlist->val); len += strlen(tlist->val); } if (!set) printf("%s: %s\n", listname, lang[MSG_NO_ELEMENTS]); else printf("\n"); } /* ** Is the requested element in the list ? */ int inlist(struct hmlist *listname, char *wildcard) { struct hmlist *tlist; for (tlist = listname; tlist != NULL; tlist = tlist->next) { /* wildcard checks enabled! */ if (Match(wildcard, tlist->val)) return 1; } return 0; } /* ** What is the position of the requested element in the list ? */ int inlist_pos(struct hmlist *listname, char *wildcard) { struct hmlist *tlist; int i; for (i = 0, tlist = listname; tlist != NULL; i++, tlist = tlist->next) { /* wildcard checks enabled! */ if (Match(wildcard, tlist->val)) return i; } return -1; } /* ** Add element to the specified list */ struct hmlist *add_2_list(struct hmlist *listname, char *value) { struct hmlist *tnode, *newnode; newnode = (struct hmlist *)emalloc(sizeof(struct hmlist)); newnode->val = strsav(value); newnode->next = NULL; if (listname == NULL) listname = newnode; else { for (tnode = listname; tnode->next != NULL; tnode = tnode->next); tnode->next = newnode; } return listname; } struct hmlist *add_list(struct hmlist *listname, char *value) { register char *cp; register char *valp; /* * This needs to support lists specified on a single line, such as * inline = image/jpeg image/gif ... * inline = image/jpeg,image/gif ... * as well as lists specified on multiple lines. */ valp = value; cp = valp; while (*cp) { if (*cp == ' ' || *cp == ',') { if (*valp != ' ' && *valp != ',') { *cp = '\0'; listname = add_2_list(listname, valp); } valp = cp + 1; } cp++; } if (*valp) listname = add_2_list(listname, valp); return listname; }