NEWS: v14.5
[s-mailx.git] / thread.c
blob923320d0d3dd1c67f456a3d0265a95da86a796fa
1 /*@ S-nail - a mail user agent derived from Berkeley Mail.
2 *@ Message threading.
4 * Copyright (c) 2000-2004 Gunnar Ritter, Freiburg i. Br., Germany.
5 * Copyright (c) 2012 - 2013 Steffen "Daode" Nurpmeso <sdaoden@users.sf.net>.
6 */
7 /*
8 * Copyright (c) 2004
9 * Gunnar Ritter. All rights reserved.
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. All advertising materials mentioning features or use of this software
20 * must display the following acknowledgement:
21 * This product includes software developed by Gunnar Ritter
22 * and his contributors.
23 * 4. Neither the name of Gunnar Ritter nor the names of his contributors
24 * may be used to endorse or promote products derived from this software
25 * without specific prior written permission.
27 * THIS SOFTWARE IS PROVIDED BY GUNNAR RITTER AND CONTRIBUTORS ``AS IS'' AND
28 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 * ARE DISCLAIMED. IN NO EVENT SHALL GUNNAR RITTER OR CONTRIBUTORS BE LIABLE
31 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
37 * SUCH DAMAGE.
40 #ifndef HAVE_AMALGAMATION
41 # include "nail.h"
42 #endif
/*
 * Open addressing is used for Message-IDs because the maximum number of
 * messages in the table is known in advance (== msgCount).
 *
 * One slot of that table. A slot whose mi_id is NULL is unused.
 */
struct mitem {
	struct message	*mi_data;	/* message registered under mi_id */
	char		*mi_id;		/* Message-ID string, NULL if slot is free */
};
/*
 * One element of the array handed to qsort(3): a sort key plus the index
 * of the message it belongs to. Which union member is valid depends on
 * the comparison function that is used with the array.
 */
struct msort {
	union {
#ifdef HAVE_SPAM
		ui_it	ms_ui;		/* key for muilt() */
#endif
		long	ms_long;	/* key for mlonglt() */
		char	*ms_char;	/* key for mcharlt() */
	} ms_u;
	int	ms_n;			/* index into the message array */
};
/* Message-ID hash table */
static unsigned		mhash(const char *cp, int mprime);
static struct mitem	*mlook(char *id, struct mitem *mt,
				struct message *mdata, int mprime);

/* Thread tree construction */
static void		adopt(struct message *parent, struct message *child,
				int dist);
static struct message	*interlink(struct message *m, long cnt, int nmail);
static void		finalize(struct message *mp);

/* qsort(3) comparison functions for struct msort */
#ifdef HAVE_SPAM
static int		muilt(void const *a, void const *b);
#endif
static int		mlonglt(const void *a, const void *b);
static int		mcharlt(const void *a, const void *b);

static void		lookup(struct message *m, struct mitem *mi, int mprime);
static void		makethreads(struct message *m, long cnt, int nmail);
static char const	*skipre(char const *cp);

/* Collapsing and uncollapsing of threads */
static int		colpt(int *msgvec, int cl);
static void		colps(struct message *b, int cl);
static void		colpm(struct message *m, int cl, int *cc, int *uc);
/*
 * Return the hash value for a message id modulo mprime, or mprime
 * if the passed string does not look like a message-id.
 *
 * cp		NUL-terminated candidate Message-ID string.
 * mprime	modulus of the hash; also the "not a message-id" result.
 *
 * A string only counts as a message-id if at least one '@' was hashed.
 * Parenthesised comments, double quotes and backslashes do not contribute
 * to the hash; every other byte is passed through lowerconv() first.
 */
static unsigned
mhash(const char *cp, int mprime)
{
	unsigned	h = 0, g, at = 0;

	/*
	 * A plain forward loop is used so that cp never points in front of
	 * the string it was handed.
	 */
	for (; *cp != '\0'; cp++) {
		/*
		 * Pay attention not to hash characters which are
		 * irrelevant for Message-ID semantics.
		 */
		if (*cp == '(') {
			/* the loop increment steps onto skip_comment()'s result */
			cp = skip_comment(&cp[1]) - 1;
			continue;
		}
		if (*cp == '"' || *cp == '\\')
			continue;
		if (*cp == '@')
			at++;
		h = ((h << 4) & 0xffffffff) + lowerconv(*cp & 0377);
		/* fold the top four bits back into the low bits */
		if ((g = h & 0xf0000000) != 0) {
			h = h ^ (g >> 24);
			h = h ^ g;
		}
	}
	return at ? h % (unsigned int)mprime : (unsigned int)mprime;
}
115 #define NOT_AN_ID ((struct mitem *)-1)
118 * Look up a message id. Returns NOT_AN_ID if the passed string does
119 * not look like a message-id.
121 static struct mitem *
122 mlook(char *id, struct mitem *mt, struct message *mdata, int mprime)
124 struct mitem *mp;
125 unsigned h, c, n = 0;
127 if (id == NULL && (id = hfield1("message-id", mdata)) == NULL)
128 return NULL;
129 if (mdata && mdata->m_idhash)
130 h = ~mdata->m_idhash;
131 else {
132 h = mhash(id, mprime);
133 if (h == (unsigned int)mprime)
134 return NOT_AN_ID;
136 mp = &mt[c = h];
137 while (mp->mi_id != NULL) {
138 if (msgidcmp(mp->mi_id, id) == 0)
139 break;
140 c += n&1 ? -((n+1)/2) * ((n+1)/2) : ((n+1)/2) * ((n+1)/2);
141 n++;
142 while (c >= (unsigned int)mprime)
143 c -= mprime;
144 mp = &mt[c];
146 if (mdata != NULL && mp->mi_id == NULL) {
147 mp->mi_id = id;
148 mp->mi_data = mdata;
149 mdata->m_idhash = ~h;
151 return mp->mi_id ? mp : NULL;
/*
 * Child is to be adopted by parent. A thread tree is structured
 * as follows:
 *
 *  ------       m_child       ------        m_child
 *  |    |-------------------->|    |------------------------> . . .
 *  |    |<--------------------|    |<-----------------------  . . .
 *  ------      m_parent       ------       m_parent
 *     ^^                       |  ^
 *     | \____        m_younger |  |
 *     |      \                 |  |
 *     |       ----             |  |
 *     |           \            |  | m_elder
 *     |   m_parent ----        |  |
 *     |                \       |  |
 *     |                 ----   |  |
 *     |                     \  +  |
 *     |                       ------        m_child
 *     |                       |    |------------------------> . . .
 *     |                       |    |<-----------------------  . . .
 *     |                       ------       m_parent
 *     |                        |  ^
 *     \-----         m_younger |  |
 *           \                  |  |
 *            ----              |  |
 *                \             |  | m_elder
 *        m_parent ----         |  |
 *                     \        |  |
 *                      ----    |  |
 *                          \   +  |
 *                             ------        m_child
 *                             |    |------------------------> . . .
 *                             |    |<-----------------------  . . .
 *                             ------       m_parent
 *                              |  ^
 *                              . . .
 *
 * The base message of a thread does not have an m_parent link. Elements
 * connected by m_younger/m_elder links are replies to the same message,
 * which is connected to them by m_parent links. The first reply to a
 * message gets the m_child link.
 */
196 static void
197 adopt(struct message *parent, struct message *child, int dist)
199 struct message *mp, *mq;
201 for (mp = parent; mp; mp = mp->m_parent)
202 if (mp == child)
203 return;
204 child->m_level = dist; /* temporarily store distance */
205 child->m_parent = parent;
206 if (parent->m_child != NULL) {
207 mq = NULL;
208 for (mp = parent->m_child; mp; mp = mp->m_younger) {
209 if (mp->m_date >= child->m_date) {
210 if (mp->m_elder)
211 mp->m_elder->m_younger = child;
212 child->m_elder = mp->m_elder;
213 mp->m_elder = child;
214 child->m_younger = mp;
215 if (mp == parent->m_child)
216 parent->m_child = child;
217 return;
219 mq = mp;
221 mq->m_younger = child;
222 child->m_elder = mq;
223 } else
224 parent->m_child = child;
228 * Connect all messages on the lowest thread level with m_younger/m_elder
229 * links.
231 static struct message *
232 interlink(struct message *m, long cnt, int nmail)
234 int i;
235 long n;
236 struct msort *ms;
237 struct message *root;
238 int autocollapse = !nmail && !(inhook&2) &&
239 value("autocollapse") != NULL;
241 ms = smalloc(sizeof *ms * cnt);
242 for (n = 0, i = 0; i < cnt; i++) {
243 if (m[i].m_parent == NULL) {
244 if (autocollapse)
245 colps(&m[i], 1);
246 ms[n].ms_u.ms_long = m[i].m_date;
247 ms[n].ms_n = i;
248 n++;
251 if (n > 0) {
252 qsort(ms, n, sizeof *ms, mlonglt);
253 root = &m[ms[0].ms_n];
254 for (i = 1; i < n; i++) {
255 m[ms[i-1].ms_n].m_younger = &m[ms[i].ms_n];
256 m[ms[i].ms_n].m_elder = &m[ms[i-1].ms_n];
258 } else
259 root = &m[0];
260 free(ms);
261 return root;
264 static void
265 finalize(struct message *mp)
267 long n;
269 for (n = 0; mp; mp = next_in_thread(mp)) {
270 mp->m_threadpos = ++n;
271 mp->m_level = mp->m_parent ?
272 mp->m_level + mp->m_parent->m_level : 0;
#ifdef HAVE_SPAM
/*
 * qsort(3) comparison function for struct msort entries keyed by
 * ms_u.ms_ui; equal keys are ordered by ms_n.
 * The keys are compared directly: a difference narrowed to int does not
 * reliably carry the sign of the comparison for large key differences.
 */
static int
muilt(void const *a, void const *b)
{
	struct msort const	*xa = a, *xb = b;

	if (xa->ms_u.ms_ui < xb->ms_u.ms_ui)
		return -1;
	if (xa->ms_u.ms_ui > xb->ms_u.ms_ui)
		return 1;
	return xa->ms_n - xb->ms_n;
}
#endif
290 static int
291 mlonglt(const void *a, const void *b)
293 struct msort const *xa = a, *xb = b;
294 int i;
296 i = (int)(xa->ms_u.ms_long - xb->ms_u.ms_long);
297 if (i == 0)
298 i = xa->ms_n - xb->ms_n;
299 return i;
302 static int
303 mcharlt(const void *a, const void *b)
305 struct msort const *xa = a, *xb = b;
306 int i;
308 i = strcoll(xa->ms_u.ms_char, xb->ms_u.ms_char);
309 if (i == 0)
310 i = xa->ms_n - xb->ms_n;
311 return i;
314 static void
315 lookup(struct message *m, struct mitem *mi, int mprime)
317 struct name *np;
318 struct mitem *ip;
319 char *cp;
320 long dist;
322 if (m->m_flag & MHIDDEN)
323 return;
324 dist = 1;
325 if ((cp = hfield1("in-reply-to", m)) != NULL) {
326 if ((np = extract(cp, GREF)) != NULL)
327 do {
328 if ((ip = mlook(np->n_name, mi, NULL, mprime))
329 != NULL && ip != NOT_AN_ID) {
330 adopt(ip->mi_data, m, 1);
331 return;
333 } while ((np = np->n_flink) != NULL);
335 if ((cp = hfield1("references", m)) != NULL) {
336 if ((np = extract(cp, GREF)) != NULL) {
337 while (np->n_flink != NULL)
338 np = np->n_flink;
339 do {
340 if ((ip = mlook(np->n_name, mi, NULL, mprime))
341 != NULL) {
342 if (ip == NOT_AN_ID)
343 continue; /* skip dist++ */
344 adopt(ip->mi_data, m, dist);
345 return;
347 dist++;
348 } while ((np = np->n_blink) != NULL);
353 static void
354 makethreads(struct message *m, long cnt, int nmail)
356 struct mitem *mt;
357 char *cp;
358 long i, mprime;
360 if (cnt == 0)
361 return;
362 mprime = nextprime(cnt);
363 mt = scalloc(mprime, sizeof *mt);
364 for (i = 0; i < cnt; i++) {
365 if ((m[i].m_flag&MHIDDEN) == 0) {
366 mlook(NULL, mt, &m[i], mprime);
367 if (m[i].m_date == 0) {
368 if ((cp = hfield1("date", &m[i])) != NULL)
369 m[i].m_date = rfctime(cp);
372 m[i].m_child = m[i].m_younger = m[i].m_elder =
373 m[i].m_parent = NULL;
374 m[i].m_level = 0;
375 if (!nmail && !(inhook&2))
376 m[i].m_collapsed = 0;
379 * Most folders contain the eldest messages first. Traversing
380 * them in descending order makes it more likely that younger
381 * brothers are found first, so elder ones can be prepended to
382 * the brother list, which is faster. The worst case is still
383 * in O(n^2) and occurs when all but one messages in a folder
384 * are replies to the one message, and are sorted such that
385 * youngest messages occur first.
387 for (i = cnt-1; i >= 0; i--)
388 lookup(&m[i], mt, mprime);
389 threadroot = interlink(m, cnt, nmail);
390 finalize(threadroot);
391 free(mt);
392 mb.mb_threaded = 1;
395 FL int
396 thread(void *vp)
398 if (mb.mb_threaded != 1 || vp == NULL || vp == (void *)-1) {
399 #ifdef HAVE_IMAP
400 if (mb.mb_type == MB_IMAP)
401 imap_getheaders(1, msgCount);
402 #endif
403 makethreads(message, msgCount, vp == (void *)-1);
404 if (mb.mb_sorted != NULL)
405 free(mb.mb_sorted);
406 mb.mb_sorted = sstrdup("thread");
408 if (vp && vp != (void *)-1 && !inhook && value("header"))
409 return headers(vp);
410 return 0;
413 FL int
414 unthread(void *vp)
416 struct message *m;
418 mb.mb_threaded = 0;
419 free(mb.mb_sorted);
420 mb.mb_sorted = NULL;
421 for (m = &message[0]; m < &message[msgCount]; m++)
422 m->m_collapsed = 0;
423 if (vp && !inhook && value("header"))
424 return headers(vp);
425 return 0;
428 FL struct message *
429 next_in_thread(struct message *mp)
431 if (mp->m_child)
432 return mp->m_child;
433 if (mp->m_younger)
434 return mp->m_younger;
435 while (mp->m_parent) {
436 if (mp->m_parent->m_younger)
437 return mp->m_parent->m_younger;
438 mp = mp->m_parent;
440 return NULL;
443 FL struct message *
444 prev_in_thread(struct message *mp)
446 if (mp->m_elder) {
447 mp = mp->m_elder;
448 while (mp->m_child) {
449 mp = mp->m_child;
450 while (mp->m_younger)
451 mp = mp->m_younger;
453 return mp;
455 return mp->m_parent;
458 FL struct message *
459 this_in_thread(struct message *mp, long n)
461 struct message *mq;
463 if (n == -1) { /* find end of thread */
464 while (mp) {
465 if (mp->m_younger) {
466 mp = mp->m_younger;
467 continue;
469 mq = next_in_thread(mp);
470 if (mq == NULL || mq->m_threadpos < mp->m_threadpos)
471 return mp;
472 mp = mq;
474 return NULL;
476 while (mp && mp->m_threadpos < n) {
477 if (mp->m_younger && mp->m_younger->m_threadpos <= n) {
478 mp = mp->m_younger;
479 continue;
481 mp = next_in_thread(mp);
483 return mp && mp->m_threadpos == n ? mp : NULL;
487 * Sorted mode is internally just a variant of threaded mode with all
488 * m_parent and m_child links being NULL.
490 FL int
491 sort(void *vp)
493 enum method {
494 SORT_SUBJECT,
495 SORT_DATE,
496 SORT_STATUS,
497 SORT_SIZE,
498 SORT_FROM,
499 SORT_TO,
500 #ifdef HAVE_SPAM
501 SORT_SPAM,
502 #endif
503 SORT_THREAD
504 } method;
505 struct {
506 const char *me_name;
507 enum method me_method;
508 int (*me_func)(const void *, const void *);
509 } methnames[] = {
510 { "date", SORT_DATE, mlonglt },
511 { "from", SORT_FROM, mcharlt },
512 { "to", SORT_TO, mcharlt },
513 { "subject", SORT_SUBJECT, mcharlt },
514 { "size", SORT_SIZE, mlonglt },
515 #ifdef HAVE_SPAM
516 { "spam", SORT_SPAM, muilt },
517 #endif
518 { "status", SORT_STATUS, mlonglt },
519 { "thread", SORT_THREAD, NULL },
520 { NULL, -1, NULL }
522 char **args = (char **)vp, *cp, *_args[2];
523 int (*func)(const void *, const void *);
524 struct msort *ms;
525 struct str in, out;
526 int i, n, msgvec[2];
527 int showname = value("showname") != NULL;
528 struct message *mp;
530 msgvec[0] = dot - &message[0] + 1;
531 msgvec[1] = 0;
532 if (vp == NULL || vp == (void *)-1) {
533 _args[0] = savestr(mb.mb_sorted);
534 _args[1] = NULL;
535 args = _args;
536 } else if (args[0] == NULL) {
537 printf("Current sorting criterion is: %s\n",
538 mb.mb_sorted ? mb.mb_sorted : "unsorted");
539 return 0;
541 for (i = 0; methnames[i].me_name; i++)
542 if (*args[0] && is_prefix(args[0], methnames[i].me_name))
543 break;
544 if (methnames[i].me_name == NULL) {
545 fprintf(stderr, "Unknown sorting method \"%s\"\n", args[0]);
546 return 1;
548 method = methnames[i].me_method;
549 func = methnames[i].me_func;
550 free(mb.mb_sorted);
551 mb.mb_sorted = sstrdup(args[0]);
552 if (method == SORT_THREAD)
553 return thread(vp && vp != (void *)-1 ? msgvec : vp);
554 ms = ac_alloc(sizeof *ms * msgCount);
555 switch (method) {
556 case SORT_SUBJECT:
557 case SORT_DATE:
558 case SORT_FROM:
559 case SORT_TO:
560 #ifdef HAVE_IMAP
561 if (mb.mb_type == MB_IMAP)
562 imap_getheaders(1, msgCount);
563 #endif
564 break;
565 default:
566 break;
568 for (n = 0, i = 0; i < msgCount; i++) {
569 mp = &message[i];
570 if ((mp->m_flag&MHIDDEN) == 0) {
571 switch (method) {
572 case SORT_DATE:
573 if (mp->m_date == 0 &&
574 (cp = hfield1("date", mp)) != 0)
575 mp->m_date = rfctime(cp);
576 ms[n].ms_u.ms_long = mp->m_date;
577 break;
578 case SORT_STATUS:
579 if (mp->m_flag & MDELETED)
580 ms[n].ms_u.ms_long = 1;
581 else if ((mp->m_flag&(MNEW|MREAD)) == MNEW)
582 ms[n].ms_u.ms_long = 90;
583 else if (mp->m_flag & MFLAGGED)
584 ms[n].ms_u.ms_long = 85;
585 else if ((mp->m_flag&(MNEW|MBOX)) == MBOX)
586 ms[n].ms_u.ms_long = 70;
587 else if (mp->m_flag & MNEW)
588 ms[n].ms_u.ms_long = 80;
589 else if (mp->m_flag & MREAD)
590 ms[n].ms_u.ms_long = 40;
591 else
592 ms[n].ms_u.ms_long = 60;
593 break;
594 case SORT_SIZE:
595 ms[n].ms_u.ms_long = mp->m_xsize;
596 break;
597 #ifdef HAVE_SPAM
598 case SORT_SPAM:
599 ms[n].ms_u.ms_ui = mp->m_spamscore;
600 break;
601 #endif
602 case SORT_FROM:
603 case SORT_TO:
604 if ((cp = hfield1(method == SORT_FROM ?
605 "from" : "to", mp)) != NULL) {
606 ms[n].ms_u.ms_char = showname ?
607 realname(cp) : skin(cp);
608 makelow(ms[n].ms_u.ms_char);
609 } else
610 ms[n].ms_u.ms_char = UNCONST("");
611 break;
612 default:
613 case SORT_SUBJECT:
614 if ((cp = hfield1("subject", mp)) != NULL) {
615 in.s = cp;
616 in.l = strlen(in.s);
617 mime_fromhdr(&in, &out, TD_ICONV);
618 ms[n].ms_u.ms_char =
619 savestr(skipre(out.s));
620 free(out.s);
621 makelow(ms[n].ms_u.ms_char);
622 } else
623 ms[n].ms_u.ms_char = UNCONST("");
624 break;
626 ms[n++].ms_n = i;
628 mp->m_child = mp->m_younger = mp->m_elder = mp->m_parent = NULL;
629 mp->m_level = 0;
630 mp->m_collapsed = 0;
632 if (n > 0) {
633 qsort(ms, n, sizeof *ms, func);
634 threadroot = &message[ms[0].ms_n];
635 for (i = 1; i < n; i++) {
636 message[ms[i-1].ms_n].m_younger = &message[ms[i].ms_n];
637 message[ms[i].ms_n].m_elder = &message[ms[i-1].ms_n];
639 } else
640 threadroot = &message[0];
641 finalize(threadroot);
642 mb.mb_threaded = 2;
643 ac_free(ms);
644 return vp && vp != (void *)-1 && !inhook &&
645 value("header") ? headers(msgvec) : 0;
/*
 * If cp starts with "re:" (the letters in any case) followed by a space
 * character, return a pointer behind that prefix and all space
 * characters after it; otherwise return cp unchanged. Only one such
 * prefix is skipped.
 */
static char const *
skipre(char const *cp)
{
	if (lowerconv(cp[0]) != 'r' || lowerconv(cp[1]) != 'e' ||
			cp[2] != ':' || !spacechar(cp[3]))
		return cp;

	for (cp += 4; spacechar(*cp); cp++)
		;
	return cp;
}
660 FL int
661 ccollapse(void *v)
663 return colpt(v, 1);
666 FL int
667 cuncollapse(void *v)
669 return colpt(v, 0);
672 static int
673 colpt(int *msgvec, int cl)
675 int *ip;
677 if (mb.mb_threaded != 1) {
678 puts("Not in threaded mode.");
679 return 1;
681 for (ip = msgvec; *ip != 0; ip++)
682 colps(&message[*ip-1], cl);
683 return 0;
686 static void
687 colps(struct message *b, int cl)
689 struct message *m;
690 int cc = 0, uc = 0;
692 if (cl && (b->m_collapsed > 0 || (b->m_flag & (MNEW|MREAD)) == MNEW))
693 return;
694 if (b->m_child) {
695 m = b->m_child;
696 colpm(m, cl, &cc, &uc);
697 for (m = m->m_younger; m; m = m->m_younger)
698 colpm(m, cl, &cc, &uc);
700 if (cl) {
701 b->m_collapsed = -cc;
702 for (m = b->m_parent; m; m = m->m_parent)
703 if (m->m_collapsed <= -uc ) {
704 m->m_collapsed += uc;
705 break;
707 } else {
708 if (b->m_collapsed > 0) {
709 b->m_collapsed = 0;
710 uc++;
712 for (m = b; m; m = m->m_parent)
713 if (m->m_collapsed <= -uc) {
714 m->m_collapsed += uc;
715 break;
720 static void
721 colpm(struct message *m, int cl, int *cc, int *uc)
723 if (cl) {
724 if (m->m_collapsed > 0)
725 (*uc)++;
726 if ((m->m_flag & (MNEW|MREAD)) != MNEW || m->m_collapsed < 0)
727 m->m_collapsed = 1;
728 if (m->m_collapsed > 0)
729 (*cc)++;
730 } else {
731 if (m->m_collapsed > 0) {
732 m->m_collapsed = 0;
733 (*uc)++;
736 if (m->m_child) {
737 m = m->m_child;
738 colpm(m, cl, cc, uc);
739 for (m = m->m_younger; m; m = m->m_younger)
740 colpm(m, cl, cc, uc);
744 FL void
745 uncollapse1(struct message *m, int always)
747 if (mb.mb_threaded == 1 && (always || m->m_collapsed > 0))
748 colps(m, 0);