2 ** mhbuild.c -- expand/translate MIME composition files
4 ** This code is Copyright (c) 2002, by the authors of nmh. See the
5 ** COPYRIGHT file in the root directory of the nmh distribution for
6 ** complete copyright information.
10 ** This code was originally part of mhn.c. I split it into
11 ** a separate program (mhbuild.c). But the code still has some of
12 ** the mhn.c code in it. This program needs additional
13 ** streamlining and removal of unneeded code.
21 #include <h/mhparse.h>
29 #ifdef HAVE_SYS_TIME_H
30 # include <sys/time.h>
34 static struct swit switches[] = {
50 ** Directory to place tmp files. This must
51 ** be set before these routines are called.
57 static char prefix[] = "----- =_aaaaaaaaaa";
65 int make_intermediates(char *);
66 void content_error(char *, CT, char *, ...);
69 void free_content(CT);
71 void free_encoding(CT, int);
76 static int init_decoded_content(CT);
77 static char *fgetstr(char *, int, FILE *);
78 static int user_content(FILE *, char *, char *, CT *);
79 static void set_id(CT, int);
80 static int compose_content(CT);
81 static int scan_content(CT);
82 static int build_headers(CT);
83 static CT build_mime(char *);
92 static char infile[BUFSIZ];
93 static int unlink_infile = 0;
95 static char outfile[BUFSIZ];
96 static int unlink_outfile = 0;
101 int output_message(CT, char *);
102 int output_message_fp(CT, FILE *, char*);
105 void set_endian(void);
108 void free_content(CT);
112 main(int argc, char **argv)
114 char *cp, buf[BUFSIZ];
115 char buffer[BUFSIZ], *compfile = NULL;
116 char **argp, **arguments;
121 if (atexit(unlink_done) != 0) {
122 adios(EX_OSERR, NULL, "atexit failed");
125 setlocale(LC_ALL, "");
126 invo_name = mhbasename(argv[0]);
128 /* read user profile/context */
131 arguments = getarguments(invo_name, argc, argv, 1);
134 while ((cp = *argp++)) {
135 if (cp[0] == '-' && cp[1] == '\0') {
137 adios(EX_USAGE, NULL, "cannot specify both standard input and a file");
140 verbosw = 0; /* turn off -verbose listings */
144 switch (smatch(++cp, switches)) {
146 ambigsw(cp, switches);
149 adios(EX_USAGE, NULL, "-%s unknown", cp);
152 snprintf(buf, sizeof(buf), "%s [switches] file", invo_name);
153 print_help(buf, switches, 1);
154 exit(argc == 2 ? EX_OK : EX_USAGE);
156 print_version(invo_name);
157 exit(argc == 2 ? EX_OK : EX_USAGE);
171 adios(EX_USAGE, NULL, "only one composition file allowed");
179 ** Check if we've specified an additional profile
181 if ((cp = getenv("MHBUILD"))) {
182 if ((fp = fopen(cp, "r"))) {
183 readconfig((struct node **) 0, fp, cp, 0);
186 admonish("", "unable to read $MHBUILD profile (%s)",
192 ** Read the standard profile setup
194 if ((fp = fopen(cp = etcpath("mhn.defaults"), "r"))) {
195 readconfig((struct node **) 0, fp, cp, 0);
200 ** Check for storage directory. If defined, we
201 ** will store temporary files there. Else we
202 ** store them in standard nmh directory.
204 if ((cp = context_find(nmhstorage)) && *cp)
205 tmp = concat(cp, "/", invo_name, NULL);
207 tmp = getcpy(toabsdir(invo_name));
209 /* Check if we have a file to process */
211 adios(EX_USAGE, NULL, "need to specify a %s composition file",
215 ** Process the composition file from standard input.
217 if (compfile[0] == '-' && compfile[1] == '\0') {
218 /* copy standard input to temporary file */
219 strncpy(infile, m_mktemp(invo_name, NULL, &fp),
221 while (fgets(buffer, BUFSIZ, stdin))
226 /* build the content structures for MIME message */
227 ct = build_mime(infile);
229 /* output MIME message to this temporary file */
230 strncpy(outfile, m_mktemp(invo_name, NULL, &fp_out),
234 /* output the message */
235 output_message_fp(ct, fp_out, outfile);
238 /* output the temp file to standard output */
239 if ((fp = fopen(outfile, "r")) == NULL)
240 adios(EX_IOERR, outfile, "unable to open");
241 while (fgets(buffer, BUFSIZ, fp))
242 fputs(buffer, stdout);
256 ** Process the composition file from a file.
259 /* build the content structures for MIME message */
260 ct = build_mime(compfile);
262 /* output MIME message to this temporary file */
263 strncpy(outfile, m_mktemp2(compfile, invo_name, NULL, &fp_out),
267 /* output the message */
268 output_message_fp(ct, fp_out, outfile);
271 /* Rename composition draft */
272 snprintf(buffer, sizeof(buffer), "%s.orig", compfile);
273 if (rename(compfile, buffer) == NOTOK) {
274 adios(EX_IOERR, buffer, "unable to rename draft %s to", compfile);
277 /* Rename output file to take its place */
278 if (rename(outfile, compfile) == NOTOK) {
279 advise(compfile, "unable to rename output %s to", outfile);
280 rename(buffer, compfile);
294 ** Check if we need to remove stray temporary files.
299 if (unlink_outfile) {
305 ** Main routine for translating composition file
306 ** into valid MIME message. It translates the draft
307 ** into a content structure (actually a tree of content
308 ** structures). This message then can be manipulated
309 ** in various ways, including being output via
313 build_mime(char *infile)
316 char buf[BUFSIZ], name[NAMESZ];
325 /* open the composition draft */
326 if ((in = fopen(infile, "r")) == NULL)
327 adios(EX_IOERR, infile, "unable to open for reading");
330 ** Allocate space for primary (outside) content
332 if ((ct = (CT) calloc(1, sizeof(*ct))) == NULL)
333 adios(EX_OSERR, NULL, "out of memory");
336 ** Allocate structure for handling decoded content
337 ** for this part. We don't really need this, but
338 ** allocate it to remain consistent.
340 init_decoded_content(ct);
343 ** Parse some of the header fields in the composition
344 ** draft into the linked list of header fields for
345 ** the new MIME message.
347 for (compnum = 1, state = FLD;;) {
348 switch (state = m_getfld(state, name, buf, sizeof(buf), in)) {
354 /* abort if draft has Mime-Version header field */
355 if (!mh_strcasecmp(name, VRSN_FIELD))
356 adios(EX_CONFIG, NULL, "draft shouldn't contain %s: field", VRSN_FIELD);
359 ** abort if draft has Content-Transfer-Encoding
362 if (!mh_strcasecmp(name, ENCODING_FIELD))
363 adios(EX_CONFIG, NULL, "draft shouldn't contain %s: field", ENCODING_FIELD);
365 /* ignore any Content-Type fields in the header */
366 if (!mh_strcasecmp(name, TYPE_FIELD)) {
367 while (state == FLDPLUS)
368 state = m_getfld(state, name, buf,
373 /* get copies of the buffers */
377 /* if necessary, get rest of field */
378 while (state == FLDPLUS) {
379 state = m_getfld(state, name, buf,
381 vp = add(buf, vp); /* add to prev value */
384 /* Now add the header data to the list */
385 add_header(ct, np, vp);
388 /* if this wasn't the last hdr field, then continue */
394 adios(EX_CONFIG, NULL, "draft has empty body -- no directives!");
399 fseek(in, (long) (-strlen(buf)), SEEK_CUR);
404 adios(EX_CONFIG, NULL, "message format error in component #%d",
408 adios(EX_SOFTWARE, NULL, "getfld() returned %d", state);
414 ** Now add the MIME-Version header field
415 ** to the list of header fields.
417 np = getcpy(VRSN_FIELD);
418 vp = concat(" ", VRSN_VALUE, "\n", NULL);
419 add_header(ct, np, vp);
422 ** We initially assume we will find multiple contents in the
423 ** draft. So create a multipart/mixed content to hold everything.
424 ** We can remove this later, if it is not needed.
426 if (get_ctinfo("multipart/mixed", ct, 0) == NOTOK) {
429 ct->c_type = CT_MULTIPART;
430 ct->c_subtype = MULTI_MIXED;
431 ct->c_file = getcpy(infile);
433 if ((m = (struct multipart *) calloc(1, sizeof(*m))) == NULL)
434 adios(EX_OSERR, NULL, "out of memory");
435 ct->c_ctparams = (void *) m;
439 ** read and parse the composition file
440 ** and the directives it contains.
442 while (fgetstr(buf, sizeof(buf) - 1, in)) {
446 if (user_content(in, infile, buf, &p) == DONE) {
447 admonish(NULL, "ignoring spurious #end");
453 if ((part = (struct part *) calloc(1, sizeof(*part))) == NULL)
454 adios(EX_OSERR, NULL, "out of memory");
461 ** close the composition draft since
462 ** it's not needed any longer.
466 /* check if any contents were found */
468 adios(EX_OSERR, NULL, "no content directives found");
471 ** If only one content was found, then remove and
472 ** free the outer multipart content.
474 if (!m->mp_parts->mp_next) {
477 p = m->mp_parts->mp_part;
478 m->mp_parts->mp_part = NULL;
480 /* move header fields */
481 p->c_first_hf = ct->c_first_hf;
482 p->c_last_hf = ct->c_last_hf;
483 ct->c_first_hf = NULL;
484 ct->c_last_hf = NULL;
493 ** Fill out, or expand directives. Parse and execute
494 ** commands specified by profile composition strings.
498 if ((cp = strchr(prefix, 'a')) == NULL)
499 adios(EX_SOFTWARE, NULL, "internal error(4)");
502 ** Scan the contents. Choose a transfer encoding, and
503 ** check if prefix for multipart boundary clashes with
504 ** any of the contents.
506 while (scan_content(ct) == NOTOK) {
511 adios(EX_SOFTWARE, NULL, "giving up trying to find a unique delimiter string");
517 /* Build the rest of the header field structures */
525 ** Set up structures for placing unencoded
526 ** content when building parts.
530 init_decoded_content(CT ct)
534 if ((ce = (CE) calloc(1, sizeof(*ce))) == NULL)
535 adios(EX_OSERR, NULL, "out of memory");
538 ct->c_ceopenfnx = open7Bit; /* since unencoded */
539 ct->c_ceclosefnx = close_encoding;
540 ct->c_cesizefnx = NULL; /* since unencoded */
547 fgetstr(char *s, int n, FILE *stream)
551 for (ep = (cp = s) + n; cp < ep; ) {
554 if (!fgets(cp, n, stream))
555 return (cp != s ? s : NULL);
556 if (cp == s && *cp != '#')
559 cp += (i = strlen(cp)) - 1;
560 if (i <= 1 || *cp-- != '\n' || *cp != '\\')
571 ** Parse the composition draft for text and directives.
572 ** Do initial setup of Content structure.
576 user_content(FILE *in, char *file, char *buf, CT *ctp)
584 struct str2init *s2i;
589 if (buf[0] == '\n' || strcmp(buf, "#\n") == 0) {
594 /* allocate basic Content structure */
595 if ((ct = (CT) calloc(1, sizeof(*ct))) == NULL)
596 adios(EX_OSERR, NULL, "out of memory");
599 /* allocate basic structure for handling decoded content */
600 init_decoded_content(ct);
607 ** Handle inline text. Check if line
608 ** is one of the following forms:
610 ** 1) doesn't begin with '#' (implicit directive)
611 ** 2) begins with "##" (implicit directive)
612 ** 3) begins with "#<"
614 if (buf[0] != '#' || buf[1] == '#' || buf[1] == '<') {
618 char content[BUFSIZ];
622 cp = m_mktemp2(NULL, invo_name, NULL, &out);
624 adios(EX_CANTCREAT, "mhbuild", "unable to create temporary file");
626 /* use a temp file to collect the plain text lines */
627 ce->ce_file = getcpy(cp);
630 if (buf[0] == '#' && buf[1] == '<') {
631 strncpy(content, buf + 2, sizeof(content));
638 /* the directive is implicit */
639 strncpy(content, "text/plain", sizeof(content));
641 strncpy(buffer, buf[0] != '#' ? buf : buf + 1, sizeof(buffer));
645 if (headers >= 0 && uprf(buffer, DESCR_FIELD) &&
646 buffer[i=strlen(DESCR_FIELD)] == ':') {
650 ct->c_descr = add(buffer + i + 1, ct->c_descr);
651 if (!fgetstr(buffer, sizeof(buffer) - 1, in))
652 adios(EX_DATAERR, NULL, "end-of-file after %s: field in plaintext", DESCR_FIELD);
660 adios(EX_DATAERR, NULL, "#-directive after %s: field in plaintext", DESCR_FIELD);
668 if (headers >= 0 && uprf(buffer, DISPO_FIELD)
669 && buffer[i = strlen(DISPO_FIELD)] == ':') {
673 ct->c_dispo = add(buffer + i + 1, ct->c_dispo);
674 if (!fgetstr(buffer, sizeof(buffer) - 1, in))
675 adios(EX_DATAERR, NULL, "end-of-file after %s: field in plaintext", DISPO_FIELD);
683 adios(EX_DATAERR, NULL, "#-directive after %s: field in plaintext", DISPO_FIELD);
691 if (headers != 1 || buffer[0] != '\n')
697 if ((cp = fgetstr(buffer, sizeof(buffer) - 1, in))
700 if (buffer[0] == '#') {
703 if (buffer[1] != '#')
705 for (cp = (bp = buffer) + 1; *cp; cp++)
713 /* parse content type */
714 if (get_ctinfo(content, ct, inlineD) == NOTOK)
717 for (s2i = str2cts; s2i->si_key; s2i++)
718 if (!mh_strcasecmp(ci->ci_type, s2i->si_key))
720 if (!s2i->si_key && !uprf(ci->ci_type, "X-"))
724 ** check type specified (possibly implicitly)
726 switch (ct->c_type = s2i->si_val) {
728 if (!mh_strcasecmp(ci->ci_subtype, "rfc822")) {
729 ct->c_encoding = CE_7BIT;
734 adios(EX_DATAERR, NULL, "it doesn't make sense to define an in-line %s content",
735 ct->c_type == CT_MESSAGE ? "message" :
741 if ((ct->c_ctinitfnx = s2i->si_init))
742 (*ct->c_ctinitfnx) (ct);
747 fseek(in, pos, SEEK_SET);
752 ** If we've reached this point, the next line
753 ** must be some type of explicit directive.
757 adios(EX_DATAERR, NULL, "The #@ directive i.e. message/external-body "
758 "is not supported anymore.");
761 /* parse directive */
762 if (get_ctinfo(buf+1, ct, 1) == NOTOK)
765 /* check directive against the list of MIME types */
766 for (s2i = str2cts; s2i->si_key; s2i++)
767 if (!mh_strcasecmp(ci->ci_type, s2i->si_key))
771 ** Check if the directive specified a valid type.
772 ** This will happen if it was one of the following forms:
778 adios(EX_DATAERR, NULL, "missing subtype in \"#%s\"", ci->ci_type);
780 switch (ct->c_type = s2i->si_val) {
782 adios(EX_DATAERR, NULL, "use \"#begin ... #end\" instead of \"#%s/%s\"", ci->ci_type, ci->ci_subtype);
786 if (!mh_strcasecmp(ci->ci_subtype, "partial") ||
787 !mh_strcasecmp(ci->ci_subtype,
789 adios(EX_DATAERR, NULL, "sorry, \"#%s/%s\" isn't supported", ci->ci_type, ci->ci_subtype);
792 admonish(NULL, "use \"#forw [+folder] [msgs]\" instead of \"#%s/%s\"", ci->ci_type, ci->ci_subtype);
796 if ((ct->c_ctinitfnx = s2i->si_init))
797 (*ct->c_ctinitfnx) (ct);
801 /* Handle [file] argument */
803 /* check if specifies command to execute */
804 if (*ci->ci_magic == '|' || *ci->ci_magic == '!') {
805 for (cp = ci->ci_magic + 1; isspace(*cp); cp++)
808 adios(EX_DATAERR, NULL, "empty pipe command for #%s directive", ci->ci_type);
813 /* record filename of decoded contents */
814 ce->ce_file = ci->ci_magic;
815 if (access(ce->ce_file, R_OK) == NOTOK)
816 adios(EX_IOERR, "reading", "unable to access %s for", ce->ce_file);
823 ** No [file] argument, so check profile for
824 ** method to compose content.
826 snprintf(buffer, sizeof(buffer), "%s-compose-%s/%s",
827 invo_name, ci->ci_type, ci->ci_subtype);
828 if ((cp = context_find(buffer)) == NULL || *cp == '\0') {
829 snprintf(buffer, sizeof(buffer), "%s-compose-%s",
830 invo_name, ci->ci_type);
831 if ((cp = context_find(buffer)) == NULL ||
833 content_error(NULL, ct, "don't know how to compose content");
837 ci->ci_magic = getcpy(cp);
843 ** #forw [+folder] [msgs]
845 if (!mh_strcasecmp(ci->ci_type, "forw")) {
847 char *folder, *arguments[MAXARGS];
853 ap = brkstring(ci->ci_magic, " ", "\n");
854 for (i=0; ap[i] && i<MAXARGS-1; i++) {
855 arguments[i] = ap[i];
860 arguments[0] = seq_cur;
865 /* search the arguments for a folder name */
866 for (ap = arguments; *ap; ap++) {
868 if (*cp == '+' || *cp == '@') {
870 adios(EX_USAGE, NULL, "only one folder per #forw directive");
872 folder = getcpy(expandfol(cp));
876 /* else, use the current folder */
878 folder = getcpy(getcurfol());
880 if (!(mp = folder_read(folder)))
881 adios(EX_IOERR, NULL, "unable to read folder %s", folder);
882 for (ap = arguments; *ap; ap++) {
884 if (*cp != '+' && *cp != '@')
885 if (!m_convert(mp, cp))
892 ** If there is more than one message to include, make this
893 ** a content of type "multipart/digest" and insert each message
894 ** as a subpart. If there is only one message, then make this
895 ** a content of type "message/rfc822".
897 if (mp->numsel > 1) {
898 /* we are forwarding multiple messages */
899 if (get_ctinfo("multipart/digest", ct, 0) == NOTOK)
901 ct->c_type = CT_MULTIPART;
902 ct->c_subtype = MULTI_DIGEST;
904 if ((m = (struct multipart *)
905 calloc(1, sizeof(*m))) == NULL)
906 adios(EX_OSERR, NULL, "out of memory");
907 ct->c_ctparams = (void *) m;
910 for (msgnum = mp->lowsel; msgnum <= mp->hghsel; msgnum++) {
911 if (is_selected(mp, msgnum)) {
916 if ((p = (CT) calloc(1, sizeof(*p)))
918 adios(EX_OSERR, NULL, "out of memory");
919 init_decoded_content(p);
921 if (get_ctinfo("message/rfc822", p, 0)
924 p->c_type = CT_MESSAGE;
925 p->c_subtype = MESSAGE_RFC822;
927 snprintf(buffer, sizeof(buffer),
928 "%s/%d", mp->foldpath,
930 pe->ce_file = getcpy(buffer);
932 if ((part = (struct part *) calloc(1, sizeof(*part))) == NULL)
933 adios(EX_OSERR, NULL, "out of memory");
940 /* we are forwarding one message */
941 if (get_ctinfo("message/rfc822", ct, 0) == NOTOK)
943 ct->c_type = CT_MESSAGE;
944 ct->c_subtype = MESSAGE_RFC822;
947 snprintf(buffer, sizeof(buffer), "%s/%d",
948 mp->foldpath, msgnum);
949 ce->ce_file = getcpy(buffer);
952 folder_free(mp); /* free folder/message structure */
959 if (!mh_strcasecmp(ci->ci_type, "end")) {
966 ** #begin [ alternative | parallel ]
968 if (!mh_strcasecmp(ci->ci_type, "begin")) {
971 cp = SubMultiPart[vrsn - 1].kv_key;
972 } else if (!mh_strcasecmp(ci->ci_magic, "alternative")) {
973 vrsn = MULTI_ALTERNATE;
974 cp = SubMultiPart[vrsn - 1].kv_key;
975 } else if (!mh_strcasecmp(ci->ci_magic, "parallel")) {
976 vrsn = MULTI_PARALLEL;
977 cp = SubMultiPart[vrsn - 1].kv_key;
978 } else if (uprf(ci->ci_magic, "digest")) {
981 vrsn = MULTI_UNKNOWN;
986 snprintf(buffer, sizeof(buffer), "multipart/%s", cp);
987 if (get_ctinfo(buffer, ct, 0) == NOTOK)
989 ct->c_type = CT_MULTIPART;
990 ct->c_subtype = vrsn;
992 if ((m = (struct multipart *) calloc(1, sizeof(*m))) == NULL)
993 adios(EX_OSERR, NULL, "out of memory");
994 ct->c_ctparams = (void *) m;
997 while (fgetstr(buffer, sizeof(buffer) - 1, in)) {
1001 if (user_content(in, file, buffer, &p) == DONE) {
1003 adios(EX_DATAERR, NULL, "empty \"#begin ... #end\" sequence");
1009 if ((part = (struct part *)
1010 calloc(1, sizeof(*part))) == NULL)
1011 adios(EX_OSERR, NULL, "out of memory");
1013 pp = &part->mp_next;
1016 admonish(NULL, "premature end-of-file, missing #end");
1021 ** Unknown directive
1023 adios(EX_DATAERR, NULL, "unknown directive \"#%s\"", ci->ci_type);
1024 return NOTOK; /* NOT REACHED */
1029 set_id(CT ct, int top)
1033 static time_t clock = 0;
1034 static char *msgfmt;
1038 snprintf(msgid, sizeof(msgid), "<%d.%ld.%%d@%s>\n",
1039 (int) getpid(), (long) clock, LocalName());
1041 msgfmt = getcpy(msgid);
1043 snprintf(msgid, sizeof(msgid), msgfmt, top ? 0 : ++partno);
1044 ct->c_id = getcpy(msgid);
1049 ** Fill out, or expand the various contents in the composition
1050 ** draft. Read-in any necessary files. Parse and execute any
1051 ** commands specified by profile composition strings.
1055 compose_content(CT ct)
1057 CE ce = ct->c_cefile;
1059 switch (ct->c_type) {
1064 char partnam[BUFSIZ];
1065 struct multipart *m = (struct multipart *) ct->c_ctparams;
1069 snprintf(partnam, sizeof(partnam), "%s.",
1071 pp = partnam + strlen(partnam);
1076 /* first, we call compose_content on all the subparts */
1077 for (part = m->mp_parts, partnum = 1; part;
1078 part = part->mp_next, partnum++) {
1079 CT p = part->mp_part;
1081 sprintf(pp, "%d", partnum);
1082 p->c_partno = getcpy(partnam);
1083 if (compose_content(p) == NOTOK)
1090 /* Nothing to do for type message */
1094 ** Discrete types (text/application/audio/image/video)
1099 int xstdout, len, buflen;
1100 char *bp, **ap, *cp;
1101 char *vec[4], buffer[BUFSIZ];
1103 CI ci = &ct->c_ctinfo;
1106 if (!(cp = ci->ci_magic))
1107 adios(EX_SOFTWARE, NULL, "internal error(5)");
1109 tfile = m_mktemp2(NULL, invo_name, NULL, NULL);
1110 if (tfile == NULL) {
1111 adios(EX_CANTCREAT, "mhbuild", "unable to create temporary file");
1113 ce->ce_file = getcpy(tfile);
1118 /* Get buffer ready to go */
1121 buflen = sizeof(buffer);
1124 ** Parse composition string into buffer
1126 for ( ; *cp; cp++) {
1132 ** insert parameters from
1138 for (ap = ci->ci_attrs, ep = ci->ci_values; *ap; ap++, ep++) {
1139 snprintf(bp, buflen, "%s%s=\"%s\"", s, *ap, *ep);
1149 /* %f, and stdout is not-redirected */
1155 ** insert temporary filename
1156 ** where content should be
1159 snprintf(bp, buflen, "%s", ce->ce_file);
1163 /* insert content subtype */
1164 strncpy(bp, ci->ci_subtype, buflen);
1168 /* insert character % */
1189 printf("composing content %s/%s from command\n\t%s\n", ci->ci_type, ci->ci_subtype, buffer);
1191 fflush(stdout); /* not sure if need for -noverbose */
1198 if ((out = fopen(ce->ce_file, "w")) == NULL)
1199 adios(EX_IOERR, ce->ce_file, "unable to open for writing");
1201 switch (child_id = fork()) {
1203 adios(EX_OSERR, "fork", "unable to fork");
1208 dup2(fileno(out), 1);
1210 execvp("/bin/sh", vec);
1211 fprintf(stderr, "unable to exec ");
1218 if (pidXwait(child_id, NULL))
1231 ** Scan the content.
1233 ** 1) choose a transfer encoding.
1234 ** 2) check for clashes with multipart boundary string.
1235 ** 3) for text content, figure out which character set is being used.
1237 ** If there is a clash with one of the contents and the multipart boundary,
1238 ** this function will return NOTOK. This will cause the scanning process
1239 ** to be repeated with a different multipart boundary. It is possible
1240 ** (although highly unlikely) that this scan will be repeated multiple times.
1247 int check8bit = 0, contains8bit = 0;
1248 int checklinelen = 0, linelen = 0;
1249 int checkboundary = 0, boundaryclash = 0;
1250 int checklinespace = 0, linespace = 0; /* trailing whitespace */
1251 unsigned char *cp = NULL, buffer[BUFSIZ];
1252 struct text *t = NULL;
1254 CE ce = ct->c_cefile;
1257 ** handle multipart by scanning all subparts
1258 ** and then checking their encoding.
1260 if (ct->c_type == CT_MULTIPART) {
1261 struct multipart *m = (struct multipart *) ct->c_ctparams;
1264 /* initially mark the domain of enclosing multipart as 7bit */
1265 ct->c_encoding = CE_7BIT;
1267 for (part = m->mp_parts; part; part = part->mp_next) {
1268 CT p = part->mp_part;
1270 if (scan_content(p) == NOTOK) {
1271 /* choose encoding for subpart */
1276 ** if necessary, enlarge encoding for enclosing
1279 if (p->c_encoding == CE_BINARY)
1280 ct->c_encoding = CE_BINARY;
1281 if (p->c_encoding == CE_8BIT &&
1282 ct->c_encoding != CE_BINARY)
1283 ct->c_encoding = CE_8BIT;
1290 ** Decide what to check while scanning this content.
1292 switch (ct->c_type) {
1296 if (ct->c_subtype == TEXT_PLAIN) {
1312 case CT_APPLICATION:
1324 ** Scan the unencoded content
1326 if (check8bit || checklinelen || checklinespace || checkboundary) {
1327 if ((in = fopen(ce->ce_file, "r")) == NULL)
1328 adios(EX_IOERR, ce->ce_file, "unable to open for reading");
1329 len = strlen(prefix);
1331 while (fgets(buffer, sizeof(buffer) - 1, in)) {
1333 for (cp = buffer; *cp; cp++) {
1334 if (!isascii(*cp)) {
1336 /* no need to keep checking */
1342 if (checklinelen && (strlen(buffer) > CPERLIN + 1)) {
1344 checklinelen = 0; /* no need to keep checking */
1347 if (checklinespace &&
1348 (cp = buffer + strlen(buffer) - 2) >
1349 buffer && isspace(*cp)) {
1351 /* no need to keep checking */
1356 ** Check if content contains a line that clashes
1357 ** with our standard boundary for multipart messages.
1359 if (checkboundary && buffer[0] == '-' &&
1361 for (cp = buffer + strlen(buffer) - 1;
1366 if (strncmp(buffer + 2, prefix, len)==0 &&
1367 isdigit(buffer[2 + len])) {
1369 /* no need to keep checking */
1378 ** Decide which transfer encoding to use.
1380 switch (ct->c_type) {
1383 ** If the text content didn't specify a character
1384 ** set, we need to figure out which one was used.
1386 t = (struct text *) ct->c_ctparams;
1387 if (t->tx_charset == CHARSET_UNSPECIFIED) {
1388 CI ci = &ct->c_ctinfo;
1391 for (ap = ci->ci_attrs, ep = ci->ci_values; *ap; ap++, ep++)
1395 t->tx_charset = CHARSET_UNKNOWN;
1396 *ap = concat("charset=", write_charset_8bit(),
1399 t->tx_charset = CHARSET_USASCII;
1400 *ap = getcpy("charset=us-ascii");
1403 cp = strchr(*ap++, '=');
1409 if (contains8bit || linelen || linespace)
1410 ct->c_encoding = CE_QUOTED;
1412 ct->c_encoding = CE_7BIT;
1416 ct->c_encoding = CE_7BIT;
1419 case CT_APPLICATION:
1424 ** Forcing use of base64, because these types likely
1425 ** contain binary data and NUL bytes. Don't care about
1426 ** files that would be clean.
1428 ct->c_encoding = CE_BASE64;
1432 return (boundaryclash ? NOTOK : OK);
1437 ** Scan the content structures, and build header
1438 ** fields that will need to be output into the
1443 build_headers(CT ct)
1447 char *np, *vp, buffer[BUFSIZ];
1448 CI ci = &ct->c_ctinfo;
1451 ** If message is type multipart, then add the multipart
1452 ** boundary to the list of attribute/value pairs.
1454 if (ct->c_type == CT_MULTIPART) {
1456 static int level = 0; /* store nesting level */
1460 snprintf(buffer, sizeof(buffer), "boundary=%s%d",
1462 cp = strchr(*ap++ = getcpy(buffer), '=');
1469 ** output the content type and subtype
1471 np = getcpy(TYPE_FIELD);
1472 vp = concat(" ", ci->ci_type, "/", ci->ci_subtype, NULL);
1474 /* keep track of length of line */
1475 len = strlen(TYPE_FIELD) + strlen(ci->ci_type) +
1476 strlen(ci->ci_subtype) + 3;
1479 ** Append the attribute/value pairs to
1480 ** the end of the Content-Type line.
1482 for (ap = ci->ci_attrs, ep = ci->ci_values; *ap; ap++, ep++) {
1486 snprintf(buffer, sizeof(buffer), "%s=\"%s\"", *ap, *ep);
1487 if (len + 1 + (cc = strlen(buffer)) >= CPERLIN) {
1488 vp = add("\n\t", vp);
1494 vp = add(buffer, vp);
1499 ** Append any RFC-822 comment to the end of
1500 ** the Content-Type line.
1502 if (ci->ci_comment) {
1503 snprintf(buffer, sizeof(buffer), "(%s)", ci->ci_comment);
1504 if (len + 1 + (cc = 2 + strlen(ci->ci_comment)) >= CPERLIN) {
1505 vp = add("\n\t", vp);
1511 vp = add(buffer, vp);
1515 add_header(ct, np, vp);
1518 ** output the Content-ID
1521 np = getcpy(ID_FIELD);
1522 vp = concat(" ", ct->c_id, NULL);
1523 add_header(ct, np, vp);
1527 ** output the Content-Description
1530 np = getcpy(DESCR_FIELD);
1531 vp = concat(" ", ct->c_descr, NULL);
1532 add_header(ct, np, vp);
1536 ** output the Content-Disposition
1539 np = getcpy(DISPO_FIELD);
1540 vp = concat(" ", ct->c_dispo, NULL);
1541 add_header(ct, np, vp);
1545 ** output the Content-Transfer-Encoding
1547 switch (ct->c_encoding) {
1549 /* Nothing to output */
1553 if (ct->c_type == CT_MESSAGE)
1554 adios(EX_DATAERR, NULL, "internal error, invalid encoding");
1556 np = getcpy(ENCODING_FIELD);
1557 vp = concat(" ", "8bit", "\n", NULL);
1558 add_header(ct, np, vp);
1562 if (ct->c_type == CT_MESSAGE || ct->c_type == CT_MULTIPART)
1563 adios(EX_DATAERR, NULL, "internal error, invalid encoding");
1565 np = getcpy(ENCODING_FIELD);
1566 vp = concat(" ", "quoted-printable", "\n", NULL);
1567 add_header(ct, np, vp);
1571 if (ct->c_type == CT_MESSAGE || ct->c_type == CT_MULTIPART)
1572 adios(EX_DATAERR, NULL, "internal error, invalid encoding");
1574 np = getcpy(ENCODING_FIELD);
1575 vp = concat(" ", "base64", "\n", NULL);
1576 add_header(ct, np, vp);
1580 if (ct->c_type == CT_MESSAGE)
1581 adios(EX_DATAERR, NULL, "internal error, invalid encoding");
1583 np = getcpy(ENCODING_FIELD);
1584 vp = concat(" ", "binary", "\n", NULL);
1585 add_header(ct, np, vp);
1589 adios(EX_DATAERR, NULL, "unknown transfer encoding in content");
1594 ** Additional content specific header processing
1596 switch (ct->c_type) {
1599 struct multipart *m;
1602 m = (struct multipart *) ct->c_ctparams;
1603 for (part = m->mp_parts; part; part = part->mp_next) {