Commit | Line | Data |
---|---|---|
c58b88df | 1 | /* $Cambridge: exim/src/src/regex.c,v 1.7 2005/07/01 10:49:02 ph10 Exp $ */ |
8523533c TK |
2 | |
3 | /************************************************* | |
4 | * Exim - an Internet mail transport agent * | |
5 | *************************************************/ | |
6 | ||
7 | /* Copyright (c) Tom Kistner <tom@duncanthrax.net> 2003-???? */ | |
8 | /* License: GPL */ | |
9 | ||
10 | /* Code for matching regular expressions against headers and body. | |
11 | Called from acl.c. */ | |
12 | ||
13 | #include "exim.h" | |
14 | #ifdef WITH_CONTENT_SCAN | |
15 | #include <unistd.h> | |
16 | #include <sys/mman.h> | |
17 | ||
18 | /* Structure to hold a list of Regular expressions */ | |
19 | typedef struct pcre_list { | |
20 | pcre *re; | |
21 | uschar *pcre_text; | |
22 | struct pcre_list *next; | |
23 | } pcre_list; | |
24 | ||
25 | uschar regex_match_string_buffer[1024]; | |
26 | ||
27 | extern FILE *mime_stream; | |
28 | extern uschar *mime_current_boundary; | |
29 | ||
30 | int regex(uschar **listptr) { | |
31 | int sep = 0; | |
32 | uschar *list = *listptr; | |
33 | uschar *regex_string; | |
34 | uschar regex_string_buffer[1024]; | |
f7b63901 | 35 | unsigned long mbox_size; |
8523533c TK |
36 | FILE *mbox_file; |
37 | pcre *re; | |
38 | pcre_list *re_list_head = NULL; | |
39 | pcre_list *re_list_item; | |
40 | const char *pcre_error; | |
41 | int pcre_erroffset; | |
42 | uschar *linebuffer; | |
43 | long f_pos = 0; | |
8e669ac1 | 44 | |
8523533c TK |
45 | /* reset expansion variable */ |
46 | regex_match_string = NULL; | |
8e669ac1 | 47 | |
8523533c TK |
48 | if (mime_stream == NULL) { |
49 | /* We are in the DATA ACL */ | |
50 | mbox_file = spool_mbox(&mbox_size); | |
51 | if (mbox_file == NULL) { | |
52 | /* error while spooling */ | |
53 | log_write(0, LOG_MAIN|LOG_PANIC, | |
54 | "regex acl condition: error while creating mbox spool file"); | |
55 | return DEFER; | |
56 | }; | |
57 | } | |
58 | else { | |
59 | f_pos = ftell(mime_stream); | |
60 | mbox_file = mime_stream; | |
61 | }; | |
8e669ac1 | 62 | |
8523533c TK |
63 | /* precompile our regexes */ |
64 | while ((regex_string = string_nextinlist(&list, &sep, | |
65 | regex_string_buffer, | |
66 | sizeof(regex_string_buffer))) != NULL) { | |
8e669ac1 | 67 | |
8523533c | 68 | /* parse option */ |
8e669ac1 | 69 | if ( (strcmpic(regex_string,US"false") == 0) || |
8523533c TK |
70 | (Ustrcmp(regex_string,"0") == 0) ) { |
71 | /* explicitly no matching */ | |
72 | continue; | |
73 | }; | |
8e669ac1 | 74 | |
8523533c TK |
75 | /* compile our regular expression */ |
76 | re = pcre_compile( CS regex_string, | |
77 | 0, | |
78 | &pcre_error, | |
79 | &pcre_erroffset, | |
80 | NULL ); | |
81 | ||
82 | if (re == NULL) { | |
83 | log_write(0, LOG_MAIN, | |
84 | "regex acl condition warning - error in regex '%s': %s at offset %d, skipped.", regex_string, pcre_error, pcre_erroffset); | |
85 | continue; | |
86 | } | |
87 | else { | |
88 | re_list_item = store_get(sizeof(pcre_list)); | |
89 | re_list_item->re = re; | |
90 | re_list_item->pcre_text = string_copy(regex_string); | |
91 | re_list_item->next = re_list_head; | |
92 | re_list_head = re_list_item; | |
93 | }; | |
94 | }; | |
8e669ac1 | 95 | |
8523533c TK |
96 | /* no regexes -> nothing to do */ |
97 | if (re_list_head == NULL) { | |
98 | return FAIL; | |
99 | }; | |
8e669ac1 | 100 | |
8523533c TK |
101 | /* match each line against all regexes */ |
102 | linebuffer = store_get(32767); | |
8e669ac1 | 103 | while (fgets(CS linebuffer, 32767, mbox_file) != NULL) { |
8523533c TK |
104 | if ( (mime_stream != NULL) && (mime_current_boundary != NULL) ) { |
105 | /* check boundary */ | |
106 | if (Ustrncmp(linebuffer,"--",2) == 0) { | |
107 | if (Ustrncmp((linebuffer+2),mime_current_boundary,Ustrlen(mime_current_boundary)) == 0) | |
108 | /* found boundary */ | |
109 | break; | |
110 | }; | |
111 | }; | |
112 | re_list_item = re_list_head; | |
113 | do { | |
114 | /* try matcher on the line */ | |
115 | if (pcre_exec(re_list_item->re, NULL, CS linebuffer, | |
384152a6 | 116 | (int)Ustrlen(linebuffer), 0, 0, NULL, 0) >= 0) { |
8523533c TK |
117 | Ustrncpy(regex_match_string_buffer, re_list_item->pcre_text, 1023); |
118 | regex_match_string = regex_match_string_buffer; | |
119 | if (mime_stream == NULL) | |
f1e894f3 | 120 | (void)fclose(mbox_file); |
8523533c TK |
121 | else { |
122 | clearerr(mime_stream); | |
123 | fseek(mime_stream,f_pos,SEEK_SET); | |
124 | }; | |
125 | return OK; | |
126 | }; | |
127 | re_list_item = re_list_item->next; | |
128 | } while (re_list_item != NULL); | |
129 | }; | |
8e669ac1 | 130 | |
8523533c | 131 | if (mime_stream == NULL) |
f1e894f3 | 132 | (void)fclose(mbox_file); |
8523533c TK |
133 | else { |
134 | clearerr(mime_stream); | |
135 | fseek(mime_stream,f_pos,SEEK_SET); | |
136 | }; | |
8e669ac1 | 137 | |
8523533c TK |
138 | /* no matches ... */ |
139 | return FAIL; | |
140 | } | |
141 | ||
142 | ||
143 | int mime_regex(uschar **listptr) { | |
144 | int sep = 0; | |
145 | uschar *list = *listptr; | |
146 | uschar *regex_string; | |
147 | uschar regex_string_buffer[1024]; | |
148 | pcre *re; | |
149 | pcre_list *re_list_head = NULL; | |
150 | pcre_list *re_list_item; | |
151 | const char *pcre_error; | |
152 | int pcre_erroffset; | |
153 | FILE *f; | |
154 | uschar *mime_subject = NULL; | |
155 | int mime_subject_len = 0; | |
156 | ||
157 | /* reset expansion variable */ | |
158 | regex_match_string = NULL; | |
159 | ||
160 | /* precompile our regexes */ | |
161 | while ((regex_string = string_nextinlist(&list, &sep, | |
162 | regex_string_buffer, | |
163 | sizeof(regex_string_buffer))) != NULL) { | |
8e669ac1 | 164 | |
8523533c | 165 | /* parse option */ |
8e669ac1 | 166 | if ( (strcmpic(regex_string,US"false") == 0) || |
8523533c TK |
167 | (Ustrcmp(regex_string,"0") == 0) ) { |
168 | /* explicitly no matching */ | |
169 | continue; | |
170 | }; | |
8e669ac1 | 171 | |
8523533c TK |
172 | /* compile our regular expression */ |
173 | re = pcre_compile( CS regex_string, | |
174 | 0, | |
175 | &pcre_error, | |
176 | &pcre_erroffset, | |
177 | NULL ); | |
178 | ||
179 | if (re == NULL) { | |
180 | log_write(0, LOG_MAIN, | |
181 | "regex acl condition warning - error in regex '%s': %s at offset %d, skipped.", regex_string, pcre_error, pcre_erroffset); | |
182 | continue; | |
183 | } | |
184 | else { | |
185 | re_list_item = store_get(sizeof(pcre_list)); | |
186 | re_list_item->re = re; | |
187 | re_list_item->pcre_text = string_copy(regex_string); | |
188 | re_list_item->next = re_list_head; | |
189 | re_list_head = re_list_item; | |
190 | }; | |
191 | }; | |
8e669ac1 | 192 | |
8523533c TK |
193 | /* no regexes -> nothing to do */ |
194 | if (re_list_head == NULL) { | |
195 | return FAIL; | |
196 | }; | |
8e669ac1 | 197 | |
8523533c TK |
198 | /* check if the file is already decoded */ |
199 | if (mime_decoded_filename == NULL) { | |
200 | uschar *empty = US""; | |
201 | /* no, decode it first */ | |
202 | mime_decode(&empty); | |
203 | if (mime_decoded_filename == NULL) { | |
204 | /* decoding failed */ | |
205 | log_write(0, LOG_MAIN, | |
206 | "mime_regex acl condition warning - could not decode MIME part to file."); | |
207 | return DEFER; | |
208 | }; | |
209 | }; | |
210 | ||
211 | ||
212 | /* open file */ | |
c58b88df | 213 | f = fopen(CS mime_decoded_filename, "rb"); |
8523533c TK |
214 | if (f == NULL) { |
215 | /* open failed */ | |
216 | log_write(0, LOG_MAIN, | |
217 | "mime_regex acl condition warning - can't open '%s' for reading.", mime_decoded_filename); | |
218 | return DEFER; | |
219 | }; | |
8e669ac1 | 220 | |
8523533c TK |
221 | /* get 32k memory */ |
222 | mime_subject = (uschar *)store_get(32767); | |
8e669ac1 | 223 | |
8523533c TK |
224 | /* read max 32k chars from file */ |
225 | mime_subject_len = fread(mime_subject, 1, 32766, f); | |
8e669ac1 | 226 | |
8523533c TK |
227 | re_list_item = re_list_head; |
228 | do { | |
229 | /* try matcher on the mmapped file */ | |
230 | debug_printf("Matching '%s'\n", re_list_item->pcre_text); | |
231 | if (pcre_exec(re_list_item->re, NULL, CS mime_subject, | |
232 | mime_subject_len, 0, 0, NULL, 0) >= 0) { | |
233 | Ustrncpy(regex_match_string_buffer, re_list_item->pcre_text, 1023); | |
234 | regex_match_string = regex_match_string_buffer; | |
f1e894f3 | 235 | (void)fclose(f); |
8523533c TK |
236 | return OK; |
237 | }; | |
238 | re_list_item = re_list_item->next; | |
239 | } while (re_list_item != NULL); | |
240 | ||
f1e894f3 | 241 | (void)fclose(f); |
8e669ac1 | 242 | |
8523533c TK |
243 | /* no matches ... */ |
244 | return FAIL; | |
245 | } | |
246 | ||
247 | #endif |