1. Don't show helo=[<ip address>] unnecessarily. 2. Update old test
[exim.git] / src / src / host.c
CommitLineData
82c19f95 1/* $Cambridge: exim/src/src/host.c,v 1.17 2005/11/11 10:02:04 ph10 Exp $ */
059ec3d9
PH
2
3/*************************************************
4* Exim - an Internet mail transport agent *
5*************************************************/
6
c988f1f4 7/* Copyright (c) University of Cambridge 1995 - 2005 */
059ec3d9
PH
8/* See the file NOTICE for conditions of use and distribution. */
9
10/* Functions for finding hosts, either by gethostbyname(), gethostbyaddr(), or
11directly via the DNS. When IPv6 is supported, getipnodebyname() and
12getipnodebyaddr() may be used instead of gethostbyname() and gethostbyaddr(),
13if the newer functions are available. This module also contains various other
14functions concerned with hosts and addresses, and a random number function,
15used for randomizing hosts with equal MXs but available for use in other parts
16of Exim. */
17
18
19#include "exim.h"
20
21
22/* Static variable for preserving the list of interface addresses in case it is
23used more than once. */
24
25static ip_address_item *local_interface_data = NULL;
26
27
28#ifdef USE_INET_NTOA_FIX
29/*************************************************
30* Replacement for broken inet_ntoa() *
31*************************************************/
32
33/* On IRIX systems, gcc uses a different structure passing convention to the
34native libraries. This causes inet_ntoa() to always yield 0.0.0.0 or
35255.255.255.255. To get round this, we provide a private version of the
36function here. It is used only if USE_INET_NTOA_FIX is set, which should happen
37only when gcc is in use on an IRIX system. Code send to me by J.T. Breitner,
38with these comments:
39
40 code by Stuart Levy
41 as seen in comp.sys.sgi.admin
42
2548ba04
PH
43August 2005: Apparently this is also needed for AIX systems; USE_INET_NTOA_FIX
44should now be set for them as well.
45
059ec3d9
PH
46Arguments: sa an in_addr structure
47Returns: pointer to static text string
48*/
49
50char *
51inet_ntoa(struct in_addr sa)
52{
53static uschar addr[20];
54sprintf(addr, "%d.%d.%d.%d",
55 (US &sa.s_addr)[0],
56 (US &sa.s_addr)[1],
57 (US &sa.s_addr)[2],
58 (US &sa.s_addr)[3]);
59 return addr;
60}
61#endif
62
63
64
65/*************************************************
66* Random number generator *
67*************************************************/
68
69/* This is a simple pseudo-random number generator. It does not have to be
70very good for the uses to which it is put. When running the regression tests,
71start with a fixed seed.
72
73Arguments:
74 limit: one more than the largest number required
75
76Returns: a pseudo-random number in the range 0 to limit-1
77*/
78
79int
80random_number(int limit)
81{
82if (random_seed == 0)
83 {
84 if (running_in_test_harness) random_seed = 42; else
85 {
86 int p = (int)getpid();
87 random_seed = (int)time(NULL) ^ ((p << 16) | p);
88 }
89 }
90random_seed = 1103515245 * random_seed + 12345;
91return (unsigned int)(random_seed >> 16) % limit;
92}
93
94
95
d8ef3577
PH
96/*************************************************
97* Sort addresses when testing *
98*************************************************/
99
100/* This function is called only when running in the test harness. It sorts a
101number of multihomed host IP addresses into the order, so as to get
102repeatability. This doesn't have to be efficient. But don't interchange IPv4
103and IPv6 addresses!
104
e7726cbf
PH
105NOTE:
106This sorting is not necessary for the new test harness, because it
107doesn't call the real DNS resolver, and its output is repeatable. However,
108until the old test harness is discarded, we need to retain this capability.
109The new harness is being developed towards the end of 2005. It will be some
110time before it can do everything that the old one can do.
111
d8ef3577
PH
112Arguments:
113 host -> the first host item
114 last -> the last host item
8e669ac1 115
d8ef3577 116Returns: nothing
8e669ac1 117*/
d8ef3577
PH
118
119static void
120sort_addresses(host_item *host, host_item *last)
121{
122BOOL done = FALSE;
123while (!done)
124 {
125 host_item *h;
126 done = TRUE;
127 for (h = host; h != last; h = h->next)
128 {
129 if ((Ustrchr(h->address, ':') == NULL) !=
130 (Ustrchr(h->next->address, ':') == NULL))
131 continue;
132 if (Ustrcmp(h->address, h->next->address) > 0)
133 {
134 uschar *temp = h->address;
135 h->address = h->next->address;
136 h->next->address = temp;
137 done = FALSE;
138 }
139 }
140 }
141}
142
143
144
e7726cbf
PH
145/*************************************************
146* Replace gethostbyname() when testing *
147*************************************************/
148
149/* This function is called instead of gethostbyname(), gethostbyname2(), or
7a546ad5
PH
150getipnodebyname() when running in the test harness. It recognizes the name
151"manyhome.test.ex" and generates a humungous number of IP addresses. It also
152recognizes an unqualified "localhost" and forces it to the appropriate loopback
153address. IP addresses are treated as literals. For other names, it uses the DNS
154to find the host name. In the new test harness, this means it will access only
e7726cbf
PH
155the fake DNS resolver. In the old harness it will call the real resolver and
156access the test zone.
157
158Arguments:
159 name the host name or a textual IP address
160 af AF_INET or AF_INET6
161 error_num where to put an error code:
162 HOST_NOT_FOUND/TRY_AGAIN/NO_RECOVERY/NO_DATA
163
164Returns: a hostent structure or NULL for an error
165*/
166
167static struct hostent *
168host_fake_gethostbyname(uschar *name, int af, int *error_num)
169{
70d67ad3 170#if HAVE_IPV6
e7726cbf 171int alen = (af == AF_INET)? sizeof(struct in_addr):sizeof(struct in6_addr);
70d67ad3
PH
172#else
173int alen = sizeof(struct in_addr);
174#endif
175
176int ipa;
e7726cbf
PH
177uschar *lname = name;
178uschar *adds;
179uschar **alist;
180struct hostent *yield;
181dns_answer dnsa;
182dns_scan dnss;
183dns_record *rr;
184
185DEBUG(D_host_lookup)
186 debug_printf("using host_fake_gethostbyname for %s (%s)\n", name,
187 (af == AF_INET)? "IPv4" : "IPv6");
188
7a546ad5
PH
189/* Handle the name that needs a vast number of IP addresses */
190
191if (Ustrcmp(name, "manyhome.test.ex") == 0 && af == AF_INET)
192 {
193 int i, j;
194 yield = store_get(sizeof(struct hostent));
195 alist = store_get(2049 * sizeof(char *));
196 adds = store_get(2048 * alen);
197 yield->h_name = CS name;
198 yield->h_aliases = NULL;
199 yield->h_addrtype = af;
200 yield->h_length = alen;
201 yield->h_addr_list = CSS alist;
202 for (i = 104; i <= 111; i++)
203 {
204 for (j = 0; j <= 255; j++)
205 {
206 *alist++ = adds;
207 *adds++ = 10;
208 *adds++ = 250;
209 *adds++ = i;
210 *adds++ = j;
211 }
212 }
213 *alist = NULL;
214 return yield;
215 }
216
217/* Handle unqualified "localhost" */
218
e7726cbf
PH
219if (Ustrcmp(name, "localhost") == 0)
220 lname = (af == AF_INET)? US"127.0.0.1" : US"::1";
221
222/* Handle a literal IP address */
223
224ipa = string_is_ip_address(lname, NULL);
225if (ipa != 0)
226 {
227 if ((ipa == 4 && af == AF_INET) ||
228 (ipa == 6 && af == AF_INET6))
229 {
230 int i, n;
231 int x[4];
232 yield = store_get(sizeof(struct hostent));
233 alist = store_get(2 * sizeof(char *));
234 adds = store_get(alen);
235 yield->h_name = CS name;
236 yield->h_aliases = NULL;
237 yield->h_addrtype = af;
238 yield->h_length = alen;
239 yield->h_addr_list = CSS alist;
240 *alist++ = adds;
241 n = host_aton(lname, x);
242 for (i = 0; i < n; i++)
243 {
244 int y = x[i];
245 *adds++ = (y >> 24) & 255;
246 *adds++ = (y >> 16) & 255;
247 *adds++ = (y >> 8) & 255;
248 *adds++ = y & 255;
249 }
250 *alist = NULL;
251 }
252
253 /* Wrong kind of literal address */
254
255 else
256 {
257 *error_num = HOST_NOT_FOUND;
258 return NULL;
259 }
260 }
261
262/* Handle a host name */
263
264else
265 {
266 int type = (af == AF_INET)? T_A:T_AAAA;
267 int rc = dns_lookup(&dnsa, lname, type, NULL);
268 int count = 0;
269
270 switch(rc)
271 {
272 case DNS_SUCCEED: break;
273 case DNS_NOMATCH: *error_num = HOST_NOT_FOUND; return NULL;
274 case DNS_NODATA: *error_num = NO_DATA; return NULL;
275 case DNS_AGAIN: *error_num = TRY_AGAIN; return NULL;
276 default:
277 case DNS_FAIL: *error_num = NO_RECOVERY; return NULL;
278 }
279
280 for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
281 rr != NULL;
282 rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
283 {
284 if (rr->type == type) count++;
285 }
286
287 yield = store_get(sizeof(struct hostent));
288 alist = store_get((count + 1) * sizeof(char **));
289 adds = store_get(count *alen);
290
291 yield->h_name = CS name;
292 yield->h_aliases = NULL;
293 yield->h_addrtype = af;
294 yield->h_length = alen;
295 yield->h_addr_list = CSS alist;
296
297 for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
298 rr != NULL;
299 rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
300 {
301 int i, n;
302 int x[4];
303 dns_address *da;
304 if (rr->type != type) continue;
305 da = dns_address_from_rr(&dnsa, rr);
306 *alist++ = adds;
307 n = host_aton(da->address, x);
308 for (i = 0; i < n; i++)
309 {
310 int y = x[i];
311 *adds++ = (y >> 24) & 255;
312 *adds++ = (y >> 16) & 255;
313 *adds++ = (y >> 8) & 255;
314 *adds++ = y & 255;
315 }
316 }
317 *alist = NULL;
318 }
319
320return yield;
321}
322
323
324
059ec3d9
PH
325/*************************************************
326* Build chain of host items from list *
327*************************************************/
328
329/* This function builds a chain of host items from a textual list of host
330names. It does not do any lookups. If randomize is true, the chain is build in
331a randomized order. There may be multiple groups of independently randomized
332hosts; they are delimited by a host name consisting of just "+".
333
334Arguments:
335 anchor anchor for the chain
336 list text list
337 randomize TRUE for randomizing
338
339Returns: nothing
340*/
341
342void
343host_build_hostlist(host_item **anchor, uschar *list, BOOL randomize)
344{
345int sep = 0;
346int fake_mx = MX_NONE; /* This value is actually -1 */
347uschar *name;
348uschar buffer[1024];
349
350if (list == NULL) return;
351if (randomize) fake_mx--; /* Start at -2 for randomizing */
352
353*anchor = NULL;
354
355while ((name = string_nextinlist(&list, &sep, buffer, sizeof(buffer))) != NULL)
356 {
357 host_item *h;
358
359 if (name[0] == '+' && name[1] == 0) /* "+" delimits a randomized group */
360 { /* ignore if not randomizing */
361 if (randomize) fake_mx--;
362 continue;
363 }
364
365 h = store_get(sizeof(host_item));
366 h->name = string_copy(name);
367 h->address = NULL;
368 h->port = PORT_NONE;
369 h->mx = fake_mx;
370 h->sort_key = randomize? (-fake_mx)*1000 + random_number(1000) : 0;
371 h->status = hstatus_unknown;
372 h->why = hwhy_unknown;
373 h->last_try = 0;
374
375 if (*anchor == NULL)
376 {
377 h->next = NULL;
378 *anchor = h;
379 }
380 else
381 {
382 host_item *hh = *anchor;
383 if (h->sort_key < hh->sort_key)
384 {
385 h->next = hh;
386 *anchor = h;
387 }
388 else
389 {
390 while (hh->next != NULL && h->sort_key >= (hh->next)->sort_key)
391 hh = hh->next;
392 h->next = hh->next;
393 hh->next = h;
394 }
395 }
396 }
397}
398
399
400
401
402
403/*************************************************
404* Extract port from address string *
405*************************************************/
406
407/* In the spool file, and in the -oMa and -oMi options, a host plus port is
408given as an IP address followed by a dot and a port number. This function
409decodes this.
410
411An alternative format for the -oMa and -oMi options is [ip address]:port which
412is what Exim 4 uses for output, because it seems to becoming commonly used,
413whereas the dot form confuses some programs/people. So we recognize that form
414too.
415
416Argument:
417 address points to the string; if there is a port, the '.' in the string
418 is overwritten with zero to terminate the address; if the string
419 is in the [xxx]:ppp format, the address is shifted left and the
420 brackets are removed
421
422Returns: 0 if there is no port, else the port number. If there's a syntax
423 error, leave the incoming address alone, and return 0.
424*/
425
426int
7cd1141b 427host_address_extract_port(uschar *address)
059ec3d9
PH
428{
429int port = 0;
430uschar *endptr;
431
432/* Handle the "bracketed with colon on the end" format */
433
434if (*address == '[')
435 {
436 uschar *rb = address + 1;
437 while (*rb != 0 && *rb != ']') rb++;
438 if (*rb++ == 0) return 0; /* Missing ]; leave invalid address */
439 if (*rb == ':')
440 {
441 port = Ustrtol(rb + 1, &endptr, 10);
442 if (*endptr != 0) return 0; /* Invalid port; leave invalid address */
443 }
444 else if (*rb != 0) return 0; /* Bad syntax; leave invalid address */
445 memmove(address, address + 1, rb - address - 2);
446 rb[-2] = 0;
447 }
448
449/* Handle the "dot on the end" format */
450
451else
452 {
453 int skip = -3; /* Skip 3 dots in IPv4 addresses */
454 address--;
455 while (*(++address) != 0)
456 {
457 int ch = *address;
458 if (ch == ':') skip = 0; /* Skip 0 dots in IPv6 addresses */
459 else if (ch == '.' && skip++ >= 0) break;
460 }
461 if (*address == 0) return 0;
462 port = Ustrtol(address + 1, &endptr, 10);
463 if (*endptr != 0) return 0; /* Invalid port; leave invalid address */
464 *address = 0;
465 }
466
467return port;
468}
469
470
7cd1141b
PH
471/*************************************************
472* Get port from a host item's name *
473*************************************************/
474
475/* This function is called when finding the IP address for a host that is in a
476list of hosts explicitly configured, such as in the manualroute router, or in a
477fallback hosts list. We see if there is a port specification at the end of the
478host name, and if so, remove it. A minimum length of 3 is required for the
479original name; nothing shorter is recognized as having a port.
480
481We test for a name ending with a sequence of digits; if preceded by colon we
482have a port if the character before the colon is ] and the name starts with [
483or if there are no other colons in the name (i.e. it's not an IPv6 address).
484
485Arguments: pointer to the host item
486Returns: a port number or PORT_NONE
487*/
488
489int
490host_item_get_port(host_item *h)
491{
492uschar *p;
493int port, x;
494int len = Ustrlen(h->name);
495
496if (len < 3 || (p = h->name + len - 1, !isdigit(*p))) return PORT_NONE;
497
498/* Extract potential port number */
499
500port = *p-- - '0';
501x = 10;
502
503while (p > h->name + 1 && isdigit(*p))
504 {
505 port += (*p-- - '0') * x;
506 x *= 10;
507 }
508
509/* The smallest value of p at this point is h->name + 1. */
510
511if (*p != ':') return PORT_NONE;
512
513if (p[-1] == ']' && h->name[0] == '[')
514 h->name = string_copyn(h->name + 1, p - h->name - 2);
515else if (Ustrchr(h->name, ':') == p)
516 h->name = string_copyn(h->name, p - h->name);
517else return PORT_NONE;
518
519DEBUG(D_route|D_host_lookup) debug_printf("host=%s port=%d\n", h->name, port);
520return port;
521}
522
523
059ec3d9
PH
524
525#ifndef STAND_ALONE /* Omit when standalone testing */
526
527/*************************************************
528* Build sender_fullhost and sender_rcvhost *
529*************************************************/
530
531/* This function is called when sender_host_name and/or sender_helo_name
532have been set. Or might have been set - for a local message read off the spool
533they won't be. In that case, do nothing. Otherwise, set up the fullhost string
534as follows:
535
536(a) No sender_host_name or sender_helo_name: "[ip address]"
537(b) Just sender_host_name: "host_name [ip address]"
82c19f95
PH
538(c) Just sender_helo_name: "(helo_name) [ip address]" unless helo is IP
539 in which case: "[ip address}"
540(d) The two are identical: "host_name [ip address]" includes helo = IP
059ec3d9
PH
541(e) The two are different: "host_name (helo_name) [ip address]"
542
543If log_incoming_port is set, the sending host's port number is added to the IP
544address.
545
546This function also builds sender_rcvhost for use in Received: lines, whose
547syntax is a bit different. This value also includes the RFC 1413 identity.
548There wouldn't be two different variables if I had got all this right in the
549first place.
550
551Because this data may survive over more than one incoming SMTP message, it has
552to be in permanent store.
553
554Arguments: none
555Returns: nothing
556*/
557
558void
559host_build_sender_fullhost(void)
560{
82c19f95 561BOOL show_helo = TRUE;
059ec3d9 562uschar *address;
82c19f95 563int len;
059ec3d9
PH
564int old_pool = store_pool;
565
566if (sender_host_address == NULL) return;
567
568store_pool = POOL_PERM;
569
570/* Set up address, with or without the port. After discussion, it seems that
571the only format that doesn't cause trouble is [aaaa]:pppp. However, we can't
572use this directly as the first item for Received: because it ain't an RFC 2822
573domain. Sigh. */
574
575address = string_sprintf("[%s]:%d", sender_host_address, sender_host_port);
576if ((log_extra_selector & LX_incoming_port) == 0 || sender_host_port <= 0)
577 *(Ustrrchr(address, ':')) = 0;
578
82c19f95
PH
579/* If there's no EHLO/HELO data, we can't show it. */
580
581if (sender_helo_name == NULL) show_helo = FALSE;
582
583/* If HELO/EHLO was followed by an IP literal, it's messy because of two
584features of IPv6. Firstly, there's the "IPv6:" prefix (Exim is liberal and
585doesn't require this, for historical reasons). Secondly, IPv6 addresses may not
586be given in canonical form, so we have to canonicize them before comparing. As
587it happens, the code works for both IPv4 and IPv6. */
588
589else if (sender_helo_name[0] == '[' &&
590 sender_helo_name[(len=Ustrlen(sender_helo_name))-1] == ']')
591 {
592 int offset = 1;
593 uschar *helo_ip;
594
595 if (strncmpic(sender_helo_name + 1, US"IPv6:", 5) == 0) offset += 5;
596 if (strncmpic(sender_helo_name + 1, US"IPv4:", 5) == 0) offset += 5;
597
598 helo_ip = string_copyn(sender_helo_name + offset, len - offset - 1);
599
600 if (string_is_ip_address(helo_ip, NULL) != 0)
601 {
602 int x[4], y[4];
603 int sizex, sizey;
604 uschar ipx[48], ipy[48]; /* large enough for full IPv6 */
605
606 sizex = host_aton(helo_ip, x);
607 sizey = host_aton(sender_host_address, y);
608
609 (void)host_nmtoa(sizex, x, -1, ipx, ':');
610 (void)host_nmtoa(sizey, y, -1, ipy, ':');
611
612 if (strcmpic(ipx, ipy) == 0) show_helo = FALSE;
613 }
614 }
615
059ec3d9
PH
616/* Host name is not verified */
617
618if (sender_host_name == NULL)
619 {
620 uschar *portptr = Ustrstr(address, "]:");
621 int size = 0;
622 int ptr = 0;
623 int adlen; /* Sun compiler doesn't like ++ in initializers */
624
625 adlen = (portptr == NULL)? Ustrlen(address) : (++portptr - address);
626 sender_fullhost = (sender_helo_name == NULL)? address :
627 string_sprintf("(%s) %s", sender_helo_name, address);
628
629 sender_rcvhost = string_cat(NULL, &size, &ptr, address, adlen);
630
82c19f95 631 if (sender_ident != NULL || show_helo || portptr != NULL)
059ec3d9
PH
632 {
633 int firstptr;
634 sender_rcvhost = string_cat(sender_rcvhost, &size, &ptr, US" (", 2);
635 firstptr = ptr;
636
637 if (portptr != NULL)
638 sender_rcvhost = string_append(sender_rcvhost, &size, &ptr, 2, US"port=",
639 portptr + 1);
640
82c19f95 641 if (show_helo)
059ec3d9
PH
642 sender_rcvhost = string_append(sender_rcvhost, &size, &ptr, 2,
643 (firstptr == ptr)? US"helo=" : US" helo=", sender_helo_name);
644
645 if (sender_ident != NULL)
646 sender_rcvhost = string_append(sender_rcvhost, &size, &ptr, 2,
647 (firstptr == ptr)? US"ident=" : US" ident=", sender_ident);
648
649 sender_rcvhost = string_cat(sender_rcvhost, &size, &ptr, US")", 1);
650 }
651
652 sender_rcvhost[ptr] = 0; /* string_cat() always leaves room */
653
654 /* Release store, because string_cat allocated a minimum of 100 bytes that
655 are rarely completely used. */
656
657 store_reset(sender_rcvhost + ptr + 1);
658 }
659
82c19f95
PH
660/* Host name is known and verified. Unless we've already found that the HELO
661data matches the IP address, compare it with the name. */
059ec3d9
PH
662
663else
664 {
82c19f95
PH
665 if (show_helo && strcmpic(sender_host_name, sender_helo_name) == 0)
666 show_helo = FALSE;
5dd9625b 667
82c19f95 668 if (show_helo)
059ec3d9
PH
669 {
670 sender_fullhost = string_sprintf("%s (%s) %s", sender_host_name,
671 sender_helo_name, address);
672 sender_rcvhost = (sender_ident == NULL)?
673 string_sprintf("%s (%s helo=%s)", sender_host_name,
674 address, sender_helo_name) :
675 string_sprintf("%s\n\t(%s helo=%s ident=%s)", sender_host_name,
676 address, sender_helo_name, sender_ident);
677 }
82c19f95
PH
678 else
679 {
680 sender_fullhost = string_sprintf("%s %s", sender_host_name, address);
681 sender_rcvhost = (sender_ident == NULL)?
682 string_sprintf("%s (%s)", sender_host_name, address) :
683 string_sprintf("%s (%s ident=%s)", sender_host_name, address,
684 sender_ident);
685 }
059ec3d9
PH
686 }
687
688store_pool = old_pool;
689
690DEBUG(D_host_lookup) debug_printf("sender_fullhost = %s\n", sender_fullhost);
691DEBUG(D_host_lookup) debug_printf("sender_rcvhost = %s\n", sender_rcvhost);
692}
693
694
695
696/*************************************************
697* Build host+ident message *
698*************************************************/
699
700/* Used when logging rejections and various ACL and SMTP incidents. The text
701return depends on whether sender_fullhost and sender_ident are set or not:
702
703 no ident, no host => U=unknown
704 no ident, host set => H=sender_fullhost
705 ident set, no host => U=ident
706 ident set, host set => H=sender_fullhost U=ident
707
708Arguments:
709 useflag TRUE if first item to be flagged (H= or U=); if there are two
710 items, the second is always flagged
711
712Returns: pointer to a string in big_buffer
713*/
714
715uschar *
716host_and_ident(BOOL useflag)
717{
718if (sender_fullhost == NULL)
719 {
720 (void)string_format(big_buffer, big_buffer_size, "%s%s", useflag? "U=" : "",
721 (sender_ident == NULL)? US"unknown" : sender_ident);
722 }
723else
724 {
725 uschar *flag = useflag? US"H=" : US"";
726 uschar *iface = US"";
727 if ((log_extra_selector & LX_incoming_interface) != 0 &&
728 interface_address != NULL)
729 iface = string_sprintf(" I=[%s]:%d", interface_address, interface_port);
730 if (sender_ident == NULL)
731 (void)string_format(big_buffer, big_buffer_size, "%s%s%s",
732 flag, sender_fullhost, iface);
733 else
734 (void)string_format(big_buffer, big_buffer_size, "%s%s%s U=%s",
735 flag, sender_fullhost, iface, sender_ident);
736 }
737return big_buffer;
738}
739
740#endif /* STAND_ALONE */
741
742
743
744
745/*************************************************
746* Build list of local interfaces *
747*************************************************/
748
749/* This function interprets the contents of the local_interfaces or
750extra_local_interfaces options, and creates an ip_address_item block for each
751item on the list. There is no special interpretation of any IP addresses; in
752particular, 0.0.0.0 and ::0 are returned without modification. If any address
753includes a port, it is set in the block. Otherwise the port value is set to
754zero.
755
756Arguments:
757 list the list
758 name the name of the option being expanded
759
760Returns: a chain of ip_address_items, each containing to a textual
761 version of an IP address, and a port number (host order) or
762 zero if no port was given with the address
763*/
764
765ip_address_item *
766host_build_ifacelist(uschar *list, uschar *name)
767{
768int sep = 0;
769uschar *s;
770uschar buffer[64];
771ip_address_item *yield = NULL;
772ip_address_item *last = NULL;
773ip_address_item *next;
774
775while ((s = string_nextinlist(&list, &sep, buffer, sizeof(buffer))) != NULL)
776 {
7cd1141b 777 int port = host_address_extract_port(s); /* Leaves just the IP address */
a5a28604 778 if (string_is_ip_address(s, NULL) == 0)
059ec3d9
PH
779 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "Malformed IP address \"%s\" in %s",
780 s, name);
781
782 /* This use of strcpy() is OK because we have checked that s is a valid IP
783 address above. The field in the ip_address_item is large enough to hold an
784 IPv6 address. */
785
786 next = store_get(sizeof(ip_address_item));
787 next->next = NULL;
788 Ustrcpy(next->address, s);
789 next->port = port;
790 next->v6_include_v4 = FALSE;
791
792 if (yield == NULL) yield = last = next; else
793 {
794 last->next = next;
795 last = next;
796 }
797 }
798
799return yield;
800}
801
802
803
804
805
806/*************************************************
807* Find addresses on local interfaces *
808*************************************************/
809
810/* This function finds the addresses of local IP interfaces. These are used
811when testing for routing to the local host. As the function may be called more
812than once, the list is preserved in permanent store, pointed to by a static
813variable, to save doing the work more than once per process.
814
815The generic list of interfaces is obtained by calling host_build_ifacelist()
816for local_interfaces and extra_local_interfaces. This list scanned to remove
817duplicates (which may exist with different ports - not relevant here). If
818either of the wildcard IP addresses (0.0.0.0 and ::0) are encountered, they are
819replaced by the appropriate (IPv4 or IPv6) list of actual local interfaces,
820obtained from os_find_running_interfaces().
821
822Arguments: none
823Returns: a chain of ip_address_items, each containing to a textual
824 version of an IP address; the port numbers are not relevant
825*/
826
827
828/* First, a local subfunction to add an interface to a list in permanent store,
829but only if there isn't a previous copy of that address on the list. */
830
831static ip_address_item *
832add_unique_interface(ip_address_item *list, ip_address_item *ipa)
833{
834ip_address_item *ipa2;
835for (ipa2 = list; ipa2 != NULL; ipa2 = ipa2->next)
836 if (Ustrcmp(ipa2->address, ipa->address) == 0) return list;
837ipa2 = store_get_perm(sizeof(ip_address_item));
838*ipa2 = *ipa;
839ipa2->next = list;
840return ipa2;
841}
842
843
844/* This is the globally visible function */
845
846ip_address_item *
847host_find_interfaces(void)
848{
849ip_address_item *running_interfaces = NULL;
850
851if (local_interface_data == NULL)
852 {
853 void *reset_item = store_get(0);
854 ip_address_item *dlist = host_build_ifacelist(local_interfaces,
855 US"local_interfaces");
856 ip_address_item *xlist = host_build_ifacelist(extra_local_interfaces,
857 US"extra_local_interfaces");
858 ip_address_item *ipa;
859
860 if (dlist == NULL) dlist = xlist; else
861 {
862 for (ipa = dlist; ipa->next != NULL; ipa = ipa->next);
863 ipa->next = xlist;
864 }
865
866 for (ipa = dlist; ipa != NULL; ipa = ipa->next)
867 {
868 if (Ustrcmp(ipa->address, "0.0.0.0") == 0 ||
869 Ustrcmp(ipa->address, "::0") == 0)
870 {
871 ip_address_item *ipa2;
872 BOOL ipv6 = ipa->address[0] == ':';
873 if (running_interfaces == NULL)
874 running_interfaces = os_find_running_interfaces();
875 for (ipa2 = running_interfaces; ipa2 != NULL; ipa2 = ipa2->next)
876 {
877 if ((Ustrchr(ipa2->address, ':') != NULL) == ipv6)
878 local_interface_data = add_unique_interface(local_interface_data,
879 ipa2);
880 }
881 }
882 else
883 {
884 local_interface_data = add_unique_interface(local_interface_data, ipa);
885 DEBUG(D_interface)
886 {
887 debug_printf("Configured local interface: address=%s", ipa->address);
888 if (ipa->port != 0) debug_printf(" port=%d", ipa->port);
889 debug_printf("\n");
890 }
891 }
892 }
893 store_reset(reset_item);
894 }
895
896return local_interface_data;
897}
898
899
900
901
902
903/*************************************************
904* Convert network IP address to text *
905*************************************************/
906
907/* Given an IPv4 or IPv6 address in binary, convert it to a text
908string and return the result in a piece of new store. The address can
909either be given directly, or passed over in a sockaddr structure. Note
910that this isn't the converse of host_aton() because of byte ordering
911differences. See host_nmtoa() below.
912
913Arguments:
914 type if < 0 then arg points to a sockaddr, else
915 either AF_INET or AF_INET6
916 arg points to a sockaddr if type is < 0, or
917 points to an IPv4 address (32 bits), or
918 points to an IPv6 address (128 bits),
919 in both cases, in network byte order
920 buffer if NULL, the result is returned in gotten store;
921 else points to a buffer to hold the answer
922 portptr points to where to put the port number, if non NULL; only
923 used when type < 0
924
925Returns: pointer to character string
926*/
927
928uschar *
929host_ntoa(int type, const void *arg, uschar *buffer, int *portptr)
930{
931uschar *yield;
932
933/* The new world. It is annoying that we have to fish out the address from
934different places in the block, depending on what kind of address it is. It
935is also a pain that inet_ntop() returns a const uschar *, whereas the IPv4
936function inet_ntoa() returns just uschar *, and some picky compilers insist
937on warning if one assigns a const uschar * to a uschar *. Hence the casts. */
938
939#if HAVE_IPV6
940uschar addr_buffer[46];
941if (type < 0)
942 {
943 int family = ((struct sockaddr *)arg)->sa_family;
944 if (family == AF_INET6)
945 {
946 struct sockaddr_in6 *sk = (struct sockaddr_in6 *)arg;
947 yield = (uschar *)inet_ntop(family, &(sk->sin6_addr), CS addr_buffer,
948 sizeof(addr_buffer));
949 if (portptr != NULL) *portptr = ntohs(sk->sin6_port);
950 }
951 else
952 {
953 struct sockaddr_in *sk = (struct sockaddr_in *)arg;
954 yield = (uschar *)inet_ntop(family, &(sk->sin_addr), CS addr_buffer,
955 sizeof(addr_buffer));
956 if (portptr != NULL) *portptr = ntohs(sk->sin_port);
957 }
958 }
959else
960 {
961 yield = (uschar *)inet_ntop(type, arg, CS addr_buffer, sizeof(addr_buffer));
962 }
963
964/* If the result is a mapped IPv4 address, show it in V4 format. */
965
966if (Ustrncmp(yield, "::ffff:", 7) == 0) yield += 7;
967
968#else /* HAVE_IPV6 */
969
970/* The old world */
971
972if (type < 0)
973 {
974 yield = US inet_ntoa(((struct sockaddr_in *)arg)->sin_addr);
975 if (portptr != NULL) *portptr = ntohs(((struct sockaddr_in *)arg)->sin_port);
976 }
977else
978 yield = US inet_ntoa(*((struct in_addr *)arg));
979#endif
980
981/* If there is no buffer, put the string into some new store. */
982
983if (buffer == NULL) return string_copy(yield);
984
985/* Callers of this function with a non-NULL buffer must ensure that it is
986large enough to hold an IPv6 address, namely, at least 46 bytes. That's what
987makes this use of strcpy() OK. */
988
989Ustrcpy(buffer, yield);
990return buffer;
991}
992
993
994
995
996/*************************************************
997* Convert address text to binary *
998*************************************************/
999
1000/* Given the textual form of an IP address, convert it to binary in an
1001array of ints. IPv4 addresses occupy one int; IPv6 addresses occupy 4 ints.
1002The result has the first byte in the most significant byte of the first int. In
1003other words, the result is not in network byte order, but in host byte order.
1004As a result, this is not the converse of host_ntoa(), which expects network
1005byte order. See host_nmtoa() below.
1006
1007Arguments:
1008 address points to the textual address, checked for syntax
1009 bin points to an array of 4 ints
1010
1011Returns: the number of ints used
1012*/
1013
1014int
1015host_aton(uschar *address, int *bin)
1016{
1017int x[4];
1018int v4offset = 0;
1019
8e669ac1 1020/* Handle IPv6 address, which may end with an IPv4 address. It may also end
7e634d24
PH
1021with a "scope", introduced by a percent sign. This code is NOT enclosed in #if
1022HAVE_IPV6 in order that IPv6 addresses are recognized even if IPv6 is not
1023supported. */
059ec3d9
PH
1024
1025if (Ustrchr(address, ':') != NULL)
1026 {
1027 uschar *p = address;
1028 uschar *component[8];
1029 BOOL ipv4_ends = FALSE;
1030 int ci = 0;
1031 int nulloffset = 0;
1032 int v6count = 8;
1033 int i;
1034
1035 /* If the address starts with a colon, it will start with two colons.
1036 Just lose the first one, which will leave a null first component. */
8e669ac1 1037
059ec3d9
PH
1038 if (*p == ':') p++;
1039
8e669ac1
PH
1040 /* Split the address into components separated by colons. The input address
1041 is supposed to be checked for syntax. There was a case where this was
1042 overlooked; to guard against that happening again, check here and crash if
7e634d24 1043 there are too many components. */
059ec3d9 1044
7e634d24 1045 while (*p != 0 && *p != '%')
059ec3d9 1046 {
7e634d24 1047 int len = Ustrcspn(p, ":%");
059ec3d9 1048 if (len == 0) nulloffset = ci;
8e669ac1 1049 if (ci > 7) log_write(0, LOG_MAIN|LOG_PANIC_DIE,
b975ba52 1050 "Internal error: invalid IPv6 address \"%s\" passed to host_aton()",
8e669ac1 1051 address);
059ec3d9
PH
1052 component[ci++] = p;
1053 p += len;
1054 if (*p == ':') p++;
1055 }
1056
1057 /* If the final component contains a dot, it is a trailing v4 address.
1058 As the syntax is known to be checked, just set up for a trailing
1059 v4 address and restrict the v6 part to 6 components. */
1060
1061 if (Ustrchr(component[ci-1], '.') != NULL)
1062 {
1063 address = component[--ci];
1064 ipv4_ends = TRUE;
1065 v4offset = 3;
1066 v6count = 6;
1067 }
1068
1069 /* If there are fewer than 6 or 8 components, we have to insert some
1070 more empty ones in the middle. */
1071
1072 if (ci < v6count)
1073 {
1074 int insert_count = v6count - ci;
1075 for (i = v6count-1; i > nulloffset + insert_count; i--)
1076 component[i] = component[i - insert_count];
1077 while (i > nulloffset) component[i--] = US"";
1078 }
1079
1080 /* Now turn the components into binary in pairs and bung them
1081 into the vector of ints. */
1082
1083 for (i = 0; i < v6count; i += 2)
1084 bin[i/2] = (Ustrtol(component[i], NULL, 16) << 16) +
1085 Ustrtol(component[i+1], NULL, 16);
1086
1087 /* If there was no terminating v4 component, we are done. */
1088
1089 if (!ipv4_ends) return 4;
1090 }
1091
1092/* Handle IPv4 address */
1093
ff790e47 1094(void)sscanf(CS address, "%d.%d.%d.%d", x, x+1, x+2, x+3);
059ec3d9
PH
1095bin[v4offset] = (x[0] << 24) + (x[1] << 16) + (x[2] << 8) + x[3];
1096return v4offset+1;
1097}
1098
1099
1100/*************************************************
1101* Apply mask to an IP address *
1102*************************************************/
1103
1104/* Mask an address held in 1 or 4 ints, with the ms bit in the ms bit of the
1105first int, etc.
1106
1107Arguments:
1108 count the number of ints
1109 binary points to the ints to be masked
1110 mask the count of ms bits to leave, or -1 if no masking
1111
1112Returns: nothing
1113*/
1114
1115void
1116host_mask(int count, int *binary, int mask)
1117{
1118int i;
1119if (mask < 0) mask = 99999;
1120for (i = 0; i < count; i++)
1121 {
1122 int wordmask;
1123 if (mask == 0) wordmask = 0;
1124 else if (mask < 32)
1125 {
1126 wordmask = (-1) << (32 - mask);
1127 mask = 0;
1128 }
1129 else
1130 {
1131 wordmask = -1;
1132 mask -= 32;
1133 }
1134 binary[i] &= wordmask;
1135 }
1136}
1137
1138
1139
1140
1141/*************************************************
1142* Convert masked IP address in ints to text *
1143*************************************************/
1144
1145/* We can't use host_ntoa() because it assumes the binary values are in network
1146byte order, and these are the result of host_aton(), which puts them in ints in
1147host byte order. Also, we really want IPv6 addresses to be in a canonical
6f0c9a4f
PH
1148format, so we output them with no abbreviation. In a number of cases we can't
1149use the normal colon separator in them because it terminates keys in lsearch
8e669ac1 1150files, so we want to use dot instead. There's an argument that specifies what
6f0c9a4f 1151to use for IPv6 addresses.
059ec3d9
PH
1152
1153Arguments:
1154 count 1 or 4 (number of ints)
1155 binary points to the ints
1156 mask mask value; if < 0 don't add to result
1157 buffer big enough to hold the result
8e669ac1 1158 sep component separator character for IPv6 addresses
059ec3d9
PH
1159
1160Returns: the number of characters placed in buffer, not counting
1161 the final nul.
1162*/
1163
1164int
6f0c9a4f 1165host_nmtoa(int count, int *binary, int mask, uschar *buffer, int sep)
059ec3d9
PH
1166{
1167int i, j;
1168uschar *tt = buffer;
1169
1170if (count == 1)
1171 {
1172 j = binary[0];
1173 for (i = 24; i >= 0; i -= 8)
1174 {
1175 sprintf(CS tt, "%d.", (j >> i) & 255);
1176 while (*tt) tt++;
1177 }
1178 }
1179else
1180 {
1181 for (i = 0; i < 4; i++)
1182 {
1183 j = binary[i];
6f0c9a4f 1184 sprintf(CS tt, "%04x%c%04x%c", (j >> 16) & 0xffff, sep, j & 0xffff, sep);
059ec3d9
PH
1185 while (*tt) tt++;
1186 }
1187 }
1188
6f0c9a4f 1189tt--; /* lose final separator */
059ec3d9
PH
1190
1191if (mask < 0)
1192 *tt = 0;
1193else
1194 {
1195 sprintf(CS tt, "/%d", mask);
1196 while (*tt) tt++;
1197 }
1198
1199return tt - buffer;
1200}
1201
1202
1203
1204/*************************************************
1205* Check port for tls_on_connect *
1206*************************************************/
1207
1208/* This function checks whether a given incoming port is configured for tls-
1209on-connect. It is called from the daemon and from inetd handling. If the global
1210option tls_on_connect is already set, all ports operate this way. Otherwise, we
1211check the tls_on_connect_ports option for a list of ports.
1212
1213Argument: a port number
1214Returns: TRUE or FALSE
1215*/
1216
1217BOOL
1218host_is_tls_on_connect_port(int port)
1219{
1220int sep = 0;
1221uschar buffer[32];
1222uschar *list = tls_on_connect_ports;
1223uschar *s;
1224
1225if (tls_on_connect) return TRUE;
1226
1227while ((s = string_nextinlist(&list, &sep, buffer, sizeof(buffer))) != NULL)
1228 {
1229 uschar *end;
1230 int lport = Ustrtol(s, &end, 10);
1231 if (*end != 0) log_write(0, LOG_MAIN|LOG_PANIC_DIE, "tls_on_connect_ports "
1232 "contains \"%s\", which is not a port number: exim abandoned", s);
1233 if (lport == port) return TRUE;
1234 }
1235
1236return FALSE;
1237}
1238
1239
1240
1241/*************************************************
1242* Check whether host is in a network *
1243*************************************************/
1244
1245/* This function checks whether a given IP address matches a pattern that
1246represents either a single host, or a network (using CIDR notation). The caller
1247of this function must check the syntax of the arguments before calling it.
1248
1249Arguments:
1250 host string representation of the ip-address to check
1251 net string representation of the network, with optional CIDR mask
1252 maskoffset offset to the / that introduces the mask in the key
1253 zero if there is no mask
1254
1255Returns:
1256 TRUE the host is inside the network
1257 FALSE the host is NOT inside the network
1258*/
1259
1260BOOL
1261host_is_in_net(uschar *host, uschar *net, int maskoffset)
1262{
1263int i;
1264int address[4];
1265int incoming[4];
1266int mlen;
1267int size = host_aton(net, address);
1268int insize;
1269
1270/* No mask => all bits to be checked */
1271
1272if (maskoffset == 0) mlen = 99999; /* Big number */
1273 else mlen = Uatoi(net + maskoffset + 1);
1274
1275/* Convert the incoming address to binary. */
1276
1277insize = host_aton(host, incoming);
1278
1279/* Convert IPv4 addresses given in IPv6 compatible mode, which represent
1280 connections from IPv4 hosts to IPv6 hosts, that is, addresses of the form
1281 ::ffff:<v4address>, to IPv4 format. */
1282
1283if (insize == 4 && incoming[0] == 0 && incoming[1] == 0 &&
1284 incoming[2] == 0xffff)
1285 {
1286 insize = 1;
1287 incoming[0] = incoming[3];
1288 }
1289
1290/* No match if the sizes don't agree. */
1291
1292if (insize != size) return FALSE;
1293
1294/* Else do the masked comparison. */
1295
1296for (i = 0; i < size; i++)
1297 {
1298 int mask;
1299 if (mlen == 0) mask = 0;
1300 else if (mlen < 32)
1301 {
1302 mask = (-1) << (32 - mlen);
1303 mlen = 0;
1304 }
1305 else
1306 {
1307 mask = -1;
1308 mlen -= 32;
1309 }
1310 if ((incoming[i] & mask) != (address[i] & mask)) return FALSE;
1311 }
1312
1313return TRUE;
1314}
1315
1316
1317
1318/*************************************************
1319* Scan host list for local hosts *
1320*************************************************/
1321
1322/* Scan through a chain of addresses and check whether any of them is the
1323address of an interface on the local machine. If so, remove that address and
1324any previous ones with the same MX value, and all subsequent ones (which will
1325have greater or equal MX values) from the chain. Note: marking them as unusable
1326is NOT the right thing to do because it causes the hosts not to be used for
1327other domains, for which they may well be correct.
1328
1329The hosts may be part of a longer chain; we only process those between the
1330initial pointer and the "last" pointer.
1331
1332There is also a list of "pseudo-local" host names which are checked against the
1333host names. Any match causes that host item to be treated the same as one which
1334matches a local IP address.
1335
1336If the very first host is a local host, then all MX records had a precedence
1337greater than or equal to that of the local host. Either there's a problem in
1338the DNS, or an apparently remote name turned out to be an abbreviation for the
1339local host. Give a specific return code, and let the caller decide what to do.
1340Otherwise, give a success code if at least one host address has been found.
1341
1342Arguments:
1343 host pointer to the first host in the chain
1344 lastptr pointer to pointer to the last host in the chain (may be updated)
1345 removed if not NULL, set TRUE if some local addresses were removed
1346 from the list
1347
1348Returns:
1349 HOST_FOUND if there is at least one host with an IP address on the chain
1350 and an MX value less than any MX value associated with the
1351 local host
1352 HOST_FOUND_LOCAL if a local host is among the lowest-numbered MX hosts; when
1353 the host addresses were obtained from A records or
1354 gethostbyname(), the MX values are set to -1.
1355 HOST_FIND_FAILED if no valid hosts with set IP addresses were found
1356*/
1357
1358int
1359host_scan_for_local_hosts(host_item *host, host_item **lastptr, BOOL *removed)
1360{
1361int yield = HOST_FIND_FAILED;
1362host_item *last = *lastptr;
1363host_item *prev = NULL;
1364host_item *h;
1365
1366if (removed != NULL) *removed = FALSE;
1367
1368if (local_interface_data == NULL) local_interface_data = host_find_interfaces();
1369
1370for (h = host; h != last->next; h = h->next)
1371 {
1372 #ifndef STAND_ALONE
1373 if (hosts_treat_as_local != NULL)
1374 {
1375 int rc;
1376 uschar *save = deliver_domain;
1377 deliver_domain = h->name; /* set $domain */
1378 rc = match_isinlist(string_copylc(h->name), &hosts_treat_as_local, 0,
1379 &domainlist_anchor, NULL, MCL_DOMAIN, TRUE, NULL);
1380 deliver_domain = save;
1381 if (rc == OK) goto FOUND_LOCAL;
1382 }
1383 #endif
1384
1385 /* It seems that on many operating systems, 0.0.0.0 is treated as a synonym
1386 for 127.0.0.1 and refers to the local host. We therefore force it always to
1387 be treated as local. */
1388
1389 if (h->address != NULL)
1390 {
1391 ip_address_item *ip;
1392 if (Ustrcmp(h->address, "0.0.0.0") == 0) goto FOUND_LOCAL;
1393 for (ip = local_interface_data; ip != NULL; ip = ip->next)
1394 if (Ustrcmp(h->address, ip->address) == 0) goto FOUND_LOCAL;
1395 yield = HOST_FOUND; /* At least one remote address has been found */
1396 }
1397
1398 /* Update prev to point to the last host item before any that have
1399 the same MX value as the one we have just considered. */
1400
1401 if (h->next == NULL || h->next->mx != h->mx) prev = h;
1402 }
1403
1404return yield; /* No local hosts found: return HOST_FOUND or HOST_FIND_FAILED */
1405
1406/* A host whose IP address matches a local IP address, or whose name matches
1407something in hosts_treat_as_local has been found. */
1408
1409FOUND_LOCAL:
1410
1411if (prev == NULL)
1412 {
1413 HDEBUG(D_host_lookup) debug_printf((h->mx >= 0)?
1414 "local host has lowest MX\n" :
1415 "local host found for non-MX address\n");
1416 return HOST_FOUND_LOCAL;
1417 }
1418
1419HDEBUG(D_host_lookup)
1420 {
1421 debug_printf("local host in host list - removed hosts:\n");
1422 for (h = prev->next; h != last->next; h = h->next)
1423 debug_printf(" %s %s %d\n", h->name, h->address, h->mx);
1424 }
1425
1426if (removed != NULL) *removed = TRUE;
1427prev->next = last->next;
1428*lastptr = prev;
1429return yield;
1430}
1431
1432
1433
1434
1435/*************************************************
1436* Remove duplicate IPs in host list *
1437*************************************************/
1438
1439/* You would think that administrators could set up their DNS records so that
1440one ended up with a list of unique IP addresses after looking up A or MX
1441records, but apparently duplication is common. So we scan such lists and
1442remove the later duplicates. Note that we may get lists in which some host
1443addresses are not set.
1444
1445Arguments:
1446 host pointer to the first host in the chain
1447 lastptr pointer to pointer to the last host in the chain (may be updated)
1448
1449Returns: nothing
1450*/
1451
1452static void
1453host_remove_duplicates(host_item *host, host_item **lastptr)
1454{
1455while (host != *lastptr)
1456 {
1457 if (host->address != NULL)
1458 {
1459 host_item *h = host;
1460 while (h != *lastptr)
1461 {
1462 if (h->next->address != NULL &&
1463 Ustrcmp(h->next->address, host->address) == 0)
1464 {
1465 DEBUG(D_host_lookup) debug_printf("duplicate IP address %s (MX=%d) "
1466 "removed\n", host->address, h->next->mx);
1467 if (h->next == *lastptr) *lastptr = h;
1468 h->next = h->next->next;
1469 }
1470 else h = h->next;
1471 }
1472 }
1473 /* If the last item was removed, host may have become == *lastptr */
1474 if (host != *lastptr) host = host->next;
1475 }
1476}
1477
1478
1479
1480
1481/*************************************************
1482* Find sender host name by gethostbyaddr() *
1483*************************************************/
1484
1485/* This used to be the only way it was done, but it turns out that not all
1486systems give aliases for calls to gethostbyaddr() - or one of the modern
1487equivalents like getipnodebyaddr(). Fortunately, multiple PTR records are rare,
1488but they can still exist. This function is now used only when a DNS lookup of
1489the IP address fails, in order to give access to /etc/hosts.
1490
1491Arguments: none
1492Returns: OK, DEFER, FAIL
1493*/
1494
1495static int
1496host_name_lookup_byaddr(void)
1497{
1498int len;
1499uschar *s, *t;
1500struct hostent *hosts;
1501struct in_addr addr;
1502
1503/* Lookup on IPv6 system */
1504
1505#if HAVE_IPV6
1506if (Ustrchr(sender_host_address, ':') != NULL)
1507 {
1508 struct in6_addr addr6;
1509 if (inet_pton(AF_INET6, CS sender_host_address, &addr6) != 1)
1510 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "unable to parse \"%s\" as an "
1511 "IPv6 address", sender_host_address);
1512 #if HAVE_GETIPNODEBYADDR
1513 hosts = getipnodebyaddr(CS &addr6, sizeof(addr6), AF_INET6, &h_errno);
1514 #else
1515 hosts = gethostbyaddr(CS &addr6, sizeof(addr6), AF_INET6);
1516 #endif
1517 }
1518else
1519 {
1520 if (inet_pton(AF_INET, CS sender_host_address, &addr) != 1)
1521 log_write(0, LOG_MAIN|LOG_PANIC_DIE, "unable to parse \"%s\" as an "
1522 "IPv4 address", sender_host_address);
1523 #if HAVE_GETIPNODEBYADDR
1524 hosts = getipnodebyaddr(CS &addr, sizeof(addr), AF_INET, &h_errno);
1525 #else
1526 hosts = gethostbyaddr(CS &addr, sizeof(addr), AF_INET);
1527 #endif
1528 }
1529
1530/* Do lookup on IPv4 system */
1531
1532#else
1533addr.s_addr = (S_ADDR_TYPE)inet_addr(CS sender_host_address);
1534hosts = gethostbyaddr(CS(&addr), sizeof(addr), AF_INET);
1535#endif
1536
1537/* Failed to look up the host. */
1538
1539if (hosts == NULL)
1540 {
1541 HDEBUG(D_host_lookup) debug_printf("IP address lookup failed: h_errno=%d\n",
1542 h_errno);
1543 return (h_errno == TRY_AGAIN || h_errno == NO_RECOVERY) ? DEFER : FAIL;
1544 }
1545
1546/* It seems there are some records in the DNS that yield an empty name. We
1547treat this as non-existent. In some operating systems, this is returned as an
1548empty string; in others as a single dot. */
1549
1550if (hosts->h_name[0] == 0 || hosts->h_name[0] == '.')
1551 {
1552 HDEBUG(D_host_lookup) debug_printf("IP address lookup yielded an empty name: "
1553 "treated as non-existent host name\n");
1554 return FAIL;
1555 }
1556
1557/* Copy and lowercase the name, which is in static storage in many systems.
1558Put it in permanent memory. */
1559
1560s = (uschar *)hosts->h_name;
1561len = Ustrlen(s) + 1;
1562t = sender_host_name = store_get_perm(len);
1563while (*s != 0) *t++ = tolower(*s++);
1564*t = 0;
1565
1566/* If the host has aliases, build a copy of the alias list */
1567
1568if (hosts->h_aliases != NULL)
1569 {
1570 int count = 1;
1571 uschar **aliases, **ptr;
1572 for (aliases = USS hosts->h_aliases; *aliases != NULL; aliases++) count++;
1573 ptr = sender_host_aliases = store_get_perm(count * sizeof(uschar *));
1574 for (aliases = USS hosts->h_aliases; *aliases != NULL; aliases++)
1575 {
1576 uschar *s = *aliases;
1577 int len = Ustrlen(s) + 1;
1578 uschar *t = *ptr++ = store_get_perm(len);
1579 while (*s != 0) *t++ = tolower(*s++);
1580 *t = 0;
1581 }
1582 *ptr = NULL;
1583 }
1584
1585return OK;
1586}
1587
1588
1589
1590/*************************************************
1591* Find host name for incoming call *
1592*************************************************/
1593
1594/* Put the name in permanent store, pointed to by sender_host_name. We also set
1595up a list of alias names, pointed to by sender_host_alias. The list is
1596NULL-terminated. The incoming address is in sender_host_address, either in
1597dotted-quad form for IPv4 or in colon-separated form for IPv6.
1598
1599This function does a thorough check that the names it finds point back to the
1600incoming IP address. Any that do not are discarded. Note that this is relied on
1601by the ACL reverse_host_lookup check.
1602
1603On some systems, get{host,ipnode}byaddr() appears to do this internally, but
1604this it not universally true. Also, for release 4.30, this function was changed
1605to do a direct DNS lookup first, by default[1], because it turns out that that
1606is the only guaranteed way to find all the aliases on some systems. My
1607experiments indicate that Solaris gethostbyaddr() gives the aliases for but
1608Linux does not.
1609
1610[1] The actual order is controlled by the host_lookup_order option.
1611
1612Arguments: none
1613Returns: OK on success, the answer being placed in the global variable
1614 sender_host_name, with any aliases in a list hung off
1615 sender_host_aliases
1616 FAIL if no host name can be found
1617 DEFER if a temporary error was encountered
1618
1619The variable host_lookup_msg is set to an empty string on sucess, or to a
1620reason for the failure otherwise, in a form suitable for tagging onto an error
8e669ac1 1621message, and also host_lookup_failed is set TRUE if the lookup failed. If there
b08b24c8
PH
1622was a defer, host_lookup_deferred is set TRUE.
1623
1624Any dynamically constructed string for host_lookup_msg must be in permanent
1625store, because it might be used for several incoming messages on the same SMTP
059ec3d9
PH
1626connection. */
1627
1628int
1629host_name_lookup(void)
1630{
1631int old_pool, rc;
1632int sep = 0;
1633uschar *hname, *save_hostname;
1634uschar **aliases;
1635uschar buffer[256];
1636uschar *ordername;
1637uschar *list = host_lookup_order;
1638dns_record *rr;
1639dns_answer dnsa;
1640dns_scan dnss;
1641
b08b24c8
PH
1642host_lookup_deferred = host_lookup_failed = FALSE;
1643
059ec3d9
PH
1644HDEBUG(D_host_lookup)
1645 debug_printf("looking up host name for %s\n", sender_host_address);
1646
1647/* For testing the case when a lookup does not complete, we have a special
1648reserved IP address. */
1649
1650if (running_in_test_harness &&
1651 Ustrcmp(sender_host_address, "99.99.99.99") == 0)
1652 {
1653 HDEBUG(D_host_lookup)
1654 debug_printf("Test harness: host name lookup returns DEFER\n");
8e669ac1 1655 host_lookup_deferred = TRUE;
059ec3d9
PH
1656 return DEFER;
1657 }
1658
1659/* Do lookups directly in the DNS or via gethostbyaddr() (or equivalent), in
1660the order specified by the host_lookup_order option. */
1661
1662while ((ordername = string_nextinlist(&list, &sep, buffer, sizeof(buffer)))
1663 != NULL)
1664 {
1665 if (strcmpic(ordername, US"bydns") == 0)
1666 {
1667 dns_init(FALSE, FALSE);
1668 dns_build_reverse(sender_host_address, buffer);
1669 rc = dns_lookup(&dnsa, buffer, T_PTR, NULL);
1670
1671 /* The first record we come across is used for the name; others are
1672 considered to be aliases. We have to scan twice, in order to find out the
1673 number of aliases. However, if all the names are empty, we will behave as
1674 if failure. (PTR records that yield empty names have been encountered in
1675 the DNS.) */
1676
1677 if (rc == DNS_SUCCEED)
1678 {
1679 uschar **aptr = NULL;
1680 int ssize = 264;
1681 int count = 0;
1682 int old_pool = store_pool;
1683
1684 store_pool = POOL_PERM; /* Save names in permanent storage */
1685
1686 for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
1687 rr != NULL;
1688 rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
1689 {
1690 if (rr->type == T_PTR) count++;
1691 }
1692
1693 /* Get store for the list of aliases. For compatibility with
1694 gethostbyaddr, we make an empty list if there are none. */
1695
1696 aptr = sender_host_aliases = store_get(count * sizeof(uschar *));
1697
1698 /* Re-scan and extract the names */
1699
1700 for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
1701 rr != NULL;
1702 rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
1703 {
1704 uschar *s = NULL;
1705 if (rr->type != T_PTR) continue;
1706 s = store_get(ssize);
1707
1708 /* If an overlong response was received, the data will have been
1709 truncated and dn_expand may fail. */
1710
1711 if (dn_expand(dnsa.answer, dnsa.answer + dnsa.answerlen,
1712 (uschar *)(rr->data), (DN_EXPAND_ARG4_TYPE)(s), ssize) < 0)
1713 {
1714 log_write(0, LOG_MAIN, "host name alias list truncated for %s",
1715 sender_host_address);
1716 break;
1717 }
1718
1719 store_reset(s + Ustrlen(s) + 1);
1720 if (s[0] == 0)
1721 {
1722 HDEBUG(D_host_lookup) debug_printf("IP address lookup yielded an "
1723 "empty name: treated as non-existent host name\n");
1724 continue;
1725 }
1726 if (sender_host_name == NULL) sender_host_name = s;
1727 else *aptr++ = s;
1728 while (*s != 0) { *s = tolower(*s); s++; }
1729 }
1730
1731 *aptr = NULL; /* End of alias list */
1732 store_pool = old_pool; /* Reset store pool */
1733
1734 /* If we've found a names, break out of the "order" loop */
1735
1736 if (sender_host_name != NULL) break;
1737 }
1738
1739 /* If the DNS lookup deferred, we must also defer. */
1740
1741 if (rc == DNS_AGAIN)
1742 {
1743 HDEBUG(D_host_lookup)
1744 debug_printf("IP address PTR lookup gave temporary error\n");
8e669ac1 1745 host_lookup_deferred = TRUE;
059ec3d9
PH
1746 return DEFER;
1747 }
1748 }
1749
1750 /* Do a lookup using gethostbyaddr() - or equivalent */
1751
1752 else if (strcmpic(ordername, US"byaddr") == 0)
1753 {
1754 HDEBUG(D_host_lookup)
1755 debug_printf("IP address lookup using gethostbyaddr()\n");
059ec3d9 1756 rc = host_name_lookup_byaddr();
8e669ac1 1757 if (rc == DEFER)
b08b24c8 1758 {
8e669ac1 1759 host_lookup_deferred = TRUE;
b08b24c8 1760 return rc; /* Can't carry on */
8e669ac1 1761 }
059ec3d9
PH
1762 if (rc == OK) break; /* Found a name */
1763 }
1764 } /* Loop for bydns/byaddr scanning */
1765
1766/* If we have failed to find a name, return FAIL and log when required.
1767NB host_lookup_msg must be in permanent store. */
1768
1769if (sender_host_name == NULL)
1770 {
1771 if (host_checking || !log_testing_mode)
1772 log_write(L_host_lookup_failed, LOG_MAIN, "no host name found for IP "
1773 "address %s", sender_host_address);
1774 host_lookup_msg = US" (failed to find host name from IP address)";
b08b24c8 1775 host_lookup_failed = TRUE;
059ec3d9
PH
1776 return FAIL;
1777 }
1778
1779/* We have a host name. If we are running in the test harness, we want the host
1780name and its alias to appear always the same way round. There are only ever two
1781names in these tests. If one of them contains "alias", make sure it is second;
1782otherwise put them in alphabetical order. */
1783
1784if (running_in_test_harness && *sender_host_aliases != NULL &&
1785 (
1786 Ustrstr(sender_host_name, "alias") != NULL ||
1787 (
1788 Ustrstr(*sender_host_aliases, "alias") == NULL &&
1789 Ustrcmp(sender_host_name, *sender_host_aliases) > 0
1790 )
1791 ))
1792 {
1793 uschar *temp = sender_host_name;
1794 sender_host_name = *sender_host_aliases;
1795 *sender_host_aliases = temp;
1796 }
1797
1798/* Debug output what was found, after test harness swapping, for consistency */
1799
1800HDEBUG(D_host_lookup)
1801 {
1802 uschar **aliases = sender_host_aliases;
1803 debug_printf("IP address lookup yielded %s\n", sender_host_name);
1804 while (*aliases != NULL) debug_printf(" alias %s\n", *aliases++);
1805 }
1806
1807/* We need to verify that a forward lookup on the name we found does indeed
1808correspond to the address. This is for security: in principle a malefactor who
1809happened to own a reverse zone could set it to point to any names at all.
1810
1811This code was present in versions of Exim before 3.20. At that point I took it
1812out because I thought that gethostbyaddr() did the check anyway. It turns out
1813that this isn't always the case, so it's coming back in at 4.01. This version
1814is actually better, because it also checks aliases.
1815
1816The code was made more robust at release 4.21. Prior to that, it accepted all
1817the names if any of them had the correct IP address. Now the code checks all
1818the names, and accepts only those that have the correct IP address. */
1819
1820save_hostname = sender_host_name; /* Save for error messages */
1821aliases = sender_host_aliases;
1822for (hname = sender_host_name; hname != NULL; hname = *aliases++)
1823 {
1824 int rc;
1825 BOOL ok = FALSE;
1826 host_item h;
1827 h.next = NULL;
1828 h.name = hname;
1829 h.mx = MX_NONE;
1830 h.address = NULL;
1831
1832 /* When called with the 5th argument FALSE, host_find_byname() won't return
1833 HOST_FOUND_LOCAL. If the incoming address is an IPv4 address expressed in
1834 IPv6 format, we must compare the IPv4 part to any IPv4 addresses. */
1835
1836 if ((rc = host_find_byname(&h, NULL, NULL, FALSE)) == HOST_FOUND)
1837 {
1838 host_item *hh;
1839 uschar *address_ipv4 = (Ustrncmp(sender_host_address, "::ffff:", 7) == 0)?
1840 sender_host_address + 7 : sender_host_address;
1841 HDEBUG(D_host_lookup) debug_printf("checking addresses for %s\n", hname);
1842 for (hh = &h; hh != NULL; hh = hh->next)
1843 {
1844 if ((Ustrcmp(hh->address, (Ustrchr(hh->address, ':') == NULL)?
1845 address_ipv4 : sender_host_address)) == 0)
1846 {
1847 HDEBUG(D_host_lookup) debug_printf(" %s OK\n", hh->address);
1848 ok = TRUE;
1849 break;
1850 }
1851 else
1852 {
1853 HDEBUG(D_host_lookup) debug_printf(" %s\n", hh->address);
1854 }
1855 }
1856 if (!ok) HDEBUG(D_host_lookup)
1857 debug_printf("no IP address for %s matched %s\n", hname,
1858 sender_host_address);
1859 }
1860 else if (rc == HOST_FIND_AGAIN)
1861 {
1862 HDEBUG(D_host_lookup) debug_printf("temporary error for host name lookup\n");
8e669ac1 1863 host_lookup_deferred = TRUE;
059ec3d9
PH
1864 return DEFER;
1865 }
1866 else
1867 {
1868 HDEBUG(D_host_lookup) debug_printf("no IP addresses found for %s\n", hname);
1869 }
1870
1871 /* If this name is no good, and it's the sender name, set it null pro tem;
1872 if it's an alias, just remove it from the list. */
1873
1874 if (!ok)
1875 {
1876 if (hname == sender_host_name) sender_host_name = NULL; else
1877 {
1878 uschar **a; /* Don't amalgamate - some */
1879 a = --aliases; /* compilers grumble */
1880 while (*a != NULL) { *a = a[1]; a++; }
1881 }
1882 }
1883 }
1884
1885/* If sender_host_name == NULL, it means we didn't like the name. Replace
1886it with the first alias, if there is one. */
1887
1888if (sender_host_name == NULL && *sender_host_aliases != NULL)
1889 sender_host_name = *sender_host_aliases++;
1890
1891/* If we now have a main name, all is well. */
1892
1893if (sender_host_name != NULL) return OK;
1894
1895/* We have failed to find an address that matches. */
1896
1897HDEBUG(D_host_lookup)
1898 debug_printf("%s does not match any IP address for %s\n",
1899 sender_host_address, save_hostname);
1900
1901/* This message must be in permanent store */
1902
1903old_pool = store_pool;
1904store_pool = POOL_PERM;
1905host_lookup_msg = string_sprintf(" (%s does not match any IP address for %s)",
1906 sender_host_address, save_hostname);
1907store_pool = old_pool;
059ec3d9
PH
1908host_lookup_failed = TRUE;
1909return FAIL;
1910}
1911
1912
1913
1914
1915/*************************************************
1916* Find IP address(es) for host by name *
1917*************************************************/
1918
1919/* The input is a host_item structure with the name filled in and the address
1920field set to NULL. We use gethostbyname(). Of course, gethostbyname() may use
1921the DNS, but it doesn't do MX processing. If more than one address is given,
1922chain on additional host items, with other relevant fields copied.
1923
1924The second argument provides a host list (usually an IP list) of hosts to
1925ignore. This makes it possible to ignore IPv6 link-local addresses or loopback
1926addresses in unreasonable places.
1927
1928The lookup may result in a change of name. For compatibility with the dns
1929lookup, return this via fully_qualified_name as well as updating the host item.
1930The lookup may also yield more than one IP address, in which case chain on
1931subsequent host_item structures.
1932
1933Arguments:
1934 host a host item with the name and MX filled in;
1935 the address is to be filled in;
1936 multiple IP addresses cause other host items to be
1937 chained on.
1938 ignore_target_hosts a list of hosts to ignore
1939 fully_qualified_name if not NULL, set to point to host name for
1940 compatibility with host_find_bydns
1941 local_host_check TRUE if a check for the local host is wanted
1942
1943Returns: HOST_FIND_FAILED Failed to find the host or domain
1944 HOST_FIND_AGAIN Try again later
1945 HOST_FOUND Host found - data filled in
1946 HOST_FOUND_LOCAL Host found and is the local host
1947*/
1948
1949int
1950host_find_byname(host_item *host, uschar *ignore_target_hosts,
1951 uschar **fully_qualified_name, BOOL local_host_check)
1952{
1953int i, yield, times;
1954uschar **addrlist;
1955host_item *last = NULL;
1956BOOL temp_error = FALSE;
b08b24c8
PH
1957#if HAVE_IPV6
1958int af;
1959#endif
1960
1961/* If we are in the test harness, a name ending in .test.again.dns always
1962forces a temporary error response. */
1963
1964if (running_in_test_harness)
1965 {
1966 uschar *endname = host->name + Ustrlen(host->name);
1967 if (Ustrcmp(endname - 14, "test.again.dns") == 0)
1968 return HOST_FIND_AGAIN;
8e669ac1 1969 }
059ec3d9
PH
1970
1971/* In an IPv6 world, we need to scan for both kinds of address, so go round the
1972loop twice. Note that we have ensured that AF_INET6 is defined even in an IPv4
1973world, which makes for slightly tidier code. However, if dns_ipv4_lookup
1974matches the domain, we also just do IPv4 lookups here (except when testing
1975standalone). */
1976
1977#if HAVE_IPV6
059ec3d9
PH
1978 #ifndef STAND_ALONE
1979 if (dns_ipv4_lookup != NULL &&
1980 match_isinlist(host->name, &dns_ipv4_lookup, 0, NULL, NULL, MCL_DOMAIN,
1981 TRUE, NULL) == OK)
1982 { af = AF_INET; times = 1; }
1983 else
1984 #endif /* STAND_ALONE */
1985
1986 { af = AF_INET6; times = 2; }
1987
1988/* No IPv6 support */
1989
1990#else /* HAVE_IPV6 */
1991 times = 1;
1992#endif /* HAVE_IPV6 */
1993
1994/* Initialize the flag that gets set for DNS syntax check errors, so that the
1995interface to this function can be similar to host_find_bydns. */
1996
1997host_find_failed_syntax = FALSE;
1998
1999/* Loop to look up both kinds of address in an IPv6 world */
2000
2001for (i = 1; i <= times;
2002 #if HAVE_IPV6
2003 af = AF_INET, /* If 2 passes, IPv4 on the second */
2004 #endif
2005 i++)
2006 {
2007 BOOL ipv4_addr;
2008 int error_num;
2009 struct hostent *hostdata;
2010
2011 #if HAVE_IPV6
e7726cbf
PH
2012 if (running_in_test_harness)
2013 hostdata = host_fake_gethostbyname(host->name, af, &error_num);
2014 else
2015 {
059ec3d9
PH
2016 #if HAVE_GETIPNODEBYNAME
2017 hostdata = getipnodebyname(CS host->name, af, 0, &error_num);
2018 #else
2019 hostdata = gethostbyname2(CS host->name, af);
2020 error_num = h_errno;
2021 #endif
e7726cbf
PH
2022 }
2023
2024 #else /* not HAVE_IPV6 */
2025 if (running_in_test_harness)
2026 hostdata = host_fake_gethostbyname(host->name, AF_INET, &error_num);
2027 else
2028 {
2029 hostdata = gethostbyname(CS host->name);
2030 error_num = h_errno;
2031 }
2032 #endif /* HAVE_IPV6 */
059ec3d9
PH
2033
2034 if (hostdata == NULL)
2035 {
2036 uschar *error;
2037 switch (error_num)
2038 {
2039 case HOST_NOT_FOUND: error = US"HOST_NOT_FOUND"; break;
2040 case TRY_AGAIN: error = US"TRY_AGAIN"; break;
2041 case NO_RECOVERY: error = US"NO_RECOVERY"; break;
2042 case NO_DATA: error = US"NO_DATA"; break;
2043 #if NO_DATA != NO_ADDRESS
2044 case NO_ADDRESS: error = US"NO_ADDRESS"; break;
2045 #endif
2046 default: error = US"?"; break;
2047 }
2048
2049 DEBUG(D_host_lookup) debug_printf("%s returned %d (%s)\n",
2050 #if HAVE_IPV6
2051 #if HAVE_GETIPNODEBYNAME
2052 (af == AF_INET6)? "getipnodebyname(af=inet6)" : "getipnodebyname(af=inet)",
2053 #else
2054 (af == AF_INET6)? "gethostbyname2(af=inet6)" : "gethostbyname2(af=inet)",
2055 #endif
2056 #else
2057 "gethostbyname",
2058 #endif
2059 error_num, error);
2060
2061 if (error_num == TRY_AGAIN || error_num == NO_RECOVERY) temp_error = TRUE;
2062 continue;
2063 }
2064 if ((hostdata->h_addr_list)[0] == NULL) continue;
2065
2066 /* Replace the name with the fully qualified one if necessary, and fill in
2067 the fully_qualified_name pointer. */
2068
2069 if (hostdata->h_name[0] != 0 &&
2070 Ustrcmp(host->name, hostdata->h_name) != 0)
2071 host->name = string_copy_dnsdomain((uschar *)hostdata->h_name);
2072 if (fully_qualified_name != NULL) *fully_qualified_name = host->name;
2073
2074 /* Get the list of addresses. IPv4 and IPv6 addresses can be distinguished
2075 by their different lengths. Scan the list, ignoring any that are to be
2076 ignored, and build a chain from the rest. */
2077
2078 ipv4_addr = hostdata->h_length == sizeof(struct in_addr);
2079
2080 for (addrlist = USS hostdata->h_addr_list; *addrlist != NULL; addrlist++)
2081 {
2082 uschar *text_address =
2083 host_ntoa(ipv4_addr? AF_INET:AF_INET6, *addrlist, NULL, NULL);
2084
2085 #ifndef STAND_ALONE
2086 if (ignore_target_hosts != NULL &&
2087 verify_check_this_host(&ignore_target_hosts, NULL, host->name,
2088 text_address, NULL) == OK)
2089 {
2090 DEBUG(D_host_lookup)
2091 debug_printf("ignored host %s [%s]\n", host->name, text_address);
2092 continue;
2093 }
2094 #endif
2095
2096 /* If this is the first address, last == NULL and we put the data in the
2097 original block. */
2098
2099 if (last == NULL)
2100 {
2101 host->address = text_address;
2102 host->port = PORT_NONE;
2103 host->status = hstatus_unknown;
2104 host->why = hwhy_unknown;
2105 last = host;
2106 }
2107
2108 /* Else add further host item blocks for any other addresses, keeping
2109 the order. */
2110
2111 else
2112 {
2113 host_item *next = store_get(sizeof(host_item));
2114 next->name = host->name;
2115 next->mx = host->mx;
2116 next->address = text_address;
2117 next->port = PORT_NONE;
2118 next->status = hstatus_unknown;
2119 next->why = hwhy_unknown;
2120 next->last_try = 0;
2121 next->next = last->next;
2122 last->next = next;
2123 last = next;
2124 }
2125 }
2126 }
2127
2128/* If no hosts were found, the address field in the original host block will be
2129NULL. If temp_error is set, at least one of the lookups gave a temporary error,
2130so we pass that back. */
2131
2132if (host->address == NULL)
2133 {
2134 uschar *msg =
2135 #ifndef STAND_ALONE
2136 (message_id[0] == 0 && smtp_in != NULL)?
2137 string_sprintf("no IP address found for host %s (during %s)", host->name,
2138 smtp_get_connection_info()) :
2139 #endif
2140 string_sprintf("no IP address found for host %s", host->name);
2141
2142 HDEBUG(D_host_lookup) debug_printf("%s\n", msg);
2143 if (temp_error) return HOST_FIND_AGAIN;
2144 if (host_checking || !log_testing_mode)
2145 log_write(L_host_lookup_failed, LOG_MAIN, "%s", msg);
2146 return HOST_FIND_FAILED;
2147 }
2148
2149/* Remove any duplicate IP addresses, then check to see if this is the local
2150host if required. */
2151
2152host_remove_duplicates(host, &last);
2153yield = local_host_check?
2154 host_scan_for_local_hosts(host, &last, NULL) : HOST_FOUND;
2155
2156/* When running in the test harness, sort into the order of addresses so as to
d8ef3577 2157get repeatability. */
059ec3d9 2158
d8ef3577 2159if (running_in_test_harness) sort_addresses(host, last);
059ec3d9
PH
2160
2161HDEBUG(D_host_lookup)
2162 {
2163 host_item *h;
2164 if (fully_qualified_name != NULL)
2165 debug_printf("fully qualified name = %s\n", *fully_qualified_name);
2166 debug_printf("%s looked up these IP addresses:\n",
2167 #if HAVE_IPV6
2168 #if HAVE_GETIPNODEBYNAME
2169 "getipnodebyname"
2170 #else
2171 "gethostbyname2"
2172 #endif
2173 #else
2174 "gethostbyname"
2175 #endif
2176 );
2177 for (h = host; h != last->next; h = h->next)
2178 debug_printf(" name=%s address=%s\n", h->name,
2179 (h->address == NULL)? US"<null>" : h->address);
2180 }
2181
2182/* Return the found status. */
2183
2184return yield;
2185}
2186
2187
2188
2189/*************************************************
2190* Fill in a host address from the DNS *
2191*************************************************/
2192
2193/* Given a host item, with its name and mx fields set, and its address field
2194set to NULL, fill in its IP address from the DNS. If it is multi-homed, create
2195additional host items for the additional addresses, copying all the other
2196fields, and randomizing the order.
2197
2198On IPv6 systems, A6 records are sought first (but only if support for A6 is
2199configured - they may never become mainstream), then AAAA records are sought,
2200and finally A records are sought as well.
2201
2202The host name may be changed if the DNS returns a different name - e.g. fully
2203qualified or changed via CNAME. If fully_qualified_name is not NULL, dns_lookup
2204ensures that it points to the fully qualified name. However, this is the fully
2205qualified version of the original name; if a CNAME is involved, the actual
2206canonical host name may be different again, and so we get it directly from the
2207relevant RR. Note that we do NOT change the mx field of the host item in this
2208function as it may be called to set the addresses of hosts taken from MX
2209records.
2210
2211Arguments:
2212 host points to the host item we're filling in
2213 lastptr points to pointer to last host item in a chain of
2214 host items (may be updated if host is last and gets
2215 extended because multihomed)
2216 ignore_target_hosts list of hosts to ignore
2217 allow_ip if TRUE, recognize an IP address and return it
2218 fully_qualified_name if not NULL, return fully qualified name here if
2219 the contents are different (i.e. it must be preset
2220 to something)
2221
2222Returns: HOST_FIND_FAILED couldn't find A record
2223 HOST_FIND_AGAIN try again later
2224 HOST_FOUND found AAAA and/or A record(s)
2225 HOST_IGNORED found, but all IPs ignored
2226*/
2227
2228static int
2229set_address_from_dns(host_item *host, host_item **lastptr,
2230 uschar *ignore_target_hosts, BOOL allow_ip, uschar **fully_qualified_name)
2231{
2232dns_record *rr;
2233host_item *thishostlast = NULL; /* Indicates not yet filled in anything */
2234BOOL v6_find_again = FALSE;
2235int i;
2236
2237/* If allow_ip is set, a name which is an IP address returns that value
2238as its address. This is used for MX records when allow_mx_to_ip is set, for
2239those sites that feel they have to flaunt the RFC rules. */
2240
2241if (allow_ip && string_is_ip_address(host->name, NULL) != 0)
2242 {
2243 #ifndef STAND_ALONE
2244 if (ignore_target_hosts != NULL &&
2245 verify_check_this_host(&ignore_target_hosts, NULL, host->name,
2246 host->name, NULL) == OK)
2247 return HOST_IGNORED;
2248 #endif
2249
2250 host->address = host->name;
2251 host->port = PORT_NONE;
2252 return HOST_FOUND;
2253 }
2254
2255/* On an IPv6 system, go round the loop up to three times, looking for A6 and
2256AAAA records the first two times. However, unless doing standalone testing, we
2257force an IPv4 lookup if the domain matches dns_ipv4_lookup is set. Since A6
2258records look like being abandoned, support them only if explicitly configured
2259to do so. On an IPv4 system, go round the loop once only, looking only for A
2260records. */
2261
2262#if HAVE_IPV6
059ec3d9
PH
2263 #ifndef STAND_ALONE
2264 if (dns_ipv4_lookup != NULL &&
2265 match_isinlist(host->name, &dns_ipv4_lookup, 0, NULL, NULL, MCL_DOMAIN,
2266 TRUE, NULL) == OK)
2267 i = 0; /* look up A records only */
2268 else
2269 #endif /* STAND_ALONE */
2270
2271 #ifdef SUPPORT_A6
2272 i = 2; /* look up A6 and AAAA and A records */
2273 #else
2274 i = 1; /* look up AAAA and A records */
2275 #endif /* SUPPORT_A6 */
2276
2277/* The IPv4 world */
2278
2279#else /* HAVE_IPV6 */
2280 i = 0; /* look up A records only */
2281#endif /* HAVE_IPV6 */
2282
2283for (; i >= 0; i--)
2284 {
2285 static int types[] = { T_A, T_AAAA, T_A6 };
2286 int type = types[i];
2287 int randoffset = (i == 0)? 500 : 0; /* Ensures v6 sorts before v4 */
2288 dns_answer dnsa;
2289 dns_scan dnss;
2290
2291 int rc = dns_lookup(&dnsa, host->name, type, fully_qualified_name);
2292
2293 /* We want to return HOST_FIND_AGAIN if one of the A, A6, or AAAA lookups
2294 fails or times out, but not if another one succeeds. (In the early
2295 IPv6 days there are name servers that always fail on AAAA, but are happy
2296 to give out an A record. We want to proceed with that A record.) */
8e669ac1 2297
059ec3d9
PH
2298 if (rc != DNS_SUCCEED)
2299 {
2300 if (i == 0) /* Just tried for an A record, i.e. end of loop */
2301 {
2302 if (host->address != NULL) return HOST_FOUND; /* A6 or AAAA was found */
2303 if (rc == DNS_AGAIN || rc == DNS_FAIL || v6_find_again)
2304 return HOST_FIND_AGAIN;
2305 return HOST_FIND_FAILED; /* DNS_NOMATCH or DNS_NODATA */
2306 }
2307
2308 /* Tried for an A6 or AAAA record: remember if this was a temporary
2309 error, and look for the next record type. */
2310
2311 if (rc != DNS_NOMATCH && rc != DNS_NODATA) v6_find_again = TRUE;
2312 continue;
2313 }
2314
2315 /* Lookup succeeded: fill in the given host item with the first non-ignored
2316 address found; create additional items for any others. A single A6 record
2317 may generate more than one address. */
2318
2319 for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
2320 rr != NULL;
2321 rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
2322 {
2323 if (rr->type == type)
2324 {
2325 /* dns_address *da = dns_address_from_rr(&dnsa, rr); */
2326
2327 dns_address *da;
2328 da = dns_address_from_rr(&dnsa, rr);
2329
2330 DEBUG(D_host_lookup)
2331 {
2332 if (da == NULL)
2333 debug_printf("no addresses extracted from A6 RR for %s\n",
2334 host->name);
2335 }
2336
2337 /* This loop runs only once for A and AAAA records, but may run
2338 several times for an A6 record that generated multiple addresses. */
2339
2340 for (; da != NULL; da = da->next)
2341 {
2342 #ifndef STAND_ALONE
2343 if (ignore_target_hosts != NULL &&
2344 verify_check_this_host(&ignore_target_hosts, NULL,
2345 host->name, da->address, NULL) == OK)
2346 {
2347 DEBUG(D_host_lookup)
2348 debug_printf("ignored host %s [%s]\n", host->name, da->address);
2349 continue;
2350 }
2351 #endif
2352
2353 /* If this is the first address, stick it in the given host block,
2354 and change the name if the returned RR has a different name. */
2355
2356 if (thishostlast == NULL)
2357 {
2358 if (strcmpic(host->name, rr->name) != 0)
2359 host->name = string_copy_dnsdomain(rr->name);
2360 host->address = da->address;
2361 host->port = PORT_NONE;
2362 host->sort_key = host->mx * 1000 + random_number(500) + randoffset;
2363 host->status = hstatus_unknown;
2364 host->why = hwhy_unknown;
2365 thishostlast = host;
2366 }
2367
2368 /* Not the first address. Check for, and ignore, duplicates. Then
2369 insert in the chain at a random point. */
2370
2371 else
2372 {
2373 int new_sort_key;
2374 host_item *next;
2375
2376 /* End of our local chain is specified by "thishostlast". */
2377
2378 for (next = host;; next = next->next)
2379 {
2380 if (Ustrcmp(CS da->address, next->address) == 0) break;
2381 if (next == thishostlast) { next = NULL; break; }
2382 }
2383 if (next != NULL) continue; /* With loop for next address */
2384
2385 /* Not a duplicate */
2386
2387 new_sort_key = host->mx * 1000 + random_number(500) + randoffset;
2388 next = store_get(sizeof(host_item));
2389
2390 /* New address goes first: insert the new block after the first one
2391 (so as not to disturb the original pointer) but put the new address
2392 in the original block. */
2393
2394 if (new_sort_key < host->sort_key)
2395 {
2396 *next = *host;
2397 host->next = next;
2398 host->address = da->address;
2399 host->port = PORT_NONE;
2400 host->sort_key = new_sort_key;
2401 if (thishostlast == host) thishostlast = next; /* Local last */
2402 if (*lastptr == host) *lastptr = next; /* Global last */
2403 }
2404
2405 /* Otherwise scan down the addresses for this host to find the
2406 one to insert after. */
2407
2408 else
2409 {
2410 host_item *h = host;
2411 while (h != thishostlast)
2412 {
2413 if (new_sort_key < h->next->sort_key) break;
2414 h = h->next;
2415 }
2416 *next = *h;
2417 h->next = next;
2418 next->address = da->address;
2419 next->port = PORT_NONE;
2420 next->sort_key = new_sort_key;
2421 if (h == thishostlast) thishostlast = next; /* Local last */
2422 if (h == *lastptr) *lastptr = next; /* Global last */
2423 }
2424 }
2425 }
2426 }
2427 }
2428 }
2429
2430/* Control gets here only if the third lookup (the A record) succeeded.
2431However, the address may not be filled in if it was ignored. */
2432
2433return (host->address == NULL)? HOST_IGNORED : HOST_FOUND;
2434}
2435
2436
2437
2438
2439/*************************************************
2440* Find IP addresses and names for host via DNS *
2441*************************************************/
2442
2443/* The input is a host_item structure with the name filled in and the address
2444field set to NULL. This may be in a chain of other host items. The lookup may
2445result in more than one IP address, in which case we must created new host
2446blocks for the additional addresses, and insert them into the chain. The
2447original name may not be fully qualified. Use the fully_qualified_name argument
2448to return the official name, as returned by the resolver.
2449
2450Arguments:
2451 host point to initial host item
2452 ignore_target_hosts a list of hosts to ignore
2453 whichrrs flags indicating which RRs to look for:
2454 HOST_FIND_BY_SRV => look for SRV
2455 HOST_FIND_BY_MX => look for MX
2456 HOST_FIND_BY_A => look for A or AAAA
2457 also flags indicating how the lookup is done
2458 HOST_FIND_QUALIFY_SINGLE ) passed to the
2459 HOST_FIND_SEARCH_PARENTS ) resolver
2460 srv_service when SRV used, the service name
2461 srv_fail_domains DNS errors for these domains => assume nonexist
2462 mx_fail_domains DNS errors for these domains => assume nonexist
2463 fully_qualified_name if not NULL, return fully-qualified name
2464 removed set TRUE if local host was removed from the list
2465
2466Returns: HOST_FIND_FAILED Failed to find the host or domain;
2467 if there was a syntax error,
2468 host_find_failed_syntax is set.
2469 HOST_FIND_AGAIN Could not resolve at this time
2470 HOST_FOUND Host found
2471 HOST_FOUND_LOCAL The lowest MX record points to this
2472 machine, if MX records were found, or
2473 an A record that was found contains
2474 an address of the local host
2475*/
2476
2477int
2478host_find_bydns(host_item *host, uschar *ignore_target_hosts, int whichrrs,
2479 uschar *srv_service, uschar *srv_fail_domains, uschar *mx_fail_domains,
2480 uschar **fully_qualified_name, BOOL *removed)
2481{
2482host_item *h, *last;
2483dns_record *rr;
2484int rc = DNS_FAIL;
2485int ind_type = 0;
2486int yield;
2487dns_answer dnsa;
2488dns_scan dnss;
2489
2490/* Set the default fully qualified name to the incoming name, initialize the
2491resolver if necessary, set up the relevant options, and initialize the flag
2492that gets set for DNS syntax check errors. */
2493
2494if (fully_qualified_name != NULL) *fully_qualified_name = host->name;
2495dns_init((whichrrs & HOST_FIND_QUALIFY_SINGLE) != 0,
2496 (whichrrs & HOST_FIND_SEARCH_PARENTS) != 0);
2497host_find_failed_syntax = FALSE;
2498
2499/* First, if requested, look for SRV records. The service name is given; we
2500assume TCP progocol. DNS domain names are constrained to a maximum of 256
2501characters, so the code below should be safe. */
2502
2503if ((whichrrs & HOST_FIND_BY_SRV) != 0)
2504 {
2505 uschar buffer[300];
2506 uschar *temp_fully_qualified_name = buffer;
2507 int prefix_length;
2508
2509 (void)sprintf(CS buffer, "_%s._tcp.%n%.256s", srv_service, &prefix_length,
2510 host->name);
2511 ind_type = T_SRV;
2512
2513 /* Search for SRV records. If the fully qualified name is different to
2514 the input name, pass back the new original domain, without the prepended
2515 magic. */
2516
2517 rc = dns_lookup(&dnsa, buffer, ind_type, &temp_fully_qualified_name);
2518 if (temp_fully_qualified_name != buffer && fully_qualified_name != NULL)
2519 *fully_qualified_name = temp_fully_qualified_name + prefix_length;
2520
2521 /* On DNS failures, we give the "try again" error unless the domain is
2522 listed as one for which we continue. */
2523
2524 if (rc == DNS_FAIL || rc == DNS_AGAIN)
2525 {
e7726cbf 2526 #ifndef STAND_ALONE
059ec3d9
PH
2527 if (match_isinlist(host->name, &srv_fail_domains, 0, NULL, NULL, MCL_DOMAIN,
2528 TRUE, NULL) != OK)
e7726cbf 2529 #endif
059ec3d9
PH
2530 return HOST_FIND_AGAIN;
2531 DEBUG(D_host_lookup) debug_printf("DNS_%s treated as DNS_NODATA "
2532 "(domain in srv_fail_domains)\n", (rc == DNS_FAIL)? "FAIL":"AGAIN");
2533 }
2534 }
2535
2536/* If we did not find any SRV records, search the DNS for MX records, if
2537requested to do so. If the result is DNS_NOMATCH, it means there is no such
2538domain, and there's no point in going on to look for address records with the
2539same domain. The result will be DNS_NODATA if the domain exists but has no MX
2540records. On DNS failures, we give the "try again" error unless the domain is
2541listed as one for which we continue. */
2542
2543if (rc != DNS_SUCCEED && (whichrrs & HOST_FIND_BY_MX) != 0)
2544 {
2545 ind_type = T_MX;
2546 rc = dns_lookup(&dnsa, host->name, ind_type, fully_qualified_name);
2547 if (rc == DNS_NOMATCH) return HOST_FIND_FAILED;
2548 if (rc == DNS_FAIL || rc == DNS_AGAIN)
2549 {
e7726cbf 2550 #ifndef STAND_ALONE
059ec3d9
PH
2551 if (match_isinlist(host->name, &mx_fail_domains, 0, NULL, NULL, MCL_DOMAIN,
2552 TRUE, NULL) != OK)
e7726cbf 2553 #endif
059ec3d9
PH
2554 return HOST_FIND_AGAIN;
2555 DEBUG(D_host_lookup) debug_printf("DNS_%s treated as DNS_NODATA "
2556 "(domain in mx_fail_domains)\n", (rc == DNS_FAIL)? "FAIL":"AGAIN");
2557 }
2558 }
2559
2560/* If we haven't found anything yet, and we are requested to do so, try for an
2561A or AAAA record. If we find it (or them) check to see that it isn't the local
2562host. */
2563
2564if (rc != DNS_SUCCEED)
2565 {
2566 if ((whichrrs & HOST_FIND_BY_A) == 0)
2567 {
2568 DEBUG(D_host_lookup) debug_printf("Address records are not being sought\n");
2569 return HOST_FIND_FAILED;
2570 }
2571
2572 last = host; /* End of local chainlet */
2573 host->mx = MX_NONE;
2574 host->port = PORT_NONE;
2575 rc = set_address_from_dns(host, &last, ignore_target_hosts, FALSE,
2576 fully_qualified_name);
2577
2578 /* If one or more address records have been found, check that none of them
2579 are local. Since we know the host items all have their IP addresses
2580 inserted, host_scan_for_local_hosts() can only return HOST_FOUND or
2581 HOST_FOUND_LOCAL. We do not need to scan for duplicate IP addresses here,
2582 because set_address_from_dns() removes them. */
2583
2584 if (rc == HOST_FOUND)
2585 rc = host_scan_for_local_hosts(host, &last, removed);
2586 else
2587 if (rc == HOST_IGNORED) rc = HOST_FIND_FAILED; /* No special action */
2588
d8ef3577
PH
2589 /* When running in the test harness, sort into the order of addresses so as
2590 to get repeatability. */
8e669ac1 2591
d8ef3577
PH
2592 if (running_in_test_harness) sort_addresses(host, last);
2593
059ec3d9
PH
2594 DEBUG(D_host_lookup)
2595 {
2596 host_item *h;
2597 if (host->address != NULL)
2598 {
2599 if (fully_qualified_name != NULL)
2600 debug_printf("fully qualified name = %s\n", *fully_qualified_name);
2601 for (h = host; h != last->next; h = h->next)
2602 debug_printf("%s %s mx=%d sort=%d %s\n", h->name,
2603 (h->address == NULL)? US"<null>" : h->address, h->mx, h->sort_key,
2604 (h->status >= hstatus_unusable)? US"*" : US"");
2605 }
2606 }
2607
2608 return rc;
2609 }
2610
2611/* We have found one or more MX or SRV records. Sort them according to
2612precedence. Put the data for the first one into the existing host block, and
2613insert new host_item blocks into the chain for the remainder. For equal
2614precedences one is supposed to randomize the order. To make this happen, the
2615sorting is actually done on the MX value * 1000 + a random number. This is put
2616into a host field called sort_key.
2617
2618In the case of hosts with both IPv6 and IPv4 addresses, we want to choose the
2619IPv6 address in preference. At this stage, we don't know what kind of address
2620the host has. We choose a random number < 500; if later we find an A record
2621first, we add 500 to the random number. Then for any other address records, we
2622use random numbers in the range 0-499 for AAAA records and 500-999 for A
2623records.
2624
2625At this point we remove any duplicates that point to the same host, retaining
2626only the one with the lowest precedence. We cannot yet check for precedence
2627greater than that of the local host, because that test cannot be properly done
2628until the addresses have been found - an MX record may point to a name for this
2629host which is not the primary hostname. */
2630
2631last = NULL; /* Indicates that not even the first item is filled yet */
2632
2633for (rr = dns_next_rr(&dnsa, &dnss, RESET_ANSWERS);
2634 rr != NULL;
2635 rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
2636 {
2637 int precedence;
2638 int weight = 0; /* For SRV records */
2639 int port = PORT_NONE; /* For SRV records */
2640 uschar *s; /* MUST be unsigned for GETSHORT */
2641 uschar data[256];
2642
2643 if (rr->type != ind_type) continue;
2644 s = rr->data;
2645 GETSHORT(precedence, s); /* Pointer s is advanced */
2646
2647 /* For MX records, we use a random "weight" which causes multiple records of
2648 the same precedence to sort randomly. */
2649
2650 if (ind_type == T_MX)
2651 {
2652 weight = random_number(500);
2653 }
2654
2655 /* SRV records are specified with a port and a weight. The weight is used
2656 in a special algorithm. However, to start with, we just use it to order the
2657 records of equal priority (precedence). */
2658
2659 else
2660 {
2661 GETSHORT(weight, s);
2662 GETSHORT(port, s);
2663 }
2664
2665 /* Get the name of the host pointed to. */
2666
2667 (void)dn_expand(dnsa.answer, dnsa.answer + dnsa.answerlen, s,
2668 (DN_EXPAND_ARG4_TYPE)data, sizeof(data));
2669
2670 /* Check that we haven't already got this host on the chain; if we have,
2671 keep only the lower precedence. This situation shouldn't occur, but you
2672 never know what junk might get into the DNS (and this case has been seen on
2673 more than one occasion). */
2674
2675 if (last != NULL) /* This is not the first record */
2676 {
2677 host_item *prev = NULL;
2678
2679 for (h = host; h != last->next; prev = h, h = h->next)
2680 {
2681 if (strcmpic(h->name, data) == 0)
2682 {
2683 DEBUG(D_host_lookup)
2684 debug_printf("discarded duplicate host %s (MX=%d)\n", data,
2685 (precedence > h->mx)? precedence : h->mx);
2686 if (precedence >= h->mx) goto NEXT_MX_RR; /* Skip greater precedence */
2687 if (h == host) /* Override first item */
2688 {
2689 h->mx = precedence;
2690 host->sort_key = precedence * 1000 + weight;
2691 goto NEXT_MX_RR;
2692 }
2693
2694 /* Unwanted host item is not the first in the chain, so we can get
2695 get rid of it by cutting it out. */
2696
2697 prev->next = h->next;
2698 if (h == last) last = prev;
2699 break;
2700 }
2701 }
2702 }
2703
2704 /* If this is the first MX or SRV record, put the data into the existing host
2705 block. Otherwise, add a new block in the correct place; if it has to be
2706 before the first block, copy the first block's data to a new second block. */
2707
2708 if (last == NULL)
2709 {
2710 host->name = string_copy_dnsdomain(data);
2711 host->address = NULL;
2712 host->port = port;
2713 host->mx = precedence;
2714 host->sort_key = precedence * 1000 + weight;
2715 host->status = hstatus_unknown;
2716 host->why = hwhy_unknown;
2717 last = host;
2718 }
2719
2720 /* Make a new host item and seek the correct insertion place */
2721
2722 else
2723 {
2724 int sort_key = precedence * 1000 + weight;
2725 host_item *next = store_get(sizeof(host_item));
2726 next->name = string_copy_dnsdomain(data);
2727 next->address = NULL;
2728 next->port = port;
2729 next->mx = precedence;
2730 next->sort_key = sort_key;
2731 next->status = hstatus_unknown;
2732 next->why = hwhy_unknown;
2733 next->last_try = 0;
2734
2735 /* Handle the case when we have to insert before the first item. */
2736
2737 if (sort_key < host->sort_key)
2738 {
2739 host_item htemp;
2740 htemp = *host;
2741 *host = *next;
2742 *next = htemp;
2743 host->next = next;
2744 if (last == host) last = next;
2745 }
2746
2747 /* Else scan down the items we have inserted as part of this exercise;
2748 don't go further. */
2749
2750 else
2751 {
2752 for (h = host; h != last; h = h->next)
2753 {
2754 if (sort_key < h->next->sort_key)
2755 {
2756 next->next = h->next;
2757 h->next = next;
2758 break;
2759 }
2760 }
2761
2762 /* Join on after the last host item that's part of this
2763 processing if we haven't stopped sooner. */
2764
2765 if (h == last)
2766 {
2767 next->next = last->next;
2768 last->next = next;
2769 last = next;
2770 }
2771 }
2772 }
2773
2774 NEXT_MX_RR: continue;
2775 }
2776
2777/* If the list of hosts was obtained from SRV records, there are two things to
2778do. First, if there is only one host, and it's name is ".", it means there is
2779no SMTP service at this domain. Otherwise, we have to sort the hosts of equal
2780priority according to their weights, using an algorithm that is defined in RFC
27812782. The hosts are currently sorted by priority and weight. For each priority
2782group we have to pick off one host and put it first, and then repeat for any
2783remaining in the same priority group. */
2784
2785if (ind_type == T_SRV)
2786 {
2787 host_item **pptr;
2788
2789 if (host == last && host->name[0] == 0)
2790 {
2791 DEBUG(D_host_lookup) debug_printf("the single SRV record is \".\"\n");
2792 return HOST_FIND_FAILED;
2793 }
2794
2795 DEBUG(D_host_lookup)
2796 {
2797 debug_printf("original ordering of hosts from SRV records:\n");
2798 for (h = host; h != last->next; h = h->next)
2799 debug_printf(" %s P=%d W=%d\n", h->name, h->mx, h->sort_key % 1000);
2800 }
2801
2802 for (pptr = &host, h = host; h != last; pptr = &(h->next), h = h->next)
2803 {
2804 int sum = 0;
2805 host_item *hh;
2806
2807 /* Find the last following host that has the same precedence. At the same
2808 time, compute the sum of the weights and the running totals. These can be
2809 stored in the sort_key field. */
2810
2811 for (hh = h; hh != last; hh = hh->next)
2812 {
2813 int weight = hh->sort_key % 1000; /* was precedence * 1000 + weight */
2814 sum += weight;
2815 hh->sort_key = sum;
2816 if (hh->mx != hh->next->mx) break;
2817 }
2818
2819 /* If there's more than one host at this precedence (priority), we need to
2820 pick one to go first. */
2821
2822 if (hh != h)
2823 {
2824 host_item *hhh;
2825 host_item **ppptr;
2826 int randomizer = random_number(sum + 1);
2827
2828 for (ppptr = pptr, hhh = h;
2829 hhh != hh;
2830 ppptr = &(hhh->next), hhh = hhh->next)
2831 {
2832 if (hhh->sort_key >= randomizer) break;
2833 }
2834
2835 /* hhh now points to the host that should go first; ppptr points to the
2836 place that points to it. Unfortunately, if the start of the minilist is
2837 the start of the entire list, we can't just swap the items over, because
2838 we must not change the value of host, since it is passed in from outside.
2839 One day, this could perhaps be changed.
2840
2841 The special case is fudged by putting the new item *second* in the chain,
2842 and then transferring the data between the first and second items. We
2843 can't just swap the first and the chosen item, because that would mean
2844 that an item with zero weight might no longer be first. */
2845
2846 if (hhh != h)
2847 {
2848 *ppptr = hhh->next; /* Cuts it out of the chain */
2849
2850 if (h == host)
2851 {
2852 host_item temp = *h;
2853 *h = *hhh;
2854 *hhh = temp;
2855 hhh->next = temp.next;
2856 h->next = hhh;
2857 }
2858
2859 else
2860 {
2861 hhh->next = h; /* The rest of the chain follows it */
2862 *pptr = hhh; /* It takes the place of h */
2863 h = hhh; /* It's now the start of this minilist */
2864 }
2865 }
2866 }
2867
2868 /* A host has been chosen to be first at this priority and h now points
2869 to this host. There may be others at the same priority, or others at a
2870 different priority. Before we leave this host, we need to put back a sort
2871 key of the traditional MX kind, in case this host is multihomed, because
2872 the sort key is used for ordering the multiple IP addresses. We do not need
2873 to ensure that these new sort keys actually reflect the order of the hosts,
2874 however. */
2875
2876 h->sort_key = h->mx * 1000 + random_number(500);
2877 } /* Move on to the next host */
2878 }
2879
2880/* Now we have to ensure addresses exist for all the hosts. We have ensured
2881above that the names in the host items are all unique. The addresses may have
2882been returned in the additional data section of the DNS query. Because it is
2883more expensive to scan the returned DNS records (because you have to expand the
2884names) we do a single scan over them, and multiple scans of the chain of host
2885items (which is typically only 3 or 4 long anyway.) Add extra host items for
2886multi-homed hosts. */
2887
2888for (rr = dns_next_rr(&dnsa, &dnss, RESET_ADDITIONAL);
2889 rr != NULL;
2890 rr = dns_next_rr(&dnsa, &dnss, RESET_NEXT))
2891 {
2892 dns_address *da;
2893 int status = hstatus_unknown;
2894 int why = hwhy_unknown;
2895 int randoffset;
2896
2897 if (rr->type != T_A
2898 #if HAVE_IPV6
2899 && rr->type != T_AAAA
2900 #ifdef SUPPORT_A6
2901 && rr->type != T_A6
2902 #endif
2903 #endif
2904 ) continue;
2905
2906 /* Find the first host that matches this record's name. If there isn't
2907 one, move on to the next RR. */
2908
2909 for (h = host; h != last->next; h = h->next)
2910 { if (strcmpic(h->name, rr->name) == 0) break; }
2911 if (h == last->next) continue;
2912
2913 /* For IPv4 addresses, add 500 to the random part of the sort key, to ensure
2914 they sort after IPv6 addresses. */
2915
2916 randoffset = (rr->type == T_A)? 500 : 0;
2917
2918 /* Get the list of textual addresses for this RR. There may be more than one
2919 if it is an A6 RR. Then loop to handle multiple addresses from an A6 record.
2920 If there are none, nothing will get done - the record is ignored. */
2921
2922 for (da = dns_address_from_rr(&dnsa, rr); da != NULL; da = da->next)
2923 {
2924 /* Set status for an ignorable host. */
2925
2926 #ifndef STAND_ALONE
2927 if (ignore_target_hosts != NULL &&
2928 verify_check_this_host(&ignore_target_hosts, NULL, h->name,
2929 da->address, NULL) == OK)
2930 {
2931 DEBUG(D_host_lookup)
2932 debug_printf("ignored host %s [%s]\n", h->name, da->address);
2933 status = hstatus_unusable;
2934 why = hwhy_ignored;
2935 }
2936 #endif
2937
2938 /* If the address is already set for this host, it may be that
2939 we just have a duplicate DNS record. Alternatively, this may be
2940 a multi-homed host. Search all items with the same host name
2941 (they will all be together) and if this address is found, skip
2942 to the next RR. */
2943
2944 if (h->address != NULL)
2945 {
2946 int new_sort_key;
2947 host_item *thishostlast;
2948 host_item *hh = h;
2949
2950 do
2951 {
2952 if (hh->address != NULL && Ustrcmp(CS da->address, hh->address) == 0)
2953 goto DNS_NEXT_RR; /* Need goto to escape from inner loop */
2954 thishostlast = hh;
2955 hh = hh->next;
2956 }
2957 while (hh != last->next && strcmpic(hh->name, rr->name) == 0);
2958
2959 /* We have a multi-homed host, since we have a new address for
2960 an existing name. Create a copy of the current item, and give it
2961 the new address. RRs can be in arbitrary order, but one is supposed
2962 to randomize the addresses of multi-homed hosts, so compute a new
2963 sorting key and do that. [Latest SMTP RFC says not to randomize multi-
2964 homed hosts, but to rely on the resolver. I'm not happy about that -
2965 caching in the resolver will not rotate as often as the name server
2966 does.] */
2967
2968 new_sort_key = h->mx * 1000 + random_number(500) + randoffset;
2969 hh = store_get(sizeof(host_item));
2970
2971 /* New address goes first: insert the new block after the first one
2972 (so as not to disturb the original pointer) but put the new address
2973 in the original block. */
2974
2975 if (new_sort_key < h->sort_key)
2976 {
2977 *hh = *h; /* Note: copies the port */
2978 h->next = hh;
2979 h->address = da->address;
2980 h->sort_key = new_sort_key;
2981 h->status = status;
2982 h->why = why;
2983 }
2984
2985 /* Otherwise scan down the addresses for this host to find the
2986 one to insert after. */
2987
2988 else
2989 {
2990 while (h != thishostlast)
2991 {
2992 if (new_sort_key < h->next->sort_key) break;
2993 h = h->next;
2994 }
2995 *hh = *h; /* Note: copies the port */
2996 h->next = hh;
2997 hh->address = da->address;
2998 hh->sort_key = new_sort_key;
2999 hh->status = status;
3000 hh->why = why;
3001 }
3002
3003 if (h == last) last = hh; /* Inserted after last */
3004 }
3005
3006 /* The existing item doesn't have its address set yet, so just set it.
3007 Ensure that an IPv4 address gets its sort key incremented in case an IPv6
3008 address is found later. */
3009
3010 else
3011 {
3012 h->address = da->address; /* Port should be set already */
3013 h->status = status;
3014 h->why = why;
3015 h->sort_key += randoffset;
3016 }
3017 } /* Loop for addresses extracted from one RR */
3018
3019 /* Carry on to the next RR. It would be nice to be able to be able to stop
3020 when every host on the list has an address, but we can't be sure there won't
3021 be an additional address for a multi-homed host further down the list, so
3022 we have to continue to the end. */
3023
3024 DNS_NEXT_RR: continue;
3025 }
3026
3027/* Set the default yield to failure */
3028
3029yield = HOST_FIND_FAILED;
3030
3031/* If we haven't found all the addresses in the additional section, we
3032need to search for A or AAAA records explicitly. The names shouldn't point to
3033CNAMES, but we use the general lookup function that handles them, just
3034in case. If any lookup gives a soft error, change the default yield.
3035
3036For these DNS lookups, we must disable qualify_single and search_parents;
3037otherwise invalid host names obtained from MX or SRV records can cause trouble
3038if they happen to match something local. */
3039
3040dns_init(FALSE, FALSE);
3041
3042for (h = host; h != last->next; h = h->next)
3043 {
3044 if (h->address != NULL || h->status == hstatus_unusable) continue;
3045 rc = set_address_from_dns(h, &last, ignore_target_hosts, allow_mx_to_ip, NULL);
3046 if (rc != HOST_FOUND)
3047 {
3048 h->status = hstatus_unusable;
3049 if (rc == HOST_FIND_AGAIN)
3050 {
3051 yield = rc;
3052 h->why = hwhy_deferred;
3053 }
3054 else
3055 h->why = (rc == HOST_IGNORED)? hwhy_ignored : hwhy_failed;
3056 }
3057 }
3058
3059/* Scan the list for any hosts that are marked unusable because they have
3060been explicitly ignored, and remove them from the list, as if they did not
3061exist. If we end up with just a single, ignored host, flatten its fields as if
3062nothing was found. */
3063
3064if (ignore_target_hosts != NULL)
3065 {
3066 host_item *prev = NULL;
3067 for (h = host; h != last->next; h = h->next)
3068 {
3069 REDO:
3070 if (h->why != hwhy_ignored) /* Non ignored host, just continue */
3071 prev = h;
3072 else if (prev == NULL) /* First host is ignored */
3073 {
3074 if (h != last) /* First is not last */
3075 {
3076 if (h->next == last) last = h; /* Overwrite it with next */
3077 *h = *(h->next); /* and reprocess it. */
3078 goto REDO; /* C should have redo, like Perl */
3079 }
3080 }
3081 else /* Ignored host is not first - */
3082 { /* cut it out */
3083 prev->next = h->next;
3084 if (h == last) last = prev;
3085 }
3086 }
3087
3088 if (host->why == hwhy_ignored) host->address = NULL;
3089 }
3090
3091/* There is still one complication in the case of IPv6. Although the code above
3092arranges that IPv6 addresses take precedence over IPv4 addresses for multihomed
3093hosts, it doesn't do this for addresses that apply to different hosts with the
3094same MX precedence, because the sorting on MX precedence happens first. So we
3095have to make another pass to check for this case. We ensure that, within a
3096single MX preference value, IPv6 addresses come first. This can separate the
3097addresses of a multihomed host, but that should not matter. */
3098
3099#if HAVE_IPV6
3100if (h != last)
3101 {
3102 for (h = host; h != last; h = h->next)
3103 {
3104 host_item temp;
3105 host_item *next = h->next;
3106 if (h->mx != next->mx || /* If next is different MX value */
3107 (h->sort_key % 1000) < 500 || /* OR this one is IPv6 */
3108 (next->sort_key % 1000) >= 500) /* OR next is IPv4 */
3109 continue; /* move on to next */
3110 temp = *h;
3111 temp.next = next->next;
3112 *h = *next;
3113 h->next = next;
3114 *next = temp;
3115 }
3116 }
3117#endif
3118
3119/* When running in the test harness, we want the hosts always to be in the same
3120order so that the debugging output is the same and can be compared. Having a
3121fixed set of "random" numbers doesn't actually achieve this, because the RRs
3122come back from the resolver in a random order, so the non-random random numbers
3123get used in a different order. We therefore have to sort the hosts that have
3124the same MX values. We chose do to this by their name and then by IP address.
3125The fact that the sort is slow matters not - this is testing only! */
3126
3127if (running_in_test_harness)
3128 {
3129 BOOL done;
3130 do
3131 {
3132 done = TRUE;
3133 for (h = host; h != last; h = h->next)
3134 {
3135 int c = Ustrcmp(h->name, h->next->name);
3136 if (c == 0) c = Ustrcmp(h->address, h->next->address);
3137 if (h->mx == h->next->mx && c > 0)
3138 {
3139 host_item *next = h->next;
3140 host_item temp = *h;
3141 temp.next = next->next;
3142 *h = *next;
3143 h->next = next;
3144 *next = temp;
3145 done = FALSE;
3146 }
3147 }
3148 }
3149 while (!done);
3150 }
3151
3152/* Remove any duplicate IP addresses and then scan the list of hosts for any
3153whose IP addresses are on the local host. If any are found, all hosts with the
3154same or higher MX values are removed. However, if the local host has the lowest
3155numbered MX, then HOST_FOUND_LOCAL is returned. Otherwise, if at least one host
3156with an IP address is on the list, HOST_FOUND is returned. Otherwise,
3157HOST_FIND_FAILED is returned, but in this case do not update the yield, as it
3158might have been set to HOST_FIND_AGAIN just above here. If not, it will already
3159be HOST_FIND_FAILED. */
3160
3161host_remove_duplicates(host, &last);
3162rc = host_scan_for_local_hosts(host, &last, removed);
3163if (rc != HOST_FIND_FAILED) yield = rc;
3164
3165DEBUG(D_host_lookup)
3166 {
3167 if (fully_qualified_name != NULL)
3168 debug_printf("fully qualified name = %s\n", *fully_qualified_name);
3169 debug_printf("host_find_bydns yield = %s (%d); returned hosts:\n",
3170 (yield == HOST_FOUND)? "HOST_FOUND" :
3171 (yield == HOST_FOUND_LOCAL)? "HOST_FOUND_LOCAL" :
3172 (yield == HOST_FIND_AGAIN)? "HOST_FIND_AGAIN" :
3173 (yield == HOST_FIND_FAILED)? "HOST_FIND_FAILED" : "?",
3174 yield);
3175 for (h = host; h != last->next; h = h->next)
3176 {
3177 debug_printf(" %s %s MX=%d ", h->name,
3178 (h->address == NULL)? US"<null>" : h->address, h->mx);
3179 if (h->port != PORT_NONE) debug_printf("port=%d ", h->port);
3180 if (h->status >= hstatus_unusable) debug_printf("*");
3181 debug_printf("\n");
3182 }
3183 }
3184
3185return yield;
3186}
3187
3188
3189
3190
3191/*************************************************
3192**************************************************
3193* Stand-alone test program *
3194**************************************************
3195*************************************************/
3196
3197#ifdef STAND_ALONE
3198
059ec3d9
PH
3199int main(int argc, char **cargv)
3200{
3201host_item h;
3202int whichrrs = HOST_FIND_BY_MX | HOST_FIND_BY_A;
3203BOOL byname = FALSE;
3204BOOL qualify_single = TRUE;
3205BOOL search_parents = FALSE;
3206uschar **argv = USS cargv;
3207uschar buffer[256];
3208
3209primary_hostname = US"";
3210store_pool = POOL_MAIN;
3211debug_selector = D_host_lookup|D_interface;
3212debug_file = stdout;
3213debug_fd = fileno(debug_file);
3214
3215printf("Exim stand-alone host functions test\n");
3216
3217host_find_interfaces();
3218debug_selector = D_host_lookup | D_dns;
3219
3220if (argc > 1) primary_hostname = argv[1];
3221
3222/* So that debug level changes can be done first */
3223
3224dns_init(qualify_single, search_parents);
3225
3226printf("Testing host lookup\n");
3227printf("> ");
3228while (Ufgets(buffer, 256, stdin) != NULL)
3229 {
3230 int rc;
3231 int len = Ustrlen(buffer);
3232 uschar *fully_qualified_name;
3233
3234 while (len > 0 && isspace(buffer[len-1])) len--;
3235 buffer[len] = 0;
3236
3237 if (Ustrcmp(buffer, "q") == 0) break;
3238
3239 if (Ustrcmp(buffer, "byname") == 0) byname = TRUE;
3240 else if (Ustrcmp(buffer, "no_byname") == 0) byname = FALSE;
3241 else if (Ustrcmp(buffer, "a_only") == 0) whichrrs = HOST_FIND_BY_A;
3242 else if (Ustrcmp(buffer, "mx_only") == 0) whichrrs = HOST_FIND_BY_MX;
3243 else if (Ustrcmp(buffer, "srv_only") == 0) whichrrs = HOST_FIND_BY_SRV;
3244 else if (Ustrcmp(buffer, "srv+a") == 0)
3245 whichrrs = HOST_FIND_BY_SRV | HOST_FIND_BY_A;
3246 else if (Ustrcmp(buffer, "srv+mx") == 0)
3247 whichrrs = HOST_FIND_BY_SRV | HOST_FIND_BY_MX;
3248 else if (Ustrcmp(buffer, "srv+mx+a") == 0)
3249 whichrrs = HOST_FIND_BY_SRV | HOST_FIND_BY_MX | HOST_FIND_BY_A;
3250 else if (Ustrcmp(buffer, "qualify_single") == 0) qualify_single = TRUE;
3251 else if (Ustrcmp(buffer, "no_qualify_single") == 0) qualify_single = FALSE;
3252 else if (Ustrcmp(buffer, "search_parents") == 0) search_parents = TRUE;
3253 else if (Ustrcmp(buffer, "no_search_parents") == 0) search_parents = FALSE;
e7726cbf
PH
3254 else if (Ustrcmp(buffer, "test_harness") == 0)
3255 running_in_test_harness = !running_in_test_harness;
3256 else if (Ustrcmp(buffer, "res_debug") == 0)
3257 {
3258 _res.options ^= RES_DEBUG;
3259 }
059ec3d9
PH
3260 else if (Ustrncmp(buffer, "retrans", 7) == 0)
3261 {
ff790e47 3262 (void)sscanf(CS(buffer+8), "%d", &dns_retrans);
059ec3d9
PH
3263 _res.retrans = dns_retrans;
3264 }
3265 else if (Ustrncmp(buffer, "retry", 5) == 0)
3266 {
ff790e47 3267 (void)sscanf(CS(buffer+6), "%d", &dns_retry);
059ec3d9
PH
3268 _res.retry = dns_retry;
3269 }
059ec3d9
PH
3270 else
3271 {
3272 int flags = whichrrs;
3273
3274 h.name = buffer;
3275 h.next = NULL;
3276 h.mx = MX_NONE;
3277 h.port = PORT_NONE;
3278 h.status = hstatus_unknown;
3279 h.why = hwhy_unknown;
3280 h.address = NULL;
3281
3282 if (qualify_single) flags |= HOST_FIND_QUALIFY_SINGLE;
3283 if (search_parents) flags |= HOST_FIND_SEARCH_PARENTS;
3284
3285 rc = byname?
3286 host_find_byname(&h, NULL, &fully_qualified_name, TRUE)
3287 :
3288 host_find_bydns(&h, NULL, flags, US"smtp", NULL, NULL,
3289 &fully_qualified_name, NULL);
3290
3291 if (rc == HOST_FIND_FAILED) printf("Failed\n");
3292 else if (rc == HOST_FIND_AGAIN) printf("Again\n");
3293 else if (rc == HOST_FOUND_LOCAL) printf("Local\n");
3294 }
3295
3296 printf("\n> ");
3297 }
3298
3299printf("Testing host_aton\n");
3300printf("> ");
3301while (Ufgets(buffer, 256, stdin) != NULL)
3302 {
3303 int i;
3304 int x[4];
3305 int len = Ustrlen(buffer);
3306
3307 while (len > 0 && isspace(buffer[len-1])) len--;
3308 buffer[len] = 0;
3309
3310 if (Ustrcmp(buffer, "q") == 0) break;
3311
3312 len = host_aton(buffer, x);
3313 printf("length = %d ", len);
3314 for (i = 0; i < len; i++)
3315 {
3316 printf("%04x ", (x[i] >> 16) & 0xffff);
3317 printf("%04x ", x[i] & 0xffff);
3318 }
3319 printf("\n> ");
3320 }
3321
3322printf("\n");
3323
3324printf("Testing host_name_lookup\n");
3325printf("> ");
3326while (Ufgets(buffer, 256, stdin) != NULL)
3327 {
3328 int len = Ustrlen(buffer);
3329 while (len > 0 && isspace(buffer[len-1])) len--;
3330 buffer[len] = 0;
3331 if (Ustrcmp(buffer, "q") == 0) break;
3332 sender_host_address = buffer;
3333 sender_host_name = NULL;
3334 sender_host_aliases = NULL;
3335 host_lookup_msg = US"";
3336 host_lookup_failed = FALSE;
3337 if (host_name_lookup() == FAIL) /* Debug causes printing */
3338 printf("Lookup failed:%s\n", host_lookup_msg);
3339 printf("\n> ");
3340 }
3341
3342printf("\n");
3343
3344return 0;
3345}
3346#endif /* STAND_ALONE */
3347
3348/* End of host.c */