dns.c revision 1.11
1/*
2 * services/cache/dns.c - Cache services for DNS using msg and rrset caches.
3 *
4 * Copyright (c) 2007, NLnet Labs. All rights reserved.
5 *
6 * This software is open source.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 *
12 * Redistributions of source code must retain the above copyright notice,
13 * this list of conditions and the following disclaimer.
14 *
15 * Redistributions in binary form must reproduce the above copyright notice,
16 * this list of conditions and the following disclaimer in the documentation
17 * and/or other materials provided with the distribution.
18 *
19 * Neither the name of the NLNET LABS nor the names of its contributors may
20 * be used to endorse or promote products derived from this software without
21 * specific prior written permission.
22 *
23 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
24 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
25 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
26 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
27 * HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
28 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
29 * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
30 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
31 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
32 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
33 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34 */
35
36/**
37 * \file
38 *
39 * This file contains the DNS cache.
40 */
41#include "config.h"
42#include "iterator/iter_delegpt.h"
43#include "validator/val_nsec.h"
44#include "validator/val_utils.h"
45#include "services/cache/dns.h"
46#include "services/cache/rrset.h"
47#include "util/data/msgreply.h"
48#include "util/data/packed_rrset.h"
49#include "util/data/dname.h"
50#include "util/module.h"
51#include "util/net_help.h"
52#include "util/regional.h"
53#include "util/config_file.h"
54#include "sldns/sbuffer.h"
55
56/** store rrsets in the rrset cache.
57 * @param env: module environment with caches.
58 * @param rep: contains list of rrsets to store.
59 * @param now: current time.
60 * @param leeway: during prefetch how much leeway to update TTLs.
61 * 	This makes rrsets (other than type NS) timeout sooner so they get
62 * 	updated with a new full TTL.
63 * 	Type NS does not get this, because it must not be refreshed from the
64 * 	child domain, but keep counting down properly.
65 * @param pside: if from parentside discovered NS, so that its NS is okay
66 * 	in a prefetch situation to be updated (without becoming sticky).
67 * @param qrep: update rrsets here if cache is better
68 * @param region: for qrep allocs.
69 */
70static void
71store_rrsets(struct module_env* env, struct reply_info* rep, time_t now,
72	time_t leeway, int pside, struct reply_info* qrep,
73	struct regional* region)
74{
75        size_t i;
76        /* see if rrset already exists in cache, if not insert it. */
77        for(i=0; i<rep->rrset_count; i++) {
78                rep->ref[i].key = rep->rrsets[i];
79                rep->ref[i].id = rep->rrsets[i]->id;
80		/* update ref if it was in the cache */
81		switch(rrset_cache_update(env->rrset_cache, &rep->ref[i],
82                        env->alloc, now + ((ntohs(rep->ref[i].key->rk.type)==
83			LDNS_RR_TYPE_NS && !pside)?0:leeway))) {
84		case 0: /* ref unchanged, item inserted */
85			break;
86		case 2: /* ref updated, cache is superior */
87			if(region) {
88				struct ub_packed_rrset_key* ck;
89				lock_rw_rdlock(&rep->ref[i].key->entry.lock);
90				/* if deleted rrset, do not copy it */
91				if(rep->ref[i].key->id == 0)
92					ck = NULL;
93				else 	ck = packed_rrset_copy_region(
94					rep->ref[i].key, region, now);
95				lock_rw_unlock(&rep->ref[i].key->entry.lock);
96				if(ck) {
97					/* use cached copy if memory allows */
98					qrep->rrsets[i] = ck;
99				}
100			}
101			/* no break: also copy key item */
102			/* the line below is matched by gcc regex and silences
103			 * the fallthrough warning */
104			/* fallthrough */
105		case 1: /* ref updated, item inserted */
106                        rep->rrsets[i] = rep->ref[i].key;
107		}
108        }
109}
110
111/** delete message from message cache */
112void
113msg_cache_remove(struct module_env* env, uint8_t* qname, size_t qnamelen,
114	uint16_t qtype, uint16_t qclass, uint16_t flags)
115{
116	struct query_info k;
117	hashvalue_type h;
118
119	k.qname = qname;
120	k.qname_len = qnamelen;
121	k.qtype = qtype;
122	k.qclass = qclass;
123	k.local_alias = NULL;
124	h = query_info_hash(&k, flags);
125	slabhash_remove(env->msg_cache, h, &k);
126}
127
128/** remove servfail msg cache entry */
129static void
130msg_del_servfail(struct module_env* env, struct query_info* qinfo,
131	uint32_t flags)
132{
133	struct msgreply_entry* e;
134	/* see if the entry is servfail, and then remove it, so that
135	 * lookups move from the cacheresponse stage to the recursionresponse
136	 * stage */
137	e = msg_cache_lookup(env, qinfo->qname, qinfo->qname_len,
138		qinfo->qtype, qinfo->qclass, flags, 0, 0);
139	if(!e) return;
140	/* we don't check for the ttl here, also expired servfail entries
141	 * are removed.  If the user uses serve-expired, they would still be
142	 * used to answer from cache */
143	if(FLAGS_GET_RCODE(((struct reply_info*)e->entry.data)->flags)
144		!= LDNS_RCODE_SERVFAIL) {
145		lock_rw_unlock(&e->entry.lock);
146		return;
147	}
148	lock_rw_unlock(&e->entry.lock);
149	msg_cache_remove(env, qinfo->qname, qinfo->qname_len, qinfo->qtype,
150		qinfo->qclass, flags);
151}
152
153void
154dns_cache_store_msg(struct module_env* env, struct query_info* qinfo,
155	hashvalue_type hash, struct reply_info* rep, time_t leeway, int pside,
156	struct reply_info* qrep, uint32_t flags, struct regional* region)
157{
158	struct msgreply_entry* e;
159	time_t ttl = rep->ttl;
160	size_t i;
161
162	/* store RRsets */
163        for(i=0; i<rep->rrset_count; i++) {
164		rep->ref[i].key = rep->rrsets[i];
165		rep->ref[i].id = rep->rrsets[i]->id;
166	}
167
168	/* there was a reply_info_sortref(rep) here but it seems to be
169	 * unnecessary, because the cache gets locked per rrset. */
170	reply_info_set_ttls(rep, *env->now);
171	store_rrsets(env, rep, *env->now, leeway, pside, qrep, region);
172	if(ttl == 0 && !(flags & DNSCACHE_STORE_ZEROTTL)) {
173		/* we do not store the message, but we did store the RRs,
174		 * which could be useful for delegation information */
175		verbose(VERB_ALGO, "TTL 0: dropped msg from cache");
176		free(rep);
177		/* if the message is SERVFAIL in cache, remove that SERVFAIL,
178		 * so that the TTL 0 response can be returned for future
179		 * responses (i.e. don't get answered by the servfail from
180		 * cache, but instead go to recursion to get this TTL0
181		 * response). */
182		msg_del_servfail(env, qinfo, flags);
183		return;
184	}
185
186	/* store msg in the cache */
187	reply_info_sortref(rep);
188	if(!(e = query_info_entrysetup(qinfo, rep, hash))) {
189		log_err("store_msg: malloc failed");
190		return;
191	}
192	slabhash_insert(env->msg_cache, hash, &e->entry, rep, env->alloc);
193}
194
195/** find closest NS or DNAME and returns the rrset (locked) */
196static struct ub_packed_rrset_key*
197find_closest_of_type(struct module_env* env, uint8_t* qname, size_t qnamelen,
198	uint16_t qclass, time_t now, uint16_t searchtype, int stripfront)
199{
200	struct ub_packed_rrset_key *rrset;
201	uint8_t lablen;
202
203	if(stripfront) {
204		/* strip off so that DNAMEs have strict subdomain match */
205		lablen = *qname;
206		qname += lablen + 1;
207		qnamelen -= lablen + 1;
208	}
209
210	/* snip off front part of qname until the type is found */
211	while(qnamelen > 0) {
212		if((rrset = rrset_cache_lookup(env->rrset_cache, qname,
213			qnamelen, searchtype, qclass, 0, now, 0)))
214			return rrset;
215
216		/* snip off front label */
217		lablen = *qname;
218		qname += lablen + 1;
219		qnamelen -= lablen + 1;
220	}
221	return NULL;
222}
223
224/** add addr to additional section */
225static void
226addr_to_additional(struct ub_packed_rrset_key* rrset, struct regional* region,
227	struct dns_msg* msg, time_t now)
228{
229	if((msg->rep->rrsets[msg->rep->rrset_count] =
230		packed_rrset_copy_region(rrset, region, now))) {
231		msg->rep->ar_numrrsets++;
232		msg->rep->rrset_count++;
233	}
234}
235
236/** lookup message in message cache */
237struct msgreply_entry*
238msg_cache_lookup(struct module_env* env, uint8_t* qname, size_t qnamelen,
239	uint16_t qtype, uint16_t qclass, uint16_t flags, time_t now, int wr)
240{
241	struct lruhash_entry* e;
242	struct query_info k;
243	hashvalue_type h;
244
245	k.qname = qname;
246	k.qname_len = qnamelen;
247	k.qtype = qtype;
248	k.qclass = qclass;
249	k.local_alias = NULL;
250	h = query_info_hash(&k, flags);
251	e = slabhash_lookup(env->msg_cache, h, &k, wr);
252
253	if(!e) return NULL;
254	if( now > ((struct reply_info*)e->data)->ttl ) {
255		lock_rw_unlock(&e->lock);
256		return NULL;
257	}
258	return (struct msgreply_entry*)e->key;
259}
260
261/** find and add A and AAAA records for nameservers in delegpt */
262static int
263find_add_addrs(struct module_env* env, uint16_t qclass,
264	struct regional* region, struct delegpt* dp, time_t now,
265	struct dns_msg** msg)
266{
267	struct delegpt_ns* ns;
268	struct msgreply_entry* neg;
269	struct ub_packed_rrset_key* akey;
270	for(ns = dp->nslist; ns; ns = ns->next) {
271		akey = rrset_cache_lookup(env->rrset_cache, ns->name,
272			ns->namelen, LDNS_RR_TYPE_A, qclass, 0, now, 0);
273		if(akey) {
274			if(!delegpt_add_rrset_A(dp, region, akey, 0)) {
275				lock_rw_unlock(&akey->entry.lock);
276				return 0;
277			}
278			if(msg)
279				addr_to_additional(akey, region, *msg, now);
280			lock_rw_unlock(&akey->entry.lock);
281		} else {
282			/* BIT_CD on false because delegpt lookup does
283			 * not use dns64 translation */
284			neg = msg_cache_lookup(env, ns->name, ns->namelen,
285				LDNS_RR_TYPE_A, qclass, 0, now, 0);
286			if(neg) {
287				delegpt_add_neg_msg(dp, neg);
288				lock_rw_unlock(&neg->entry.lock);
289			}
290		}
291		akey = rrset_cache_lookup(env->rrset_cache, ns->name,
292			ns->namelen, LDNS_RR_TYPE_AAAA, qclass, 0, now, 0);
293		if(akey) {
294			if(!delegpt_add_rrset_AAAA(dp, region, akey, 0)) {
295				lock_rw_unlock(&akey->entry.lock);
296				return 0;
297			}
298			if(msg)
299				addr_to_additional(akey, region, *msg, now);
300			lock_rw_unlock(&akey->entry.lock);
301		} else {
302			/* BIT_CD on false because delegpt lookup does
303			 * not use dns64 translation */
304			neg = msg_cache_lookup(env, ns->name, ns->namelen,
305				LDNS_RR_TYPE_AAAA, qclass, 0, now, 0);
306			if(neg) {
307				delegpt_add_neg_msg(dp, neg);
308				lock_rw_unlock(&neg->entry.lock);
309			}
310		}
311	}
312	return 1;
313}
314
315/** find and add A and AAAA records for missing nameservers in delegpt */
316int
317cache_fill_missing(struct module_env* env, uint16_t qclass,
318	struct regional* region, struct delegpt* dp)
319{
320	struct delegpt_ns* ns;
321	struct msgreply_entry* neg;
322	struct ub_packed_rrset_key* akey;
323	time_t now = *env->now;
324	for(ns = dp->nslist; ns; ns = ns->next) {
325		akey = rrset_cache_lookup(env->rrset_cache, ns->name,
326			ns->namelen, LDNS_RR_TYPE_A, qclass, 0, now, 0);
327		if(akey) {
328			if(!delegpt_add_rrset_A(dp, region, akey, ns->lame)) {
329				lock_rw_unlock(&akey->entry.lock);
330				return 0;
331			}
332			log_nametypeclass(VERB_ALGO, "found in cache",
333				ns->name, LDNS_RR_TYPE_A, qclass);
334			lock_rw_unlock(&akey->entry.lock);
335		} else {
336			/* BIT_CD on false because delegpt lookup does
337			 * not use dns64 translation */
338			neg = msg_cache_lookup(env, ns->name, ns->namelen,
339				LDNS_RR_TYPE_A, qclass, 0, now, 0);
340			if(neg) {
341				delegpt_add_neg_msg(dp, neg);
342				lock_rw_unlock(&neg->entry.lock);
343			}
344		}
345		akey = rrset_cache_lookup(env->rrset_cache, ns->name,
346			ns->namelen, LDNS_RR_TYPE_AAAA, qclass, 0, now, 0);
347		if(akey) {
348			if(!delegpt_add_rrset_AAAA(dp, region, akey, ns->lame)) {
349				lock_rw_unlock(&akey->entry.lock);
350				return 0;
351			}
352			log_nametypeclass(VERB_ALGO, "found in cache",
353				ns->name, LDNS_RR_TYPE_AAAA, qclass);
354			lock_rw_unlock(&akey->entry.lock);
355		} else {
356			/* BIT_CD on false because delegpt lookup does
357			 * not use dns64 translation */
358			neg = msg_cache_lookup(env, ns->name, ns->namelen,
359				LDNS_RR_TYPE_AAAA, qclass, 0, now, 0);
360			if(neg) {
361				delegpt_add_neg_msg(dp, neg);
362				lock_rw_unlock(&neg->entry.lock);
363			}
364		}
365	}
366	return 1;
367}
368
369/** find and add DS or NSEC to delegation msg */
370static void
371find_add_ds(struct module_env* env, struct regional* region,
372	struct dns_msg* msg, struct delegpt* dp, time_t now)
373{
374	/* Lookup the DS or NSEC at the delegation point. */
375	struct ub_packed_rrset_key* rrset = rrset_cache_lookup(
376		env->rrset_cache, dp->name, dp->namelen, LDNS_RR_TYPE_DS,
377		msg->qinfo.qclass, 0, now, 0);
378	if(!rrset) {
379		/* NOTE: this won't work for alternate NSEC schemes
380		 *	(opt-in, NSEC3) */
381		rrset = rrset_cache_lookup(env->rrset_cache, dp->name,
382			dp->namelen, LDNS_RR_TYPE_NSEC, msg->qinfo.qclass,
383			0, now, 0);
384		/* Note: the PACKED_RRSET_NSEC_AT_APEX flag is not used.
385		 * since this is a referral, we need the NSEC at the parent
386		 * side of the zone cut, not the NSEC at apex side. */
387		if(rrset && nsec_has_type(rrset, LDNS_RR_TYPE_DS)) {
388			lock_rw_unlock(&rrset->entry.lock);
389			rrset = NULL; /* discard wrong NSEC */
390		}
391	}
392	if(rrset) {
393		/* add it to auth section. This is the second rrset. */
394		if((msg->rep->rrsets[msg->rep->rrset_count] =
395			packed_rrset_copy_region(rrset, region, now))) {
396			msg->rep->ns_numrrsets++;
397			msg->rep->rrset_count++;
398		}
399		lock_rw_unlock(&rrset->entry.lock);
400	}
401}
402
403struct dns_msg*
404dns_msg_create(uint8_t* qname, size_t qnamelen, uint16_t qtype,
405	uint16_t qclass, struct regional* region, size_t capacity)
406{
407	struct dns_msg* msg = (struct dns_msg*)regional_alloc(region,
408		sizeof(struct dns_msg));
409	if(!msg)
410		return NULL;
411	msg->qinfo.qname = regional_alloc_init(region, qname, qnamelen);
412	if(!msg->qinfo.qname)
413		return NULL;
414	msg->qinfo.qname_len = qnamelen;
415	msg->qinfo.qtype = qtype;
416	msg->qinfo.qclass = qclass;
417	msg->qinfo.local_alias = NULL;
418	/* non-packed reply_info, because it needs to grow the array */
419	msg->rep = (struct reply_info*)regional_alloc_zero(region,
420		sizeof(struct reply_info)-sizeof(struct rrset_ref));
421	if(!msg->rep)
422		return NULL;
423	if(capacity > RR_COUNT_MAX)
424		return NULL; /* integer overflow protection */
425	msg->rep->flags = BIT_QR; /* with QR, no AA */
426	msg->rep->qdcount = 1;
427	msg->rep->rrsets = (struct ub_packed_rrset_key**)
428		regional_alloc(region,
429		capacity*sizeof(struct ub_packed_rrset_key*));
430	if(!msg->rep->rrsets)
431		return NULL;
432	return msg;
433}
434
435int
436dns_msg_authadd(struct dns_msg* msg, struct regional* region,
437	struct ub_packed_rrset_key* rrset, time_t now)
438{
439	if(!(msg->rep->rrsets[msg->rep->rrset_count++] =
440		packed_rrset_copy_region(rrset, region, now)))
441		return 0;
442	msg->rep->ns_numrrsets++;
443	return 1;
444}
445
446int
447dns_msg_ansadd(struct dns_msg* msg, struct regional* region,
448	struct ub_packed_rrset_key* rrset, time_t now)
449{
450	if(!(msg->rep->rrsets[msg->rep->rrset_count++] =
451		packed_rrset_copy_region(rrset, region, now)))
452		return 0;
453	msg->rep->an_numrrsets++;
454	return 1;
455}
456
457struct delegpt*
458dns_cache_find_delegation(struct module_env* env, uint8_t* qname,
459	size_t qnamelen, uint16_t qtype, uint16_t qclass,
460	struct regional* region, struct dns_msg** msg, time_t now)
461{
462	/* try to find closest NS rrset */
463	struct ub_packed_rrset_key* nskey;
464	struct packed_rrset_data* nsdata;
465	struct delegpt* dp;
466
467	nskey = find_closest_of_type(env, qname, qnamelen, qclass, now,
468		LDNS_RR_TYPE_NS, 0);
469	if(!nskey) /* hope the caller has hints to prime or something */
470		return NULL;
471	nsdata = (struct packed_rrset_data*)nskey->entry.data;
472	/* got the NS key, create delegation point */
473	dp = delegpt_create(region);
474	if(!dp || !delegpt_set_name(dp, region, nskey->rk.dname)) {
475		lock_rw_unlock(&nskey->entry.lock);
476		log_err("find_delegation: out of memory");
477		return NULL;
478	}
479	/* create referral message */
480	if(msg) {
481		/* allocate the array to as much as we could need:
482		 *	NS rrset + DS/NSEC rrset +
483		 *	A rrset for every NS RR
484		 *	AAAA rrset for every NS RR
485		 */
486		*msg = dns_msg_create(qname, qnamelen, qtype, qclass, region,
487			2 + nsdata->count*2);
488		if(!*msg || !dns_msg_authadd(*msg, region, nskey, now)) {
489			lock_rw_unlock(&nskey->entry.lock);
490			log_err("find_delegation: out of memory");
491			return NULL;
492		}
493	}
494	if(!delegpt_rrset_add_ns(dp, region, nskey, 0))
495		log_err("find_delegation: addns out of memory");
496	lock_rw_unlock(&nskey->entry.lock); /* first unlock before next lookup*/
497	/* find and add DS/NSEC (if any) */
498	if(msg)
499		find_add_ds(env, region, *msg, dp, now);
500	/* find and add A entries */
501	if(!find_add_addrs(env, qclass, region, dp, now, msg))
502		log_err("find_delegation: addrs out of memory");
503	return dp;
504}
505
506/** allocate dns_msg from query_info and reply_info */
507static struct dns_msg*
508gen_dns_msg(struct regional* region, struct query_info* q, size_t num)
509{
510	struct dns_msg* msg = (struct dns_msg*)regional_alloc(region,
511		sizeof(struct dns_msg));
512	if(!msg)
513		return NULL;
514	memcpy(&msg->qinfo, q, sizeof(struct query_info));
515	msg->qinfo.qname = regional_alloc_init(region, q->qname, q->qname_len);
516	if(!msg->qinfo.qname)
517		return NULL;
518	/* allocate replyinfo struct and rrset key array separately */
519	msg->rep = (struct reply_info*)regional_alloc(region,
520		sizeof(struct reply_info) - sizeof(struct rrset_ref));
521	if(!msg->rep)
522		return NULL;
523	if(num > RR_COUNT_MAX)
524		return NULL; /* integer overflow protection */
525	msg->rep->rrsets = (struct ub_packed_rrset_key**)
526		regional_alloc(region,
527		num * sizeof(struct ub_packed_rrset_key*));
528	if(!msg->rep->rrsets)
529		return NULL;
530	return msg;
531}
532
533struct dns_msg*
534tomsg(struct module_env* env, struct query_info* q, struct reply_info* r,
535	struct regional* region, time_t now, struct regional* scratch)
536{
537	struct dns_msg* msg;
538	size_t i;
539	if(now > r->ttl)
540		return NULL;
541	msg = gen_dns_msg(region, q, r->rrset_count);
542	if(!msg)
543		return NULL;
544	msg->rep->flags = r->flags;
545	msg->rep->qdcount = r->qdcount;
546	msg->rep->ttl = r->ttl - now;
547	if(r->prefetch_ttl > now)
548		msg->rep->prefetch_ttl = r->prefetch_ttl - now;
549	else	msg->rep->prefetch_ttl = PREFETCH_TTL_CALC(msg->rep->ttl);
550	msg->rep->serve_expired_ttl = msg->rep->ttl + SERVE_EXPIRED_TTL;
551	msg->rep->security = r->security;
552	msg->rep->an_numrrsets = r->an_numrrsets;
553	msg->rep->ns_numrrsets = r->ns_numrrsets;
554	msg->rep->ar_numrrsets = r->ar_numrrsets;
555	msg->rep->rrset_count = r->rrset_count;
556        msg->rep->authoritative = r->authoritative;
557	if(!rrset_array_lock(r->ref, r->rrset_count, now))
558		return NULL;
559	if(r->an_numrrsets > 0 && (r->rrsets[0]->rk.type == htons(
560		LDNS_RR_TYPE_CNAME) || r->rrsets[0]->rk.type == htons(
561		LDNS_RR_TYPE_DNAME)) && !reply_check_cname_chain(q, r)) {
562		/* cname chain is now invalid, reconstruct msg */
563		rrset_array_unlock(r->ref, r->rrset_count);
564		return NULL;
565	}
566	if(r->security == sec_status_secure && !reply_all_rrsets_secure(r)) {
567		/* message rrsets have changed status, revalidate */
568		rrset_array_unlock(r->ref, r->rrset_count);
569		return NULL;
570	}
571	for(i=0; i<msg->rep->rrset_count; i++) {
572		msg->rep->rrsets[i] = packed_rrset_copy_region(r->rrsets[i],
573			region, now);
574		if(!msg->rep->rrsets[i]) {
575			rrset_array_unlock(r->ref, r->rrset_count);
576			return NULL;
577		}
578	}
579	if(env)
580		rrset_array_unlock_touch(env->rrset_cache, scratch, r->ref,
581		r->rrset_count);
582	else
583		rrset_array_unlock(r->ref, r->rrset_count);
584	return msg;
585}
586
587/** synthesize RRset-only response from cached RRset item */
588static struct dns_msg*
589rrset_msg(struct ub_packed_rrset_key* rrset, struct regional* region,
590	time_t now, struct query_info* q)
591{
592	struct dns_msg* msg;
593	struct packed_rrset_data* d = (struct packed_rrset_data*)
594		rrset->entry.data;
595	if(now > d->ttl)
596		return NULL;
597	msg = gen_dns_msg(region, q, 1); /* only the CNAME (or other) RRset */
598	if(!msg)
599		return NULL;
600	msg->rep->flags = BIT_QR; /* reply, no AA, no error */
601        msg->rep->authoritative = 0; /* reply stored in cache can't be authoritative */
602	msg->rep->qdcount = 1;
603	msg->rep->ttl = d->ttl - now;
604	msg->rep->prefetch_ttl = PREFETCH_TTL_CALC(msg->rep->ttl);
605	msg->rep->serve_expired_ttl = msg->rep->ttl + SERVE_EXPIRED_TTL;
606	msg->rep->security = sec_status_unchecked;
607	msg->rep->an_numrrsets = 1;
608	msg->rep->ns_numrrsets = 0;
609	msg->rep->ar_numrrsets = 0;
610	msg->rep->rrset_count = 1;
611	msg->rep->rrsets[0] = packed_rrset_copy_region(rrset, region, now);
612	if(!msg->rep->rrsets[0]) /* copy CNAME */
613		return NULL;
614	return msg;
615}
616
617/** synthesize DNAME+CNAME response from cached DNAME item */
618static struct dns_msg*
619synth_dname_msg(struct ub_packed_rrset_key* rrset, struct regional* region,
620	time_t now, struct query_info* q, enum sec_status* sec_status)
621{
622	struct dns_msg* msg;
623	struct ub_packed_rrset_key* ck;
624	struct packed_rrset_data* newd, *d = (struct packed_rrset_data*)
625		rrset->entry.data;
626	uint8_t* newname, *dtarg = NULL;
627	size_t newlen, dtarglen;
628	if(now > d->ttl)
629		return NULL;
630	/* only allow validated (with DNSSEC) DNAMEs used from cache
631	 * for insecure DNAMEs, query again. */
632	*sec_status = d->security;
633	/* return sec status, so the status of the CNAME can be checked
634	 * by the calling routine. */
635	msg = gen_dns_msg(region, q, 2); /* DNAME + CNAME RRset */
636	if(!msg)
637		return NULL;
638	msg->rep->flags = BIT_QR; /* reply, no AA, no error */
639        msg->rep->authoritative = 0; /* reply stored in cache can't be authoritative */
640	msg->rep->qdcount = 1;
641	msg->rep->ttl = d->ttl - now;
642	msg->rep->prefetch_ttl = PREFETCH_TTL_CALC(msg->rep->ttl);
643	msg->rep->serve_expired_ttl = msg->rep->ttl + SERVE_EXPIRED_TTL;
644	msg->rep->security = sec_status_unchecked;
645	msg->rep->an_numrrsets = 1;
646	msg->rep->ns_numrrsets = 0;
647	msg->rep->ar_numrrsets = 0;
648	msg->rep->rrset_count = 1;
649	msg->rep->rrsets[0] = packed_rrset_copy_region(rrset, region, now);
650	if(!msg->rep->rrsets[0]) /* copy DNAME */
651		return NULL;
652	/* synth CNAME rrset */
653	get_cname_target(rrset, &dtarg, &dtarglen);
654	if(!dtarg)
655		return NULL;
656	newlen = q->qname_len + dtarglen - rrset->rk.dname_len;
657	if(newlen > LDNS_MAX_DOMAINLEN) {
658		msg->rep->flags |= LDNS_RCODE_YXDOMAIN;
659		return msg;
660	}
661	newname = (uint8_t*)regional_alloc(region, newlen);
662	if(!newname)
663		return NULL;
664	/* new name is concatenation of qname front (without DNAME owner)
665	 * and DNAME target name */
666	memcpy(newname, q->qname, q->qname_len-rrset->rk.dname_len);
667	memmove(newname+(q->qname_len-rrset->rk.dname_len), dtarg, dtarglen);
668	/* create rest of CNAME rrset */
669	ck = (struct ub_packed_rrset_key*)regional_alloc(region,
670		sizeof(struct ub_packed_rrset_key));
671	if(!ck)
672		return NULL;
673	memset(&ck->entry, 0, sizeof(ck->entry));
674	msg->rep->rrsets[1] = ck;
675	ck->entry.key = ck;
676	ck->rk.type = htons(LDNS_RR_TYPE_CNAME);
677	ck->rk.rrset_class = rrset->rk.rrset_class;
678	ck->rk.flags = 0;
679	ck->rk.dname = regional_alloc_init(region, q->qname, q->qname_len);
680	if(!ck->rk.dname)
681		return NULL;
682	ck->rk.dname_len = q->qname_len;
683	ck->entry.hash = rrset_key_hash(&ck->rk);
684	newd = (struct packed_rrset_data*)regional_alloc_zero(region,
685		sizeof(struct packed_rrset_data) + sizeof(size_t) +
686		sizeof(uint8_t*) + sizeof(time_t) + sizeof(uint16_t)
687		+ newlen);
688	if(!newd)
689		return NULL;
690	ck->entry.data = newd;
691	newd->ttl = 0; /* 0 for synthesized CNAME TTL */
692	newd->count = 1;
693	newd->rrsig_count = 0;
694	newd->trust = rrset_trust_ans_noAA;
695	newd->rr_len = (size_t*)((uint8_t*)newd +
696		sizeof(struct packed_rrset_data));
697	newd->rr_len[0] = newlen + sizeof(uint16_t);
698	packed_rrset_ptr_fixup(newd);
699	newd->rr_ttl[0] = newd->ttl;
700	msg->rep->ttl = newd->ttl;
701	msg->rep->prefetch_ttl = PREFETCH_TTL_CALC(newd->ttl);
702	msg->rep->serve_expired_ttl = newd->ttl + SERVE_EXPIRED_TTL;
703	sldns_write_uint16(newd->rr_data[0], newlen);
704	memmove(newd->rr_data[0] + sizeof(uint16_t), newname, newlen);
705	msg->rep->an_numrrsets ++;
706	msg->rep->rrset_count ++;
707	return msg;
708}
709
710/** Fill TYPE_ANY response with some data from cache */
711static struct dns_msg*
712fill_any(struct module_env* env,
713	uint8_t* qname, size_t qnamelen, uint16_t qtype, uint16_t qclass,
714	struct regional* region)
715{
716	time_t now = *env->now;
717	struct dns_msg* msg = NULL;
718	uint16_t lookup[] = {LDNS_RR_TYPE_A, LDNS_RR_TYPE_AAAA,
719		LDNS_RR_TYPE_MX, LDNS_RR_TYPE_SOA, LDNS_RR_TYPE_NS,
720		LDNS_RR_TYPE_DNAME, 0};
721	int i, num=6; /* number of RR types to look up */
722	log_assert(lookup[num] == 0);
723
724	for(i=0; i<num; i++) {
725		/* look up this RR for inclusion in type ANY response */
726		struct ub_packed_rrset_key* rrset = rrset_cache_lookup(
727			env->rrset_cache, qname, qnamelen, lookup[i],
728			qclass, 0, now, 0);
729		struct packed_rrset_data *d;
730		if(!rrset)
731			continue;
732
733		/* only if rrset from answer section */
734		d = (struct packed_rrset_data*)rrset->entry.data;
735		if(d->trust == rrset_trust_add_noAA ||
736			d->trust == rrset_trust_auth_noAA ||
737			d->trust == rrset_trust_add_AA ||
738			d->trust == rrset_trust_auth_AA) {
739			lock_rw_unlock(&rrset->entry.lock);
740			continue;
741		}
742
743		/* create msg if none */
744		if(!msg) {
745			msg = dns_msg_create(qname, qnamelen, qtype, qclass,
746				region, (size_t)(num-i));
747			if(!msg) {
748				lock_rw_unlock(&rrset->entry.lock);
749				return NULL;
750			}
751		}
752
753		/* add RRset to response */
754		if(!dns_msg_ansadd(msg, region, rrset, now)) {
755			lock_rw_unlock(&rrset->entry.lock);
756			return NULL;
757		}
758		lock_rw_unlock(&rrset->entry.lock);
759	}
760	return msg;
761}
762
763struct dns_msg*
764dns_cache_lookup(struct module_env* env,
765	uint8_t* qname, size_t qnamelen, uint16_t qtype, uint16_t qclass,
766	uint16_t flags, struct regional* region, struct regional* scratch,
767	int no_partial)
768{
769	struct lruhash_entry* e;
770	struct query_info k;
771	hashvalue_type h;
772	time_t now = *env->now;
773	struct ub_packed_rrset_key* rrset;
774
775	/* lookup first, this has both NXdomains and ANSWER responses */
776	k.qname = qname;
777	k.qname_len = qnamelen;
778	k.qtype = qtype;
779	k.qclass = qclass;
780	k.local_alias = NULL;
781	h = query_info_hash(&k, flags);
782	e = slabhash_lookup(env->msg_cache, h, &k, 0);
783	if(e) {
784		struct msgreply_entry* key = (struct msgreply_entry*)e->key;
785		struct reply_info* data = (struct reply_info*)e->data;
786		struct dns_msg* msg = tomsg(env, &key->key, data, region, now,
787			scratch);
788		if(msg) {
789			lock_rw_unlock(&e->lock);
790			return msg;
791		}
792		/* could be msg==NULL; due to TTL or not all rrsets available */
793		lock_rw_unlock(&e->lock);
794	}
795
796	/* see if a DNAME exists. Checked for first, to enforce that DNAMEs
797	 * are more important, the CNAME is resynthesized and thus
798	 * consistent with the DNAME */
799	if(!no_partial &&
800		(rrset=find_closest_of_type(env, qname, qnamelen, qclass, now,
801		LDNS_RR_TYPE_DNAME, 1))) {
802		/* synthesize a DNAME+CNAME message based on this */
803		enum sec_status sec_status = sec_status_unchecked;
804		struct dns_msg* msg = synth_dname_msg(rrset, region, now, &k,
805			&sec_status);
806		if(msg) {
807			struct ub_packed_rrset_key* cname_rrset;
808			lock_rw_unlock(&rrset->entry.lock);
809			/* now, after unlocking the DNAME rrset lock,
810			 * check the sec_status, and see if we need to look
811			 * up the CNAME record associated before it can
812			 * be used */
813			/* normally, only secure DNAMEs allowed from cache*/
814			if(sec_status == sec_status_secure)
815				return msg;
816			/* but if we have a CNAME cached with this name, then we
817			 * have previously already allowed this name to pass.
818			 * the next cache lookup is going to fetch that CNAME itself,
819			 * but it is better to have the (unsigned)DNAME + CNAME in
820			 * that case */
821			cname_rrset = rrset_cache_lookup(
822				env->rrset_cache, qname, qnamelen,
823				LDNS_RR_TYPE_CNAME, qclass, 0, now, 0);
824			if(cname_rrset) {
825				/* CNAME already synthesized by
826				 * synth_dname_msg routine, so we can
827				 * straight up return the msg */
828				lock_rw_unlock(&cname_rrset->entry.lock);
829				return msg;
830			}
831		} else {
832			lock_rw_unlock(&rrset->entry.lock);
833		}
834	}
835
836	/* see if we have CNAME for this domain,
837	 * but not for DS records (which are part of the parent) */
838	if(!no_partial && qtype != LDNS_RR_TYPE_DS &&
839	   (rrset=rrset_cache_lookup(env->rrset_cache, qname, qnamelen,
840		LDNS_RR_TYPE_CNAME, qclass, 0, now, 0))) {
841		uint8_t* wc = NULL;
842		size_t wl;
843		/* if the rrset is not a wildcard expansion, with wcname */
844		/* because, if we return that CNAME rrset on its own, it is
845		 * missing the NSEC or NSEC3 proof */
846		if(!(val_rrset_wildcard(rrset, &wc, &wl) && wc != NULL)) {
847			struct dns_msg* msg = rrset_msg(rrset, region, now, &k);
848			if(msg) {
849				lock_rw_unlock(&rrset->entry.lock);
850				return msg;
851			}
852		}
853		lock_rw_unlock(&rrset->entry.lock);
854	}
855
856	/* construct DS, DNSKEY, DLV messages from rrset cache. */
857	if((qtype == LDNS_RR_TYPE_DS || qtype == LDNS_RR_TYPE_DNSKEY ||
858		qtype == LDNS_RR_TYPE_DLV) &&
859		(rrset=rrset_cache_lookup(env->rrset_cache, qname, qnamelen,
860		qtype, qclass, 0, now, 0))) {
861		/* if the rrset is from the additional section, and the
862		 * signatures have fallen off, then do not synthesize a msg
863		 * instead, allow a full query for signed results to happen.
864		 * Forego all rrset data from additional section, because
865		 * some signatures may not be present and cause validation
866		 * failure.
867		 */
868		struct packed_rrset_data *d = (struct packed_rrset_data*)
869			rrset->entry.data;
870		if(d->trust != rrset_trust_add_noAA &&
871			d->trust != rrset_trust_add_AA &&
872			(qtype == LDNS_RR_TYPE_DS ||
873				(d->trust != rrset_trust_auth_noAA
874				&& d->trust != rrset_trust_auth_AA) )) {
875			struct dns_msg* msg = rrset_msg(rrset, region, now, &k);
876			if(msg) {
877				lock_rw_unlock(&rrset->entry.lock);
878				return msg;
879			}
880		}
881		lock_rw_unlock(&rrset->entry.lock);
882	}
883
884	/* stop downwards cache search on NXDOMAIN.
885	 * Empty nonterminals are NOERROR, so an NXDOMAIN for foo
886	 * means bla.foo also does not exist.  The DNSSEC proofs are
887	 * the same.  We search upwards for NXDOMAINs. */
888	if(env->cfg->harden_below_nxdomain)
889	    while(!dname_is_root(k.qname)) {
890		dname_remove_label(&k.qname, &k.qname_len);
891		h = query_info_hash(&k, flags);
892		e = slabhash_lookup(env->msg_cache, h, &k, 0);
893		if(!e && k.qtype != LDNS_RR_TYPE_A &&
894			env->cfg->qname_minimisation) {
895			k.qtype = LDNS_RR_TYPE_A;
896			h = query_info_hash(&k, flags);
897			e = slabhash_lookup(env->msg_cache, h, &k, 0);
898		}
899		if(e) {
900			struct reply_info* data = (struct reply_info*)e->data;
901			struct dns_msg* msg;
902			if(FLAGS_GET_RCODE(data->flags) == LDNS_RCODE_NXDOMAIN
903			  && data->security == sec_status_secure
904			  && (msg=tomsg(env, &k, data, region, now, scratch))){
905				lock_rw_unlock(&e->lock);
906				msg->qinfo.qname=qname;
907				msg->qinfo.qname_len=qnamelen;
908				/* check that DNSSEC really works out */
909				msg->rep->security = sec_status_unchecked;
910				return msg;
911			}
912			lock_rw_unlock(&e->lock);
913		}
914		k.qtype = qtype;
915	    }
916
917	/* fill common RR types for ANY response to avoid requery */
918	if(qtype == LDNS_RR_TYPE_ANY) {
919		return fill_any(env, qname, qnamelen, qtype, qclass, region);
920	}
921
922	return NULL;
923}
924
925int
926dns_cache_store(struct module_env* env, struct query_info* msgqinf,
927        struct reply_info* msgrep, int is_referral, time_t leeway, int pside,
928	struct regional* region, uint32_t flags)
929{
930	struct reply_info* rep = NULL;
931	/* alloc, malloc properly (not in region, like msg is) */
932	rep = reply_info_copy(msgrep, env->alloc, NULL);
933	if(!rep)
934		return 0;
935	/* ttl must be relative ;i.e. 0..86400 not  time(0)+86400.
936	 * the env->now is added to message and RRsets in this routine. */
937	/* the leeway is used to invalidate other rrsets earlier */
938
939	if(is_referral) {
940		/* store rrsets */
941		struct rrset_ref ref;
942		size_t i;
943		for(i=0; i<rep->rrset_count; i++) {
944			packed_rrset_ttl_add((struct packed_rrset_data*)
945				rep->rrsets[i]->entry.data, *env->now);
946			ref.key = rep->rrsets[i];
947			ref.id = rep->rrsets[i]->id;
948			/*ignore ret: it was in the cache, ref updated */
949			/* no leeway for typeNS */
950			(void)rrset_cache_update(env->rrset_cache, &ref,
951				env->alloc, *env->now +
952				((ntohs(ref.key->rk.type)==LDNS_RR_TYPE_NS
953				 && !pside) ? 0:leeway));
954		}
955		free(rep);
956		return 1;
957	} else {
958		/* store msg, and rrsets */
959		struct query_info qinf;
960		hashvalue_type h;
961
962		qinf = *msgqinf;
963		qinf.qname = memdup(msgqinf->qname, msgqinf->qname_len);
964		if(!qinf.qname) {
965			reply_info_parsedelete(rep, env->alloc);
966			return 0;
967		}
968		/* fixup flags to be sensible for a reply based on the cache */
969		/* this module means that RA is available. It is an answer QR.
970		 * Not AA from cache. Not CD in cache (depends on client bit). */
971		rep->flags |= (BIT_RA | BIT_QR);
972		rep->flags &= ~(BIT_AA | BIT_CD);
973		h = query_info_hash(&qinf, (uint16_t)flags);
974		dns_cache_store_msg(env, &qinf, h, rep, leeway, pside, msgrep,
975			flags, region);
976		/* qname is used inside query_info_entrysetup, and set to
977		 * NULL. If it has not been used, free it. free(0) is safe. */
978		free(qinf.qname);
979	}
980	return 1;
981}
982
983int
984dns_cache_prefetch_adjust(struct module_env* env, struct query_info* qinfo,
985        time_t adjust, uint16_t flags)
986{
987	struct msgreply_entry* msg;
988	msg = msg_cache_lookup(env, qinfo->qname, qinfo->qname_len,
989		qinfo->qtype, qinfo->qclass, flags, *env->now, 1);
990	if(msg) {
991		struct reply_info* rep = (struct reply_info*)msg->entry.data;
992		if(rep) {
993			rep->prefetch_ttl += adjust;
994			lock_rw_unlock(&msg->entry.lock);
995			return 1;
996		}
997		lock_rw_unlock(&msg->entry.lock);
998	}
999	return 0;
1000}
1001