2 * This file is part of PowerDNS or dnsdist.
3 * Copyright -- PowerDNS.COM B.V. and its contributors
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of version 2 of the GNU General Public License as
7 * published by the Free Software Foundation.
9 * In addition, for the avoidance of any doubt, permission is granted to
10 * link this program with OpenSSL and to (re)distribute the binaries
11 * produced as the result of such linking.
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
24 #include "ext/luawrapper/include/LuaContext.hpp"
30 #include <boost/circular_buffer.hpp>
31 #include <boost/variant.hpp>
36 #include "dnscrypt.hh"
37 #include "dnsdist-cache.hh"
39 #include "dnsdist-dynbpf.hh"
40 #include "bpf-filter.hh"
43 #include <boost/uuid/uuid.hpp>
44 #include <boost/uuid/uuid_generators.hpp>
// Thread entry point taking no arguments and returning void*.
// NOTE(review): presumably the loop that exports statistics to the Carbon
// servers configured in g_carbon — confirm against the definition.
47 void* carbonDumpThread();
// Statistic callback with the DNSDistStats::statfunction_t signature
// (uint64_t(const std::string&)); it is registered under the "uptime" entry
// of the stats table. The string argument is the value passed to every
// statfunction_t; NOTE(review): presumably the entry name — confirm.
48 uint64_t uptimeOfProcess(const std::string& str);
52 DynBlock& operator=(const DynBlock& rhs)
57 blocks.store(rhs.blocks);
62 struct timespec until;
64 mutable std::atomic<unsigned int> blocks;
67 extern GlobalStateHolder<NetmaskTree<DynBlock>> g_dynblockNMG;
69 extern vector<pair<struct timeval, std::string> > g_confDelta;
73 using stat_t=std::atomic<uint64_t>; // aww yiss ;-)
75 stat_t servfailResponses{0};
77 stat_t nonCompliantQueries{0};
78 stat_t nonCompliantResponses{0};
80 stat_t emptyQueries{0};
82 stat_t blockFilter{0};
85 stat_t ruleNXDomain{0};
86 stat_t ruleRefused{0};
87 stat_t selfAnswered{0};
88 stat_t downstreamTimeouts{0};
89 stat_t downstreamSendErrors{0};
93 stat_t cacheMisses{0};
94 stat_t latency0_1{0}, latency1_10{0}, latency10_50{0}, latency50_100{0}, latency100_1000{0}, latencySlow{0};
96 double latencyAvg100{0}, latencyAvg1000{0}, latencyAvg10000{0}, latencyAvg1000000{0};
97 typedef std::function<uint64_t(const std::string&)> statfunction_t;
98 typedef boost::variant<stat_t*, double*, statfunction_t> entry_t;
99 std::vector<std::pair<std::string, entry_t>> entries{
100 {"responses", &responses},
101 {"servfail-responses", &servfailResponses},
102 {"queries", &queries},
103 {"acl-drops", &aclDrops},
104 {"block-filter", &blockFilter},
105 {"rule-drop", &ruleDrop},
106 {"rule-nxdomain", &ruleNXDomain},
107 {"rule-refused", &ruleRefused},
108 {"self-answered", &selfAnswered},
109 {"downstream-timeouts", &downstreamTimeouts},
110 {"downstream-send-errors", &downstreamSendErrors},
111 {"trunc-failures", &truncFail},
112 {"no-policy", &noPolicy},
113 {"latency0-1", &latency0_1},
114 {"latency1-10", &latency1_10},
115 {"latency10-50", &latency10_50},
116 {"latency50-100", &latency50_100},
117 {"latency100-1000", &latency100_1000},
118 {"latency-slow", &latencySlow},
119 {"latency-avg100", &latencyAvg100},
120 {"latency-avg1000", &latencyAvg1000},
121 {"latency-avg10000", &latencyAvg10000},
122 {"latency-avg1000000", &latencyAvg1000000},
123 {"uptime", uptimeOfProcess},
124 {"real-memory-usage", getRealMemoryUsage},
125 {"noncompliant-queries", &nonCompliantQueries},
126 {"noncompliant-responses", &nonCompliantResponses},
127 {"rdqueries", &rdQueries},
128 {"empty-queries", &emptyQueries},
129 {"cache-hits", &cacheHits},
130 {"cache-misses", &cacheMisses},
131 {"cpu-user-msec", getCPUTimeUser},
132 {"cpu-sys-msec", getCPUTimeSystem},
133 {"fd-usage", getOpenFileDescriptors},
134 {"dyn-blocked", &dynBlocked},
135 {"dyn-block-nmg-size", [](const std::string&) { return g_dynblockNMG.getLocal()->size(); }}
140 extern struct DNSDistStats g_stats;
145 StopWatch(bool realTime=false): d_needRealTime(realTime)
148 struct timespec d_start{0,0};
149 bool d_needRealTime{false};
152 if(gettime(&d_start, d_needRealTime) < 0)
153 unixDie("Getting timestamp");
157 double udiff() const {
159 if(gettime(&now, d_needRealTime) < 0)
160 unixDie("Getting timestamp");
162 return 1000000.0*(now.tv_sec - d_start.tv_sec) + (now.tv_nsec - d_start.tv_nsec)/1000.0;
165 double udiffAndSet() {
167 if(gettime(&now, d_needRealTime) < 0)
168 unixDie("Getting timestamp");
170 auto ret= 1000000.0*(now.tv_sec - d_start.tv_sec) + (now.tv_nsec - d_start.tv_nsec)/1000.0;
184 QPSLimiter(unsigned int rate, unsigned int burst) : d_rate(rate), d_burst(burst), d_tokens(burst)
190 unsigned int getRate() const
192 return d_passthrough? 0 : d_rate;
195 int getPassed() const
199 int getBlocked() const
204 bool check() const // this is not quite fair
208 auto delta = d_prev.udiffAndSet();
210 d_tokens += 1.0*d_rate * (delta/1000000.0);
212 if(d_tokens > d_burst)
216 if(d_tokens >= 1.0) { // we need this because burst=1 is weird otherwise
227 bool d_passthrough{true};
229 unsigned int d_burst;
230 mutable double d_tokens;
231 mutable StopWatch d_prev;
232 mutable unsigned int d_passed{0};
233 mutable unsigned int d_blocked{0};
// Default-constructs an empty slot: origFD is -1 (a negative origFD marks the
// state as unused), sentTime is a StopWatch built with realTime=true,
// delayMsec is 0, and origDest's address family is cleared to 0.
// NOTE(review): `age` (std::atomic<uint16_t>) is not initialised here and has
// no default member initialiser visible in this header — confirm it is always
// stored before its first load.
238 IDState() : origFD(-1), sentTime(true), delayMsec(0) { origDest.sin4.sin_family = 0;}
239 IDState(const IDState& orig)
241 origFD = orig.origFD;
242 origID = orig.origID;
243 origRemote = orig.origRemote;
244 origDest = orig.origDest;
245 delayMsec = orig.delayMsec;
246 age.store(orig.age.load());
249 int origFD; // set to <0 to indicate this state is empty // 4
251 ComboAddress origRemote; // 28
252 ComboAddress origDest; // 28
253 StopWatch sentTime; // 16
256 std::shared_ptr<DnsCryptQuery> dnsCryptQuery{0};
259 boost::uuids::uuid uniqueId;
261 std::shared_ptr<DNSDistPacketCache> packetCache{nullptr};
262 uint32_t cacheKey; // 8
263 std::atomic<uint16_t> age; // 4
265 uint16_t qclass; // 2
266 uint16_t origID; // 2
267 uint16_t origFlags; // 2
269 bool ednsAdded{false};
270 bool ecsAdded{false};
271 bool skipCache{false};
272 bool destHarvested{false}; // if true, origDest holds the original dest addr, otherwise the listening addr
278 queryRing.set_capacity(10000);
279 respRing.set_capacity(10000);
280 pthread_rwlock_init(&queryLock, 0);
284 struct timespec when;
285 ComboAddress requestor;
291 boost::circular_buffer<Query> queryRing;
294 struct timespec when;
295 ComboAddress requestor;
301 ComboAddress ds; // who handled it
303 boost::circular_buffer<Response> respRing;
304 std::mutex respMutex;
305 pthread_rwlock_t queryLock;
307 std::unordered_map<int, vector<boost::variant<string,double> > > getTopBandwidth(unsigned int numentries);
308 size_t numDistinctRequestors();
311 extern Rings g_rings;
// Per-key counters: maps a string key to the number of times it was seen.
313 typedef std::unordered_map<string, unsigned int> QueryCountRecords;
// Callback that inspects a question and returns a (bool, string) tuple.
// NOTE(review): presumably (should-count, key-to-count-under) — confirm at the
// call site. Also note the DNSQuestion is taken by value, so every invocation
// copies it; a const reference would avoid that if callers allow it.
314 typedef std::function<std::tuple<bool, string>(DNSQuestion dq)> QueryCountFilter;
318 pthread_rwlock_init(&queryLock, 0);
320 QueryCountRecords records;
321 QueryCountFilter filter;
322 pthread_rwlock_t queryLock;
326 extern QueryCount g_qcount;
332 DnsCryptContext* dnscryptCtx{0};
334 std::atomic<uint64_t> queries{0};
338 int getSocket() const
340 return udpFD != -1 ? udpFD : tcpFD;
344 shared_ptr<BPFFilter> d_filter;
349 d_filter->removeSocket(getSocket());
354 void attachFilter(shared_ptr<BPFFilter> bpf)
358 bpf->addSocket(getSocket());
361 #endif /* HAVE_EBPF */
364 class TCPClientCollection {
365 std::vector<int> d_tcpclientthreads;
366 std::atomic<uint64_t> d_numthreads{0};
367 std::atomic<uint64_t> d_pos{0};
368 std::atomic<uint64_t> d_queued{0};
369 uint64_t d_maxthreads{0};
373 TCPClientCollection(size_t maxThreads)
375 d_maxthreads = maxThreads;
376 d_tcpclientthreads.reserve(maxThreads);
380 uint64_t pos = d_pos++;
382 return d_tcpclientthreads[pos % d_numthreads];
384 bool hasReachedMaxThreads() const
386 return d_numthreads >= d_maxthreads;
388 uint64_t getThreadsCount() const
392 uint64_t getQueuedCount() const
396 void decrementQueuedCount()
400 void addTCPClientThread();
403 extern std::shared_ptr<TCPClientCollection> g_tcpclientthreads;
405 struct DownstreamState
// Full constructor (defined out of line): backend address, the local source
// address to use, and the source interface index.
407 DownstreamState(const ComboAddress& remote_, const ComboAddress& sourceAddr_, unsigned int sourceItf);
// Convenience overload: delegates to the three-argument constructor with a
// default-constructed source address and source interface 0.
// NOTE(review): single-argument and not `explicit`, so a ComboAddress converts
// implicitly to a DownstreamState.
408 DownstreamState(const ComboAddress& remote_): DownstreamState(remote_, ComboAddress(), 0) {}
419 vector<IDState> idStates;
420 ComboAddress sourceAddr;
421 DNSName checkName{"a.root-servers.net."};
422 QType checkType{QType::A};
423 std::atomic<uint64_t> idOffset{0};
424 std::atomic<uint64_t> sendErrors{0};
425 std::atomic<uint64_t> outstanding{0};
426 std::atomic<uint64_t> reuseds{0};
427 std::atomic<uint64_t> queries{0};
429 std::atomic<uint64_t> sendErrors{0};
430 std::atomic<uint64_t> reuseds{0};
431 std::atomic<uint64_t> queries{0};
434 double queryLoad{0.0};
435 double dropRate{0.0};
436 double latencyUsec{0.0};
439 int tcpRecvTimeout{30};
440 int tcpSendTimeout{30};
441 unsigned int sourceItf{0};
443 uint8_t currentCheckFailures{0};
444 uint8_t maxCheckFailures{1};
447 enum class Availability { Up, Down, Auto} availability{Availability::Auto};
448 bool mustResolve{false};
449 bool upStatus{false};
454 if(availability == Availability::Down)
456 if(availability == Availability::Up)
// Setters for the `availability` mode. setUp()/setDown() pin the mode to
// Availability::Up / Availability::Down; setAuto() switches it back to
// Availability::Auto (the default).
// NOTE(review): Auto presumably defers to the health-check-driven `upStatus`
// flag — confirm in the accessor that reads `availability`.
460 void setUp() { availability = Availability::Up; }
461 void setDown() { availability = Availability::Down; }
462 void setAuto() { availability = Availability::Auto; }
463 string getName() const {
465 return remote.toStringWithPort();
469 string getNameWithAddr() const {
471 return remote.toStringWithPort();
473 return name + " (" + remote.toStringWithPort()+ ")";
477 using servers_t =vector<std::shared_ptr<DownstreamState>>;
479 extern uint16_t g_ECSSourcePrefixV4;
480 extern uint16_t g_ECSSourcePrefixV6;
481 extern bool g_ECSOverride;
// Builds a view over an in-flight query. The name, local/remote addresses and
// DNS header are stored as the raw pointers passed in (nothing is copied), so
// the pointed-to objects must outlive this DNSQuestion.
//   name / type / class_ : parsed question name, qtype and qclass
//   lc / rem             : local and remote addresses
//   header               : DNS header of the packet
//   bufferSize, queryLen : stored as `size` and `len`
//   isTcp                : stored as `tcp`
// ecsPrefixLength is taken from g_ECSSourcePrefixV4 when the remote address is
// AF_INET and from g_ECSSourcePrefixV6 otherwise; ecsOverride is copied from
// g_ECSOverride at construction time.
// `rem` is dereferenced in the initialiser list and therefore must not be null.
485 DNSQuestion(const DNSName* name, uint16_t type, uint16_t class_, const ComboAddress* lc, const ComboAddress* rem, struct dnsheader* header, size_t bufferSize, uint16_t queryLen, bool isTcp): qname(name), qtype(type), qclass(class_), local(lc), remote(rem), dh(header), size(bufferSize), len(queryLen), ecsPrefixLength(rem->sin4.sin_family == AF_INET ? g_ECSSourcePrefixV4 : g_ECSSourcePrefixV6), tcp(isTcp), ecsOverride(g_ECSOverride) { }
488 boost::uuids::uuid uniqueId;
490 const DNSName* qname;
491 const uint16_t qtype;
492 const uint16_t qclass;
493 const ComboAddress* local;
494 const ComboAddress* remote;
495 struct dnsheader* dh;
498 uint16_t ecsPrefixLength;
500 bool skipCache{false};
505 struct DNSResponse : DNSQuestion
// Forwards every question-related argument unchanged to the DNSQuestion base
// constructor and additionally stores `queryTime_` as the `queryTime` pointer.
// The timespec is not copied, so it must outlive this object.
507 DNSResponse(const DNSName* name, uint16_t type, uint16_t class_, const ComboAddress* lc, const ComboAddress* rem, struct dnsheader* header, size_t bufferSize, uint16_t queryLen, bool isTcp, const struct timespec* queryTime_): DNSQuestion(name, type, class_, lc, rem, header, bufferSize, queryLen, isTcp), queryTime(queryTime_) { }
509 const struct timespec* queryTime;
// Predicate over a question; processQuery() accepts one as its `blockFilter`
// argument. NOTE(review): presumably `true` means "block this query" — confirm.
512 typedef std::function<bool(const DNSQuestion*)> blockfilter_t;
// A vector of (unsigned int, T) pairs.
// NOTE(review): the integer is presumably an ordering/position number — confirm.
513 template <class T> using NumberedVector = std::vector<std::pair<unsigned int, T> >;
// Thread entry point that receives the backend it serves as a shared_ptr.
// NOTE(review): presumably reads responses coming back from that backend —
// confirm against the definition.
515 void* responderThread(std::shared_ptr<DownstreamState> state);
516 extern std::mutex g_luamutex;
517 extern LuaContext g_lua;
518 extern std::string g_outputBuffer; // locking for this is ok, as locked by g_luamutex
523 virtual bool matches(const DNSQuestion* dq) const =0;
524 virtual string toString() const = 0;
525 mutable std::atomic<uint64_t> d_matches{0};
528 /* so what could you do:
531 provide actual answer,
532 allow and stop processing,
534 modify header: (servfail|refused|notimp), set TC=1,
540 enum class Action { Drop, Nxdomain, Refused, Spoof, Allow, HeaderModify, Pool, Delay, None};
541 virtual Action operator()(DNSQuestion*, string* ruleresult) const =0;
542 virtual string toString() const = 0;
543 virtual std::unordered_map<string, double> getStats() const
549 class DNSResponseAction
552 enum class Action { Allow, Delay, Drop, HeaderModify, None };
553 virtual Action operator()(DNSResponse*, string* ruleresult) const =0;
554 virtual string toString() const = 0;
// NumberedVector specialised for backends: (unsigned int, backend) pairs.
557 using NumberedServerVector = NumberedVector<shared_ptr<DownstreamState>>;
// Signature of a server-selection policy: given the candidate servers and the
// question, return the backend to use. firstAvailable, leastOutstanding,
// wrandom, whashed and roundrobin all have this signature.
558 typedef std::function<shared_ptr<DownstreamState>(const NumberedServerVector& servers, const DNSQuestion*)> policyfunc_t;
// Returns a copy of the pool's packet-cache pointer. It is null when no cache
// is attached, since packetCache defaults to nullptr.
// NOTE(review): the top-level `const` on the by-value return type has no effect
// for callers other than preventing a move from the temporary.
568 const std::shared_ptr<DNSDistPacketCache> getCache() const { return packetCache; };
570 NumberedVector<shared_ptr<DownstreamState>> servers;
571 std::shared_ptr<DNSDistPacketCache> packetCache{nullptr};
// Pool registry: pool name -> shared ServerPool, ordered by name (std::map).
573 using pools_t=map<std::string,std::shared_ptr<ServerPool>>;
// Add `server` to the pool called `poolName` inside `pools`.
// NOTE(review): presumably creates the pool when it does not exist yet
// (cf. createPoolIfNotExists) — confirm against the definition.
574 void addServerToPool(pools_t& pools, const string& poolName, std::shared_ptr<DownstreamState> server);
// Remove `server` from the pool called `poolName` inside `pools`.
// NOTE(review): behaviour for an unknown pool or absent server is not visible
// from this declaration — confirm against the definition.
575 void removeServerFromPool(pools_t& pools, const string& poolName, std::shared_ptr<DownstreamState> server);
581 unsigned int interval;
584 enum ednsHeaderFlags {
585 EDNS_HEADER_FLAG_NONE = 0,
586 EDNS_HEADER_FLAG_DO = 32768
589 extern GlobalStateHolder<SuffixMatchTree<DynBlock>> g_dynblockSMT;
590 extern DNSAction::Action g_dynBlockAction;
592 extern GlobalStateHolder<vector<CarbonConfig> > g_carbon;
593 extern GlobalStateHolder<ServerPolicy> g_policy;
594 extern GlobalStateHolder<servers_t> g_dstates;
595 extern GlobalStateHolder<pools_t> g_pools;
596 extern GlobalStateHolder<vector<pair<std::shared_ptr<DNSRule>, std::shared_ptr<DNSAction> > > > g_rulactions;
597 extern GlobalStateHolder<vector<pair<std::shared_ptr<DNSRule>, std::shared_ptr<DNSResponseAction> > > > g_resprulactions;
598 extern GlobalStateHolder<NetmaskGroup> g_ACL;
600 extern ComboAddress g_serverControl; // not changed during runtime
602 extern std::vector<std::tuple<ComboAddress, bool, bool, int>> g_locals; // not changed at runtime (we hope XXX)
603 extern vector<ClientState*> g_frontends;
604 extern std::string g_key; // in theory needs locking
605 extern bool g_truncateTC;
606 extern bool g_fixupCase;
607 extern int g_tcpRecvTimeout;
608 extern int g_tcpSendTimeout;
609 extern int g_udpTimeout;
610 extern uint16_t g_maxOutstanding;
611 extern std::atomic<bool> g_configurationDone;
612 extern uint64_t g_maxTCPClientThreads;
613 extern uint64_t g_maxTCPQueuedConnections;
614 extern std::atomic<uint16_t> g_cacheCleaningDelay;
615 extern std::atomic<uint16_t> g_cacheCleaningPercentage;
616 extern bool g_verboseHealthChecks;
617 extern uint32_t g_staleCacheEntriesTTL;
618 extern bool g_apiReadWrite;
619 extern std::string g_apiConfigDirectory;
620 extern bool g_servFailOnNoPolicy;
622 struct ConsoleKeyword {
625 std::string parameters;
626 std::string description;
627 std::string toString() const
629 std::string res(name);
631 res += "(" + parameters + ")";
638 extern const std::vector<ConsoleKeyword> g_consoleKeywords;
641 extern shared_ptr<BPFFilter> g_defaultBPFFilter;
642 extern std::vector<std::shared_ptr<DynBPFFilter> > g_dynBPFFilters;
643 #endif /* HAVE_EBPF */
647 void controlThread(int fd, ComboAddress local);
648 vector<std::function<void(void)>> setupLua(bool client, const std::string& config);
// Look up `poolName` in `pools`. Takes the registry by const reference, so it
// cannot insert. NOTE(review): behaviour for a missing pool (null vs. throw) is
// not visible here — confirm.
649 std::shared_ptr<ServerPool> getPool(const pools_t& pools, const std::string& poolName);
// As the name states: return the pool called `poolName`, creating it in
// `pools` first when absent (the registry is taken by mutable reference).
650 std::shared_ptr<ServerPool> createPoolIfNotExists(pools_t& pools, const string& poolName);
// Return, by const reference, the numbered server list to select from for
// `poolName`. NOTE(review): the referenced vector's lifetime is tied to
// something the callee owns — confirm what that is before holding on to it.
651 const NumberedServerVector& getDownstreamCandidates(const pools_t& pools, const std::string& poolName);
// Built-in server-selection functions. Each one has the policyfunc_t
// signature: it receives the candidate servers and the question, and returns
// the chosen backend.
// NOTE(review): the selection strategy of each is implied by its name only,
// and whether an empty shared_ptr is returned when no server is usable is not
// visible here — confirm against the definitions.
653 std::shared_ptr<DownstreamState> firstAvailable(const NumberedServerVector& servers, const DNSQuestion* dq);
655 std::shared_ptr<DownstreamState> leastOutstanding(const NumberedServerVector& servers, const DNSQuestion* dq);
656 std::shared_ptr<DownstreamState> wrandom(const NumberedServerVector& servers, const DNSQuestion* dq);
657 std::shared_ptr<DownstreamState> whashed(const NumberedServerVector& servers, const DNSQuestion* dq);
658 std::shared_ptr<DownstreamState> roundrobin(const NumberedServerVector& servers, const DNSQuestion* dq);
659 int getEDNSZ(const char* packet, unsigned int len);
660 void spoofResponseFromString(DNSQuestion& dq, const string& spoofContent);
661 uint16_t getEDNSOptionCode(const char * packet, size_t len);
662 void dnsdistWebserverThread(int sock, const ComboAddress& local, const string& password, const string& apiKey, const boost::optional<std::map<std::string, std::string> >&);
663 bool getMsgLen32(int fd, uint32_t* len);
664 bool putMsgLen32(int fd, uint32_t len);
665 void* tcpAcceptorThread(void* p);
667 void moreLua(bool client);
668 void doClient(ComboAddress server, const std::string& command);
670 void controlClientThread(int fd, ComboAddress client);
672 char** my_completion( const char * text , int start, int end);
674 void setLuaNoSideEffect(); // if nothing has been declared, set that there are no side effects
675 void setLuaSideEffect(); // set to report a side effect, cancelling all _no_ side effect calls
676 bool getLuaNoSideEffect(); // set if there were only explicit declarations of _no_ side effect
677 void resetLuaSideEffect(); // reset to indeterminate state
679 bool responseContentMatches(const char* response, const uint16_t responseLen, const DNSName& qname, const uint16_t qtype, const uint16_t qclass, const ComboAddress& remote);
680 bool processQuery(LocalStateHolder<NetmaskTree<DynBlock> >& localDynBlockNMG,
681 LocalStateHolder<SuffixMatchTree<DynBlock> >& localDynBlockSMT, LocalStateHolder<vector<pair<std::shared_ptr<DNSRule>, std::shared_ptr<DNSAction> > > >& localRulactions, blockfilter_t blockFilter, DNSQuestion& dq, string& poolname, int* delayMsec, const struct timespec& now);
682 bool processResponse(LocalStateHolder<vector<pair<std::shared_ptr<DNSRule>, std::shared_ptr<DNSResponseAction> > > >& localRespRulactions, DNSResponse& dr, int* delayMsec);
683 bool fixUpResponse(char** response, uint16_t* responseLen, size_t* responseSize, const DNSName& qname, uint16_t origFlags, bool ednsAdded, bool ecsAdded, std::vector<uint8_t>& rewrittenResponse, uint16_t addRoom);
684 void restoreFlags(struct dnsheader* dh, uint16_t origFlags);
687 extern std::vector<std::tuple<ComboAddress,DnsCryptContext,bool,int>> g_dnsCryptLocals;
689 int handleDnsCryptQuery(DnsCryptContext* ctx, char* packet, uint16_t len, std::shared_ptr<DnsCryptQuery>& query, uint16_t* decryptedQueryLen, bool tcp, std::vector<uint8_t>& reponse);
690 bool encryptResponse(char* response, uint16_t* responseLen, size_t responseSize, bool tcp, std::shared_ptr<DnsCryptQuery> dnsCryptQuery);