2 ###############################################################################
4 # libloc - A library to determine the location of someone on the Internet #
6 # Copyright (C) 2020 IPFire Development Team <info@ipfire.org> #
8 # This library is free software; you can redistribute it and/or #
9 # modify it under the terms of the GNU Lesser General Public #
10 # License as published by the Free Software Foundation; either #
11 # version 2.1 of the License, or (at your option) any later version. #
13 # This library is distributed in the hope that it will be useful, #
14 # but WITHOUT ANY WARRANTY; without even the implied warranty of #
15 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU #
16 # Lesser General Public License for more details. #
18 ###############################################################################
28 # Load our location module
30 import location
.database
31 import location
.importer
32 from location
.i18n
import _
35 log
= logging
.getLogger("location.importer")
40 parser
= argparse
.ArgumentParser(
41 description
=_("Location Importer Command Line Interface"),
43 subparsers
= parser
.add_subparsers()
45 # Global configuration flags
46 parser
.add_argument("--debug", action
="store_true",
47 help=_("Enable debug output"))
50 parser
.add_argument("--version", action
="version",
51 version
="%(prog)s @VERSION@")
54 parser
.add_argument("--database-host", required
=True,
55 help=_("Database Hostname"), metavar
=_("HOST"))
56 parser
.add_argument("--database-name", required
=True,
57 help=_("Database Name"), metavar
=_("NAME"))
58 parser
.add_argument("--database-username", required
=True,
59 help=_("Database Username"), metavar
=_("USERNAME"))
60 parser
.add_argument("--database-password", required
=True,
61 help=_("Database Password"), metavar
=_("PASSWORD"))
64 write
= subparsers
.add_parser("write", help=_("Write database to file"))
65 write
.set_defaults(func
=self
.handle_write
)
66 write
.add_argument("file", nargs
=1, help=_("Database File"))
67 write
.add_argument("--signing-key", nargs
="?", type=open, help=_("Signing Key"))
68 write
.add_argument("--vendor", nargs
="?", help=_("Sets the vendor"))
69 write
.add_argument("--description", nargs
="?", help=_("Sets a description"))
70 write
.add_argument("--license", nargs
="?", help=_("Sets the license"))
73 update_whois
= subparsers
.add_parser("update-whois", help=_("Update WHOIS Information"))
74 update_whois
.set_defaults(func
=self
.handle_update_whois
)
76 # Update announcements
77 update_announcements
= subparsers
.add_parser("update-announcements",
78 help=_("Update BGP Annoucements"))
79 update_announcements
.set_defaults(func
=self
.handle_update_announcements
)
80 update_announcements
.add_argument("server", nargs
=1,
81 help=_("Route Server to connect to"), metavar
=_("SERVER"))
84 update_overrides
= subparsers
.add_parser("update-overrides",
85 help=_("Update overrides"),
87 update_overrides
.add_argument(
88 "files", nargs
="+", help=_("Files to import"),
90 update_overrides
.set_defaults(func
=self
.handle_update_overrides
)
92 args
= parser
.parse_args()
94 # Enable debug logging
96 location
.logger
.set_level(logging
.DEBUG
)
98 # Print usage if no action was given
99 if not "func" in args
:
106 # Parse command line arguments
107 args
= self
.parse_cli()
109 # Initialise database
110 self
.db
= self
._setup
_database
(args
)
113 ret
= args
.func(args
)
115 # Return with exit code
119 # Otherwise just exit
def _setup_database(self, ns):
    """
    Connect to the database and make sure the importer's schema exists.

    ns is the parsed command line namespace; its database_host,
    database_name, database_username and database_password attributes
    are handed to location.database.Connection.

    All statements use IF NOT EXISTS, so running this against an
    already initialised database leaves the existing objects alone.

    Returns the open connection.
    """
    # Connect to database
    db = location.database.Connection(
        host=ns.database_host,
        database=ns.database_name,
        user=ns.database_username,
        password=ns.database_password,
    )

    # Create tables and indexes in a single transaction
    with db.transaction():
        db.execute("""
            -- announcements
            CREATE TABLE IF NOT EXISTS announcements(network inet, autnum bigint,
                first_seen_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,
                last_seen_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP);
            CREATE UNIQUE INDEX IF NOT EXISTS announcements_networks ON announcements(network);
            CREATE INDEX IF NOT EXISTS announcements_family ON announcements(family(network));

            -- autnums
            CREATE TABLE IF NOT EXISTS autnums(number bigint, name text NOT NULL);
            CREATE UNIQUE INDEX IF NOT EXISTS autnums_number ON autnums(number);

            -- networks
            CREATE TABLE IF NOT EXISTS networks(network inet, country text);
            CREATE UNIQUE INDEX IF NOT EXISTS networks_network ON networks(network);
            CREATE INDEX IF NOT EXISTS networks_search ON networks USING GIST(network inet_ops);

            -- overrides
            -- NOTE(review): the "name" and "country" columns below are
            -- the ones the override INSERTs write to - confirm against
            -- the deployed schema.
            CREATE TABLE IF NOT EXISTS autnum_overrides(
                number bigint NOT NULL,
                name text,
                is_anonymous_proxy boolean DEFAULT FALSE,
                is_satellite_provider boolean DEFAULT FALSE,
                is_anycast boolean DEFAULT FALSE
            );
            CREATE UNIQUE INDEX IF NOT EXISTS autnum_overrides_number
                ON autnum_overrides(number);

            CREATE TABLE IF NOT EXISTS network_overrides(
                network inet NOT NULL,
                country text,
                is_anonymous_proxy boolean DEFAULT FALSE,
                is_satellite_provider boolean DEFAULT FALSE,
                is_anycast boolean DEFAULT FALSE
            );
            CREATE UNIQUE INDEX IF NOT EXISTS network_overrides_network
                ON network_overrides(network);
        """)

    return db
def handle_write(self, ns):
    """
    Compiles a database in libloc format out of what is in the database

    ns is the parsed command line namespace. ns.signing_key is passed
    to the writer, ns.vendor / ns.description / ns.license are copied
    onto it when set, and the result is written to every path listed
    in ns.file.
    """
    # Allocate a writer
    writer = location.Writer(ns.signing_key)

    # Set all metadata (only what was given on the command line)
    if ns.vendor:
        writer.vendor = ns.vendor

    if ns.description:
        writer.description = ns.description

    if ns.license:
        writer.license = ns.license

    # Add all Autonomous Systems
    log.info("Writing Autonomous Systems...")

    # Select all ASes with a name; a name from autnum_overrides takes
    # precedence over the one imported from WHOIS
    rows = self.db.query("""
        SELECT
            autnums.number AS number,
            COALESCE(
                (SELECT overrides.name FROM autnum_overrides overrides
                    WHERE overrides.number = autnums.number),
                autnums.name
            ) AS name
            FROM autnums
            WHERE name <> %s ORDER BY number
        """, "")

    for row in rows:
        a = writer.add_as(row.number)
        a.name = row.name

    # Add all networks
    log.info("Writing networks...")

    # Select all known networks. For every announcement the most
    # specific matching entry from "networks" supplies the country.
    # Each flag prefers the most specific network override and falls
    # back to the override of the announcing AS.
    rows = self.db.query("""
        SELECT
            DISTINCT ON (announcements.network)
            announcements.network AS network,
            announcements.autnum AS autnum,
            networks.country AS country,

            -- Must be part of returned values for ORDER BY clause
            masklen(networks.network) AS sort,

            -- Flags
            COALESCE(
                (
                    SELECT is_anonymous_proxy FROM network_overrides overrides
                        WHERE announcements.network <<= overrides.network
                        ORDER BY masklen(overrides.network) DESC
                        LIMIT 1
                ),
                (
                    SELECT is_anonymous_proxy FROM autnum_overrides overrides
                        WHERE announcements.autnum = overrides.number
                )
            ) AS is_anonymous_proxy,
            COALESCE(
                (
                    SELECT is_satellite_provider FROM network_overrides overrides
                        WHERE announcements.network <<= overrides.network
                        ORDER BY masklen(overrides.network) DESC
                        LIMIT 1
                ),
                (
                    SELECT is_satellite_provider FROM autnum_overrides overrides
                        WHERE announcements.autnum = overrides.number
                )
            ) AS is_satellite_provider,
            COALESCE(
                (
                    SELECT is_anycast FROM network_overrides overrides
                        WHERE announcements.network <<= overrides.network
                        ORDER BY masklen(overrides.network) DESC
                        LIMIT 1
                ),
                (
                    SELECT is_anycast FROM autnum_overrides overrides
                        WHERE announcements.autnum = overrides.number
                )
            ) AS is_anycast
        FROM announcements
            LEFT JOIN networks ON announcements.network <<= networks.network
        ORDER BY announcements.network, sort DESC
    """)

    for row in rows:
        network = writer.add_network(row.network)

        # Save AS & country
        network.asn, network.country_code = row.autnum, row.country

        # Set flags
        if row.is_anonymous_proxy:
            network.set_flag(location.NETWORK_FLAG_ANONYMOUS_PROXY)

        if row.is_satellite_provider:
            network.set_flag(location.NETWORK_FLAG_SATELLITE_PROVIDER)

        if row.is_anycast:
            network.set_flag(location.NETWORK_FLAG_ANYCAST)

    # Write everything to file
    log.info("Writing database to file...")
    for path in ns.file:
        writer.write(path)
def handle_update_whois(self, ns):
    """
    Download all WHOIS and extended sources and import them.

    WHOIS sources are read block by block into two temporary tables
    (_autnums and _organizations) which are then merged into
    "autnums". Extended sources are read line by line, one database
    transaction per source.
    """
    downloader = location.importer.Downloader()

    # Download all sources
    with self.db.transaction():
        # Create some temporary tables to store parsed data.
        # _autnums.number is bigint like autnums.number, so that AS
        # numbers above 2^31 - 1 cannot overflow the staging table.
        self.db.execute("""
            CREATE TEMPORARY TABLE _autnums(number bigint, organization text)
                ON COMMIT DROP;
            CREATE UNIQUE INDEX _autnums_number ON _autnums(number);

            CREATE TEMPORARY TABLE _organizations(handle text, name text)
                ON COMMIT DROP;
            CREATE UNIQUE INDEX _organizations_handle ON _organizations(handle);
        """)

        for source in location.importer.WHOIS_SOURCES:
            with downloader.request(source, return_blocks=True) as f:
                for block in f:
                    self._parse_block(block)

        # autnums.name is declared NOT NULL, so only rows that resolve
        # to an organisation with a name may be merged. A single NULL
        # would otherwise abort the whole transaction.
        self.db.execute("""
            INSERT INTO autnums(number, name)
                SELECT _autnums.number, _organizations.name FROM _autnums
                    JOIN _organizations ON _autnums.organization = _organizations.handle
                    WHERE _organizations.name IS NOT NULL
            ON CONFLICT (number) DO UPDATE SET name = excluded.name;
        """)

    # Download all extended sources
    for source in location.importer.EXTENDED_SOURCES:
        with self.db.transaction():
            # Download data
            with downloader.request(source) as f:
                for line in f:
                    self._parse_line(line)
def _parse_block(self, block):
    """
    Dispatch one WHOIS block to the parser for its object type.

    block is a sequence of lines; the first line decides the type.
    Blocks that are empty or of any other type are ignored and None
    is returned.
    """
    # An empty block has no first line to inspect
    if not block:
        return

    # Get first line to find out what type of block this is
    line = block[0]

    # aut-num
    if line.startswith("aut-num:"):
        return self._parse_autnum_block(block)

    # organisation
    if line.startswith("organisation:"):
        return self._parse_org_block(block)
def _parse_autnum_block(self, block):
    """
    Store the AS number and organisation handle of an aut-num block.

    The number is taken from the "aut-num" line (an "AS"/"as" prefix
    followed by digits) and the handle from the "org" line. The pair
    is upserted into the temporary _autnums table.
    """
    autnum = {}
    for line in block:
        # Split line
        key, val = split_line(line)

        if key == "aut-num":
            m = re.match(r"^(AS|as)(\d+)", val)
            if m:
                autnum["asn"] = m.group(2)

        elif key == "org":
            autnum[key] = val

    # Skip objects without a usable AS number; inserting them would
    # only create a row with a NULL number
    if "asn" not in autnum:
        return

    # Insert into database
    self.db.execute("""
        INSERT INTO _autnums(number, organization)
            VALUES(%s, %s) ON CONFLICT (number) DO UPDATE SET
            organization = excluded.organization""",
        autnum["asn"], autnum.get("org"),
    )
def _parse_org_block(self, block):
    """
    Store the handle and name of an organisation block.

    Only the "organisation" (handle) and "org-name" lines are used.
    The pair is upserted into the temporary _organizations table.
    """
    org = {}
    for line in block:
        # Split line
        key, val = split_line(line)

        if key in ("organisation", "org-name"):
            org[key] = val

    # Skip objects without a handle; nothing could ever join on them
    if not org.get("organisation"):
        return

    self.db.execute("""
        INSERT INTO _organizations(handle, name)
            VALUES(%s, %s) ON CONFLICT (handle) DO
            UPDATE SET name = excluded.name""",
        org.get("organisation"), org.get("org-name"),
    )
def _parse_line(self, line):
    """
    Parse one line of an extended source.

    Lines have the form "registry|country|type|rest". Version lines
    (starting with "2"), comments and statistics lines (country "*")
    are skipped. "ipv4" and "ipv6" records are handed to
    _parse_ip_line together with the country code; every other type
    is ignored.
    """
    # Skip version line
    if line.startswith("2"):
        return

    # Skip comments
    if line.startswith("#"):
        return

    # Unpacking fails with ValueError if there are fewer than four fields
    try:
        registry, country_code, record_type, rest = line.split("|", 3)
    except ValueError:
        log.warning("Could not parse line: %s" % line)
        return

    # Skip any lines that are for stats only
    if country_code == "*":
        return

    if record_type in ("ipv6", "ipv4"):
        return self._parse_ip_line(country_code, record_type, rest)
def _parse_ip_line(self, country, type, line):
    """
    Import one IPv4/IPv6 record of an extended source.

    line is the remainder of the record after the type column:
    "address|prefix|date|status" with an optional fifth organisation
    field. Only "assigned" and "allocated" records are stored; they
    are upserted into "networks" together with country.

    For "ipv4" the prefix column is treated as a number of addresses
    and converted into a prefix length; for any other type it is used
    as the prefix length directly.
    """
    fields = line.split("|")

    # Four fields, optionally followed by the organisation
    if len(fields) not in (4, 5):
        log.warning("Unhandled line format: %s" % line)
        return

    address, prefix, date, status = fields[:4]

    # Skip anything that isn't properly assigned
    if status not in ("assigned", "allocated"):
        return

    # Cast prefix into an integer
    try:
        prefix = int(prefix)
    except ValueError:
        log.warning("Invalid prefix: %s" % prefix)
        return

    # Fix prefix length for IPv4
    if type == "ipv4":
        # A count of zero or less has no logarithm
        if prefix <= 0:
            log.warning("Invalid prefix: %s" % prefix)
            return

        # bit_length() - 1 is floor(log2(n)) in exact integer arithmetic
        prefix = 32 - (prefix.bit_length() - 1)

    # Try to parse the address
    try:
        network = ipaddress.ip_network("%s/%s" % (address, prefix), strict=False)
    except ValueError:
        log.warning("Invalid IP address: %s" % address)
        return

    self.db.execute("""
        INSERT INTO networks(network, country)
            VALUES(%s, %s) ON CONFLICT (network) DO
            UPDATE SET country = excluded.country""",
        "%s" % network, country,
    )
def handle_update_announcements(self, ns):
    """
    Fetch the BGP table from a route server and update "announcements".

    Connects via telnet to the first entry of ns.server, dumps the
    IPv6 and IPv4 unicast tables and upserts every route it can parse
    (network and the AS number in front of the trailing "i"). After
    that, default routes, non-global address space, too specific
    prefixes, reserved AS numbers and entries not seen for 14 days are
    deleted. Everything happens in one database transaction.
    """
    server = ns.server[0]

    # Pre-compile regular expression for routes. This is a raw bytes
    # literal so that the backslashes reach the regex engine unchanged
    # instead of being invalid string escape sequences.
    route = re.compile(rb"^\*[\s\>]i([^\s]+).+?(\d+)\si\r\n", re.MULTILINE | re.DOTALL)

    with telnetlib.Telnet(server) as t:
        # Wait for console greeting
        greeting = t.read_until(b"> ")
        log.debug(greeting.decode())

        # Disable pagination
        t.write(b"terminal length 0\n")

        # Wait for the prompt to return
        t.read_until(b"> ")

        # Fetch the routing tables
        with self.db.transaction():
            for protocol in ("ipv6", "ipv4"):
                log.info("Requesting %s routing table" % protocol)

                # Request the full unicast routing table
                t.write(b"show bgp %s unicast\n" % protocol.encode())

                # Read entire header which ends with "Path"
                t.read_until(b"Path\r\n")

                while True:
                    # Try reading a full entry
                    # Those might be broken across multiple lines but ends with i
                    line = t.read_until(b"i\r\n", timeout=5)

                    # Nothing arrived before the timeout: the table is done
                    if not line:
                        break

                    # Try finding a route in here
                    m = route.match(line)
                    if not m:
                        continue

                    network, autnum = m.groups()

                    # Convert network to string
                    network = network.decode()

                    # Append /24 for IPv4 addresses
                    # NOTE(review): this assumes every IPv4 route printed
                    # without a mask is a /24 - confirm against the route
                    # server's output format.
                    if "/" not in network and ":" not in network:
                        network = "%s/24" % network

                    # Convert AS number to integer
                    autnum = int(autnum)

                    log.info("Found announcement for %s by %s" % (network, autnum))

                    self.db.execute("""
                        INSERT INTO announcements(network, autnum)
                            VALUES(%s, %s) ON CONFLICT (network) DO
                            UPDATE SET autnum = excluded.autnum, last_seen_at = CURRENT_TIMESTAMP""",
                        network, autnum,
                    )

                log.info("Finished reading the %s routing table" % protocol)

            # Purge anything we never want here
            self.db.execute("""
                -- Delete default routes
                DELETE FROM announcements WHERE network = '::/0' OR network = '0.0.0.0/0';

                -- Delete anything that is not global unicast address space
                DELETE FROM announcements WHERE family(network) = 6 AND NOT network <<= '2000::/3';

                -- DELETE "current network" address space
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '0.0.0.0/8';

                -- DELETE local loopback address space
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '127.0.0.0/8';

                -- DELETE RFC 1918 address space
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '10.0.0.0/8';
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '172.16.0.0/12';
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '192.168.0.0/16';

                -- DELETE test, benchmark and documentation address space
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '192.0.0.0/24';
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '192.0.2.0/24';
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '198.18.0.0/15';
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '198.51.100.0/24';
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '203.0.113.0/24';

                -- DELETE CGNAT address space (RFC 6598)
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '100.64.0.0/10';

                -- DELETE link local address space
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '169.254.0.0/16';

                -- DELETE IPv6 to IPv4 (6to4) address space
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '192.88.99.0/24';

                -- DELETE multicast and reserved address space
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '224.0.0.0/4';
                DELETE FROM announcements WHERE family(network) = 4 AND network <<= '240.0.0.0/4';

                -- Delete networks that are too small to be in the global routing table
                DELETE FROM announcements WHERE family(network) = 6 AND masklen(network) > 48;
                DELETE FROM announcements WHERE family(network) = 4 AND masklen(network) > 24;

                -- Delete any non-public or reserved ASNs
                DELETE FROM announcements WHERE NOT (
                    (autnum >= 1 AND autnum <= 23455)
                    OR
                    (autnum >= 23457 AND autnum <= 64495)
                    OR
                    (autnum >= 131072 AND autnum <= 4199999999)
                );

                -- Delete everything that we have not seen for 14 days
                DELETE FROM announcements WHERE last_seen_at <= CURRENT_TIMESTAMP - INTERVAL '14 days';
            """)
def handle_update_overrides(self, ns):
    """
    Replace all overrides with the content of the given files.

    Both override tables are truncated and then refilled from every
    file in ns.files, all inside one transaction. "net" blocks go to
    network_overrides and "autnum" blocks to autnum_overrides; blocks
    with invalid values or of any other type are logged and skipped.
    """
    with self.db.transaction():
        # Drop all data that we have
        self.db.execute("""
            TRUNCATE TABLE autnum_overrides;
            TRUNCATE TABLE network_overrides;
        """)

        for path in ns.files:
            log.info("Reading %s..." % path)

            with open(path, "rb") as f:
                for kind, block in location.importer.read_blocks(f):
                    if kind == "net":
                        network = block.get("net")

                        # Try to parse and normalise the network
                        try:
                            network = ipaddress.ip_network(network, strict=False)
                        except ValueError as e:
                            log.warning("Invalid IP network: %s: %s" % (network, e))
                            continue

                        self.db.execute("""
                            INSERT INTO network_overrides(
                                network,
                                country,
                                is_anonymous_proxy,
                                is_satellite_provider,
                                is_anycast
                            ) VALUES (%s, %s, %s, %s, %s)
                            ON CONFLICT (network) DO NOTHING""",
                            "%s" % network,
                            block.get("country"),
                            block.get("is-anonymous-proxy") == "yes",
                            block.get("is-satellite-provider") == "yes",
                            block.get("is-anycast") == "yes",
                        )

                    elif kind == "autnum":
                        autnum = block.get("autnum")

                        # Check if AS number begins with "AS"
                        if not autnum or not autnum.startswith("AS"):
                            log.warning("Invalid AS number: %s" % autnum)
                            continue

                        # Strip "AS" and make sure a number is left. A
                        # bad value must not reach the database, where
                        # it would abort the transaction after the
                        # tables were already truncated.
                        try:
                            number = int(autnum[2:])
                        except ValueError:
                            log.warning("Invalid AS number: %s" % autnum)
                            continue

                        self.db.execute("""
                            INSERT INTO autnum_overrides(
                                number,
                                name,
                                is_anonymous_proxy,
                                is_satellite_provider,
                                is_anycast
                            ) VALUES(%s, %s, %s, %s, %s)
                            ON CONFLICT DO NOTHING""",
                            number, block.get("name"),
                            block.get("is-anonymous-proxy") == "yes",
                            block.get("is-satellite-provider") == "yes",
                            block.get("is-anycast") == "yes",
                        )

                    else:
                        log.warning("Unsupport type: %s" % kind)
def split_line(line):
    """
    Split a "key: value" line at the first colon.

    Returns a (key, value) tuple with surrounding whitespace removed
    from both parts. If the line contains no colon, the whole line is
    the key and the value is an empty string.
    """
    key, colon, val = line.partition(":")

    # Strip any excess space
    return key.strip(), val.strip()
647 # Run the command line interface