diff options
author | Rob Austein <sra@hactrn.net> | 2012-05-02 21:18:08 +0000 |
---|---|---|
committer | Rob Austein <sra@hactrn.net> | 2012-05-02 21:18:08 +0000 |
commit | 0bf7f83eadf95a5297468e68983140c606371dc0 (patch) | |
tree | 839e3d4ca0c5559520fd0b4121a128e1ebdc8e10 | |
parent | 85e5f1a75ba64ab905eb66596057fcf362d4910e (diff) |
First cut at hack to dump all relevant IANA data to CSV. Output still
needs to be merged with ERX data from ARIN's database, as IANA only
deals with /8s in IPv4 space. Haven't figured out yet whether that
should be a separate script or not. See #33.
svn path=/branches/tk33/; revision=4460
-rw-r--r-- | scripts/iana-to-csv.py | 64 |
1 files changed, 64 insertions, 0 deletions
diff --git a/scripts/iana-to-csv.py b/scripts/iana-to-csv.py new file mode 100644 index 00000000..dd524d8c --- /dev/null +++ b/scripts/iana-to-csv.py @@ -0,0 +1,64 @@ +""" +Parse IANA XML data. + +$Id$ + +Copyright (C) 2010-2012 Internet Systems Consortium ("ISC") + +Permission to use, copy, modify, and distribute this software for any +purpose with or without fee is hereby granted, provided that the above +copyright notice and this permission notice appear in all copies. + +THE SOFTWARE IS PROVIDED "AS IS" AND ISC DISCLAIMS ALL WARRANTIES WITH +REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY +AND FITNESS. IN NO EVENT SHALL ISC BE LIABLE FOR ANY SPECIAL, DIRECT, +INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM +LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE +OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR +PERFORMANCE OF THIS SOFTWARE. +""" + +import sys +import lxml.etree +from rpki.csv_utils import csv_writer + +def iterate_xml(filename, tag): + return lxml.etree.parse(filename).getroot().getiterator(tag) + +def ns(tag): + return "{http://www.iana.org/assignments}" + tag + +tag_description = ns("description") +tag_designation = ns("designation") +tag_record = ns("record") +tag_number = ns("number") +tag_prefix = ns("prefix") + +handles = {} + +for rir in ("AfriNIC", "APNIC", "ARIN", "LACNIC", "RIPE NCC"): + handles[rir] = handles["Assigned by %s" % rir] = handles["Administered by %s" % rir] = rir.split()[0].upper() + +asns = csv_writer("asns.csv") +prefixes = csv_writer("prefixes.csv") + +for record in iterate_xml("as-numbers.xml", tag_record): + description = record.findtext(tag_description) + if description in handles: + asns.writerow((handles[description], record.findtext(tag_number))) + +for record in iterate_xml("ipv4-address-space.xml", tag_record): + designation = record.findtext(tag_designation) + if designation in handles: + prefix = record.findtext(tag_prefix) + p, l = prefix.split("/") + assert l == "8", "Violated /8 assumption: %r" % prefix + prefixes.writerow((handles[designation], "%d.0.0.0/8" % int(p))) + +for record in iterate_xml("ipv6-unicast-address-assignments.xml", tag_record): + description = record.findtext(tag_description) + if record.findtext(tag_description) in handles: + prefixes.writerow((handles[description], record.findtext(tag_prefix))) + +asns.close() +prefixes.close() |