aboutsummaryrefslogtreecommitdiff
path: root/scripts/iana-to-csv.py
diff options
context:
space:
mode:
authorRob Austein <sra@hactrn.net>2012-05-02 21:18:08 +0000
committerRob Austein <sra@hactrn.net>2012-05-02 21:18:08 +0000
commit0bf7f83eadf95a5297468e68983140c606371dc0 (patch)
tree839e3d4ca0c5559520fd0b4121a128e1ebdc8e10 /scripts/iana-to-csv.py
parent85e5f1a75ba64ab905eb66596057fcf362d4910e (diff)
First cut at hack to dump all relevant IANA data to CSV. Output still
needs to be merged with ERX data from ARIN's database, as IANA only deals with /8s in IPv4 space. Haven't figured out yet whether that should be a separate script or not. See #33. svn path=/branches/tk33/; revision=4460
Diffstat (limited to 'scripts/iana-to-csv.py')
-rw-r--r--scripts/iana-to-csv.py64
1 files changed, 64 insertions, 0 deletions
diff --git a/scripts/iana-to-csv.py b/scripts/iana-to-csv.py
new file mode 100644
index 00000000..dd524d8c
--- /dev/null
+++ b/scripts/iana-to-csv.py
@@ -0,0 +1,64 @@
+"""
+Parse IANA XML data.
+
+$Id$
+
+Copyright (C) 2010-2012 Internet Systems Consortium ("ISC")
+
+Permission to use, copy, modify, and distribute this software for any
+purpose with or without fee is hereby granted, provided that the above
+copyright notice and this permission notice appear in all copies.
+
+THE SOFTWARE IS PROVIDED "AS IS" AND ISC DISCLAIMS ALL WARRANTIES WITH
+REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY
+AND FITNESS. IN NO EVENT SHALL ISC BE LIABLE FOR ANY SPECIAL, DIRECT,
+INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM
+LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE
+OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
+PERFORMANCE OF THIS SOFTWARE.
+"""
+
+import sys
+import lxml.etree
+from rpki.csv_utils import csv_writer
+
+def iterate_xml(filename, tag):
+ return lxml.etree.parse(filename).getroot().getiterator(tag)
+
+def ns(tag):
+ return "{http://www.iana.org/assignments}" + tag
+
+tag_description = ns("description")
+tag_designation = ns("designation")
+tag_record = ns("record")
+tag_number = ns("number")
+tag_prefix = ns("prefix")
+
+handles = {}
+
+for rir in ("AfriNIC", "APNIC", "ARIN", "LACNIC", "RIPE NCC"):
+ handles[rir] = handles["Assigned by %s" % rir] = handles["Administered by %s" % rir] = rir.split()[0].upper()
+
+asns = csv_writer("asns.csv")
+prefixes = csv_writer("prefixes.csv")
+
+for record in iterate_xml("as-numbers.xml", tag_record):
+ description = record.findtext(tag_description)
+ if description in handles:
+ asns.writerow((handles[description], record.findtext(tag_number)))
+
+for record in iterate_xml("ipv4-address-space.xml", tag_record):
+ designation = record.findtext(tag_designation)
+ if designation in handles:
+ prefix = record.findtext(tag_prefix)
+ p, l = prefix.split("/")
+ assert l == "8", "Violated /8 assumption: %r" % prefix
+ prefixes.writerow((handles[designation], "%d.0.0.0/8" % int(p)))
+
+for record in iterate_xml("ipv6-unicast-address-assignments.xml", tag_record):
+ description = record.findtext(tag_description)
+ if record.findtext(tag_description) in handles:
+ prefixes.writerow((handles[description], record.findtext(tag_prefix)))
+
+asns.close()
+prefixes.close()