"""
Parse a WHOIS research dump and write out (just) the RPKI-relevant
fields in myrpki-format CSV syntax.

Unfortunately, unlike the ARIN and APNIC databases, the RIPE database
doesn't really have any useful concept of an organizational handle.
More precisely, while it has handles out the wazoo, none of them are
useful as a reliable grouping mechanism for tracking which set of
resources are held by a particular organization.  So, instead of being
able to track all of an organization's resources with a single handle
as we can in the ARIN and APNIC databases, the best we can do with the
RIPE database is to track individual resources, each with its own
resource handle.  Well, for prefixes -- ASN entries behave more like
in the ARIN and APNIC databases.

Feh.

NB: The input data for this script is publicly available via FTP, but
you'll have to fetch the data from RIPE yourself, and be sure to see
the terms and conditions referenced by the data file header comments.

$Id$

Copyright (C) 2009-2012  Internet Systems Consortium ("ISC")

Permission to use, copy, modify, and distribute this software for any
purpose with or without fee is hereby granted, provided that the above
copyright notice and this permission notice appear in all copies.

THE SOFTWARE IS PROVIDED "AS IS" AND ISC DISCLAIMS ALL WARRANTIES WITH
REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
MERCHANTABILITY AND FITNESS.  IN NO EVENT SHALL ISC BE LIABLE FOR ANY
SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
"""

import gzip

from rpki.csv_utils import csv_writer


class Handle(dict):
    """
    One database object, stored as a mapping from tag name to value.

    Subclasses list the tags they care about in want_tags; every other
    tag offered to set() is dropped.  The first entry of want_tags is
    also the tag that identifies the object type (see main.types).
    """

    # Tags to retain; overridden by each subclass.
    want_tags = ()

    # Acceptable "status" values, spelled the way set() stores them
    # (i.e. with all spaces removed).
    want_status = ("ASSIGNED", "ASSIGNEDPA", "ASSIGNEDPI")

    # When true, check() prints every complete object it sees.
    debug = False

    def set(self, tag, val):
        """
        Record val under tag if tag is one we want, with every space
        character removed from the value.
        """
        if tag in self.want_tags:
            self[tag] = val.replace(" ", "")

    def check(self):
        """
        Return True if every wanted tag has been seen, False otherwise.
        Complete objects are logged when debugging is enabled.
        """
        if not all(tag in self for tag in self.want_tags):
            return False
        if self.debug:
            self.log()
        return True

    def __repr__(self):
        fields = " ".join("%s:%s" % (tag, self.get(tag, "?"))
                          for tag in self.want_tags)
        return "<%s %s>" % (self.__class__.__name__, fields)

    def log(self):
        """
        Print this object's repr() to standard output.
        """
        # Parenthesised single argument: prints the same under the
        # Python 2 print statement and the Python 3 print function.
        print(repr(self))

    def finish(self, ctx):
        """
        Called once the whole object has been read.  The base class
        only runs check(); subclasses write a CSV row to ctx.
        """
        self.check()


class aut_num(Handle):
    """
    An aut-num object; written to ctx.asns as (mnt-by, aut-num).
    """

    want_tags = ("aut-num", "mnt-by")  # "as-name" is not collected

    def set(self, tag, val):
        """
        As Handle.set(), but drop a leading "AS" from the aut-num value
        so that only the number itself is stored.
        """
        if tag == "aut-num" and val.startswith("AS"):
            val = val[2:]
        Handle.set(self, tag, val)

    def finish(self, ctx):
        """
        Write the (mnt-by, aut-num) row if the object is complete.
        """
        if self.check():
            ctx.asns.writerow((self["mnt-by"], self["aut-num"]))


class inetnum(Handle):
    """
    An inetnum object; written to ctx.prefixes as (netname, inetnum)
    when its status is one of want_status.
    """

    want_tags = ("inetnum", "netname", "status")  # "mnt-by" is not collected

    def finish(self, ctx):
        """
        Write the (netname, inetnum) row if the object is complete and
        has an acceptable status.
        """
        if self.check() and self["status"] in self.want_status:
            ctx.prefixes.writerow((self["netname"], self["inetnum"]))


class inet6num(Handle):
    """
    An inet6num object; written to ctx.prefixes as (netname, inet6num)
    when its status is one of want_status.
    """

    want_tags = ("inet6num", "netname", "status")  # "mnt-by" is not collected

    def finish(self, ctx):
        """
        Write the (netname, inet6num) row if the object is complete and
        has an acceptable status.
        """
        if self.check() and self["status"] in self.want_status:
            ctx.prefixes.writerow((self["netname"], self["inet6num"]))


class main(object):
    """
    Script driver: instantiating this class reads each file named in
    filenames from the current directory and writes asns.csv and
    prefixes.csv.
    """

    # Map from the tag that opens an object to the class that handles it.
    types = dict((x.want_tags[0], x) for x in (aut_num, inetnum, inet6num))

    filenames = ("ripe.db.aut-num.gz",
                 "ripe.db.inet6num.gz",
                 "ripe.db.inetnum.gz")

    def finish_statement(self, done):
        """
        Process the "tag: value" statement accumulated in
        self.statement, if any.  When done is true the current object
        has ended: hand it to its finish() method and get ready for the
        next object.

        self.cur is None between objects, False while skipping an
        object whose first tag is not in types, and a Handle otherwise.
        """
        if self.statement:
            tag, sep, val = self.statement.partition(":")
            assert sep, "Couldn't find separator in %r" % self.statement
            tag = tag.strip().lower()
            val = val.strip().upper()
            if self.cur is None:
                # First statement of a new object decides its type.
                self.cur = self.types[tag]() if tag in self.types else False
            if self.cur is not False:
                self.cur.set(tag, val)
        if done:
            if self.cur:
                self.cur.finish(self)
            # Always forget the finished object, including the False
            # "skip this object" marker; otherwise one unrecognised
            # object would cause every later object in the same file
            # to be skipped as well.
            self.cur = None

    def __init__(self):
        self.asns = csv_writer("asns.csv")
        self.prefixes = csv_writer("prefixes.csv")
        # NOTE(review): the string handling below relies on gzip.open()
        # yielding str lines as it does under Python 2; a Python 3 port
        # would need a text-mode open -- confirm before porting.
        for fn in self.filenames:
            f = gzip.open(fn)
            try:
                self.statement = ""
                self.cur = None
                for line in f:
                    # Drop everything from "#" to end of line, and the newline.
                    line = line.expandtabs().partition("#")[0].rstrip("\n")
                    if line and not line[0].isalpha():
                        # Continuation of the current statement; a
                        # leading "+" marker is not part of the value.
                        self.statement += line[1:] if line[0] == "+" else line
                    else:
                        # A new statement starts here, or (empty line)
                        # the current object has ended.
                        self.finish_statement(not line)
                        self.statement = line
                self.finish_statement(True)
            finally:
                # Release the input file even if parsing blew up.
                f.close()
        # The writers are closed only on the success path, exactly as
        # before.
        self.asns.close()
        self.prefixes.close()


main()