star4knight
#!/usr/bin/env python
# -*- encoding=utf8 -*-

import urllib
import sys
import re

def print_usage():
    print "ips usage:"
    print "\tips xx.xx.xx.xx"
    

def locate_ip(ip):
    req = urllib.urlopen("http://www.ip138.com/ips1388.asp?ip=%s&action=2"%ip)
    lines = req.readlines()
    for line in lines:
	line = unicode(line,\'gb2312\')
	# query succeed
	if line.strip().find(\'<td align="center"><ul class="ul1"><li>\') != -1 :
	    idx = line.find(\'<td align="center"><ul class="ul1"><li>\')
	    #TODO replace this dirty handle
	    print line[idx:].replace(\'</li><li>\',"\n").replace(\'<td align="center"><ul class="ul1"><li>\',\'\').replace(\'</li></ul></td>\',\'\').strip()
	# query fail
	if line.strip().find(\'<td align="center"><h1>\') != -1:
	    idx = line.find(\'<td align="center"><h1>\') 
	    #TODO replace this dirty handle
	    print line[idx:].replace(\'<br/><br/></td>\',\'\').replace(\'</h1>\',\' \').replace(\'<td align="center"><h1>\',\'\')

if __name__ == "__main__":
    #print sys.argv
    if len(sys.argv) == 2:
	ip = sys.argv[1]
	pat = re.compile("^\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}$")
	if pat.match(ip):
	    print "ip is : " ,ip
	    locate_ip(ip)
    else:
	print_usage()

  

分类:

技术点:

相关文章: