>>> import urllib2 >>> import urllib >>> p = urllib2.urlopen("http://www.google.com") >>> p> >>> c = p.read() >>> dir(p) ['__doc__', '__init__', '__iter__', '__module__', '__repr__', 'close', 'code', 'fileno', 'fp', 'getcode', 'geturl', 'headers', 'info', 'msg', 'next', 'read', 'readline', 'readlines', 'url'] >>> p.url 'http://www.google.co.jp/?gfe_rd=cr&ei=MtZkWNDXDYSL8QeD46cY' >>> p.headers >>> p.headers.items() [('x-xss-protection', '1; mode=block'), ('set-cookie', 'NID=93=O65u9flBWzM92U9MzcezfIXaeG9itO-ala3ogt6T7fipovY5ily4QBNUxbUbsVga_hYeJEKWDq891mFaPgZm2Ya_1gvUZm37K2pNfFpOUVxCptVtOSAn3OXvUHCzKBaC; expires=Fri, 30-Jun-2017 09:24:02 GMT; path=/; domain=.google.co.jp; HttpOnly'), ('accept-ranges', 'none'), ('expires', '-1'), ('vary', 'Accept-Encoding'), ('server', 'gws'), ('connection', 'close'), ('cache-control', 'private, max-age=0'), ('date', 'Thu, 29 Dec 2016 09:24:02 GMT'), ('p3p', 'CP="This is not a P3P policy! See https://www.google.com/support/accounts/answer/151657?hl=en for more info."'), ('content-type', 'text/html; charset=Shift_JIS'), ('x-frame-options', 'SAMEORIGIN')] >>> p.headers['content-type'] 'text/html; charset=Shift_JIS'
>>> s = = urllib2.urlopen("http://www.example.com") SyntaxError: invalid syntax >>> s = urllib2.urlopen("http://www.example.com") >>> s.url 'http://www.example.com' >>> s.headers.items() [('content-length', '1270'), ('x-ec-custom-error', '1'), ('x-cache', 'HIT'), ('expires', 'Thu, 05 Jan 2017 09:28:12 GMT'), ('vary', 'Accept-Encoding'), ('server', 'ECS (rhv/818F)'), ('last-modified', 'Fri, 09 Aug 2013 23:54:35 GMT'), ('connection', 'close'), ('etag', '"359670651+gzip+ident"'), ('cache-control', 'max-age=604800'), ('date', 'Thu, 29 Dec 2016 09:28:12 GMT'), ('content-type', 'text/html')]
parsing xml
from xml.dom import minidom
json
>>> import json >>> j = '{"one": 1, "numbers": [1,2,3.5]}' >>> json.loads(j) {u'numbers': [1, 2, 3.5], u'one': 1}
def total_ups(front_json=None):
    """Return the sum of the 'ups' counts of every child in a listing.

    Args:
        front_json: JSON text shaped like
            {"data": {"children": [{"data": {"ups": <number>}}, ...]}}.
            When omitted, the module-level ``reddit_front`` string is used.

    Returns:
        The total of all ``c['data']['ups']`` values (0 when there are no
        children).

    Raises:
        ValueError: if the text is not valid JSON.
        KeyError: if an expected key is missing from the decoded document.
    """
    if front_json is None:
        # Looked up lazily so the default keeps using the module-level value.
        front_json = reddit_front
    j = json.loads(front_json)
    # The sum has to be returned; without `return` the function yields None.
    return sum(c['data']['ups'] for c in j['data']['children'])
host ip info
host ip info
IP_URL = "http://api.hostip.info/?ip="


def get_coords(ip):
    """Look up the coordinates reported for an IP address.

    Fetches ``IP_URL + ip``, parses the response as XML and reads the text of
    the first ``gml:coordinates`` element, which is split on ',' into
    longitude and latitude (in that order).

    Args:
        ip: the IP address as a string; it is appended to ``IP_URL`` as-is.

    Returns:
        ``db.GeoPt(lat, lon)`` when coordinates are present, otherwise None
        (fetch failed, empty response, or no coordinates in the document).
    """
    # Imported locally so the function does not depend on a module-level
    # minidom import being present and correct.
    from xml.dom import minidom

    url = IP_URL + ip
    content = None
    try:
        content = urllib2.urlopen(url).read()
    except urllib2.URLError:
        # Best effort: a failed lookup simply yields no coordinates.
        return

    if content:
        d = minidom.parseString(content)
        # The minidom method is getElementsByTagName (plural).
        coords = d.getElementsByTagName("gml:coordinates")
        # Guard against an element that exists but has no text node.
        if coords and coords[0].childNodes and coords[0].childNodes[0].nodeValue:
            lon, lat = coords[0].childNodes[0].nodeValue.split(',')
            # NOTE(review): assumes `db` is google.appengine.ext.db, whose
            # geographic point type is GeoPt(lat, lon) -- confirm.
            return db.GeoPt(lat, lon)
Gmap
# NOTE(review): empty in these notes; presumably meant to hold the static-map
# base URL (ending in '?' or '&') that the markers are appended to -- confirm.
GMAPS_URL = ""


def gmap_img(points):
    """Build a map image URL with one marker per point.

    Args:
        points: iterable of objects exposing ``lat`` and ``lon`` attributes.

    Returns:
        ``GMAPS_URL`` followed by ``markers=<lat>,<lon>`` pairs joined
        with '&' (just ``GMAPS_URL`` when ``points`` is empty).
    """
    # The query key is "markers"; the misspelled "makers" would not be
    # recognised as a marker parameter.
    markers = '&'.join('markers=%s,%s' % (p.lat, p.lon) for p in points)
    return GMAPS_URL + markers


if __name__ == "__main__":
    # Demo call; uses the function's actual name (gmap_img).
    # NOTE(review): `Point` is not defined in this snippet -- presumably an
    # object with lat/lon attributes defined elsewhere; confirm.
    print(gmap_img([Point]))