# Import the URL opener from wherever this interpreter provides it.
try:
    from urllib.request import urlopen  # Python 3
except ImportError:
    from urllib import urlopen  # Python 2
def get_page(url):
    """Download *url* and return the page's HTML as text.

    The response is always closed, even if reading fails.  When the
    interpreter hands back bytes (Python 3), they are decoded as UTF-8 with
    undecodable bytes replaced, so that the string searches performed by the
    other helpers work on the result.
    """
    response = urlopen(url)
    try:
        raw = response.read()
    finally:
        response.close()
    # On Python 2 ``str`` is already the byte string, so nothing is decoded.
    if isinstance(raw, bytes) and not isinstance(raw, str):
        raw = raw.decode('utf-8', 'replace')
    return raw


def get_object(objectt, start, end):
    """Return the part of *objectt* from *start* up to (not including) *end*.

    *end* is searched for only after the position where *start* was found,
    so an earlier occurrence of *end* cannot produce an empty result.
    Returns an empty string when either marker is missing.
    """
    start_object = objectt.find(start)
    if start_object == -1:
        return ''
    end_object = objectt.find(end, start_object)
    if end_object == -1:
        return ''
    return objectt[start_object:end_object]


def get_diccionario(page):
    """Build a dict with the 'link', 'name' and 'address' of the first item.

    NOTE(review): the original snippet had this code (ending in ``return``)
    without an enclosing ``def``; the function name is a reconstruction.
    NOTE(review): 'address' is extracted exactly like 'name' in the original,
    which looks like a placeholder -- confirm the intended markers.
    """
    diccionario = {}
    diccionario['link'] = get_object(page, '<a href=', 'itemBox')
    diccionario['name'] = get_object(diccionario['link'], '/es/', '</a>')
    diccionario['address'] = get_object(diccionario['link'], '/es/', '</a>')
    return diccionario


def get_links(page, start='<a href=', end='itemBox'):
    """Return every *start* ... *end* fragment found in *page*, in order.

    *page* is the HTML text (for example the value returned by
    ``get_page``).  Scanning stops at the first *start* marker that has no
    *end* marker after it.
    """
    lst = []
    start_link = page.find(start)
    while start_link != -1:
        end_link = page.find(end, start_link)
        if end_link == -1:
            break
        # NOTE(review): the slice keeps the original ``end_link + 1`` bound,
        # so one character of the end marker is included -- confirm intent.
        lst.append(page[start_link:end_link + 1])
        # Resume at the end marker; always move at least one character
        # forward so the loop cannot stall on the same match.
        start_link = page.find(start, max(end_link, start_link + 1))
    return lst


if __name__ == "__main__":
    # Example run: fetch one listing page and show its first item fragment.
    print(get_object(
        get_page('http://www.1golf.eu/es/campos-de-golf/reino-unido/inglaterra/?offset=160'),
        '<a href=',
        'itemBox',
    ))
Communication is the art of combining information.
Imagination is the mental capacity to picture things.
Categories
All
Hall of Fame
John Conway
Post Archives
January 2024
If you ain't got new ideas, then you need to learn new stuff.
XPRICEShot trends |