# -*- coding: UTF-8 -*-
# Script that endlessly re-parses one in-memory document with lxml and runs
# the same XPath query against it, printing a running iteration counter.
from lxml import etree
from StringIO import StringIO

if __name__ == "__main__":
    # NOTE(review): as it appears here the literal contains no XML markup
    # (the tags were possibly lost at some point); etree.fromstring() would
    # presumably reject it as-is -- confirm against the original file.
    document = """ 1-3 2006-03-13 08:44:52 SANTIAGO PUENTE 13/03/2006 Robertin MANZANO 2006-03-10 15:52:29 """

    iteration = 0
    # There is no exit condition: the loop runs until the process is
    # interrupted or one of the calls below raises.
    while True:
        print(iteration)
        iteration += 1

        # Build a fresh element tree from the same string on every pass.
        tree = etree.fromstring(document)

        # Select <link> elements with rel="media" that carry an href.
        media_links = tree.xpath('//link[@rel="media"][@href]')

        # Only the first match is used; an empty result raises IndexError.
        first_link = media_links[0]
        image_url_name = first_link.attrib['href']