from xml.parsers.expat import ParserCreate
import re

# Matches any non-whitespace character; used to drop whitespace-only text.
_NON_WHITESPACE = re.compile(r'\S', re.UNICODE)


def parse(data):
    """Parse an XML document with expat and summarise its contents.

    Args:
        data: The XML document, passed unchanged to the expat parser's
            ``Parse`` method.

    Returns:
        A dict with three keys:

        * ``'start'`` -- maps each element name to the attribute dict of
          the last start tag seen with that name.
        * ``'end'`` -- always an empty list; kept so the shape of the
          result does not change for existing callers.
        * ``'data'`` -- the text runs found between tags, in document
          order, with surrounding whitespace stripped and whitespace-only
          runs omitted.

    Raises:
        xml.parsers.expat.ExpatError: If expat rejects the input.
    """
    parsed = {'start': {}, 'end': [], 'data': []}
    pending = []  # fragments of the text run currently being read

    def flush_text():
        # expat may hand over one run of text in several pieces (it splits
        # at entity references such as &amp; and at line breaks), so the
        # pieces are joined here before being recorded as a single entry.
        text = ''.join(pending)
        del pending[:]
        if _NON_WHITESPACE.search(text):
            parsed['data'].append(text.strip())

    def start_el(name, attrs):
        flush_text()
        parsed['start'][name] = attrs

    def end_el(name):
        # Only needed as a text boundary; end tags are not recorded.
        flush_text()

    def char_handler(chunk):
        pending.append(chunk)

    parser = ParserCreate()
    parser.StartElementHandler = start_el
    parser.EndElementHandler = end_el
    parser.CharacterDataHandler = char_handler
    # Deliberately not marked as the final chunk: this keeps the parser
    # lenient towards empty or truncated input, which would otherwise raise.
    parser.Parse(data)
    flush_text()  # text left over when the document stops before a tag
    return parsed


def hasURL(xml, url):
    """Return True if *url* is one of the text entries in the XML document.

    Args:
        xml: The XML document (for example a sitemap) to search.
        url: The URL to look for. It is compared for exact equality against
            each whitespace-stripped text run returned by ``parse``.

    Returns:
        True if some text run equals *url*, otherwise False.
    """
    return url in parse(xml)['data']