Last change
on this file since 3665 was
3152,
checked in by zidane, 13 years ago
|
fixes pep8
|
-
Property svn:eol-style set to
native
|
File size:
619 bytes
|
Line | |
---|
1 | from xml.parsers.expat import ParserCreate |
---|
2 | import re |
---|
3 | |
---|
4 | |
---|
def parse(data):
    """Parse an XML document and collect its start tags and text content.

    Args:
        data: The XML document, handed to expat in a single ``Parse`` call.

    Returns:
        A dict with three keys:

        * ``'start'`` -- maps each element name to the attributes of the
          most recent start tag seen with that name.
        * ``'end'`` -- always an empty list; no end-tag information is
          recorded (the key is kept so the result shape stays stable).
        * ``'data'`` -- one entry per run of character data found between
          two tags, with surrounding whitespace stripped.  Runs that
          consist only of whitespace are skipped.

    Raises:
        xml.parsers.expat.ExpatError: if expat rejects the document.
    """
    parsed_xml = {'start': {}, 'end': [], 'data': []}
    # expat may report a single text node through several callbacks (it
    # splits at entity references such as ``&amp;`` and at newlines), so
    # chunks are buffered here and joined at the next tag boundary.
    pending = []

    def flush_text():
        text = ''.join(pending).strip()
        del pending[:]
        if text:
            parsed_xml['data'].append(text)

    def start_el(name, attrs):
        flush_text()
        parsed_xml['start'][name] = attrs

    def end_el(name):
        flush_text()

    def char_handler(chunk):
        pending.append(chunk)

    parser = ParserCreate()
    parser.StartElementHandler = start_el
    parser.EndElementHandler = end_el
    parser.CharacterDataHandler = char_handler
    parser.Parse(data)
    # Pick up any text that was delivered after the last tag boundary.
    flush_text()
    return parsed_xml
---|
20 | |
---|
21 | |
---|
def hasURL(xml, url):
    """Tell whether ``url`` is one of the text entries found in ``xml``.

    The document is run through ``parse`` and ``url`` is compared for
    exact equality against each item of the resulting ``'data'`` list.

    Args:
        xml: The XML document (e.g. a sitemap) to inspect.
        url: The text value to look for.

    Returns:
        ``True`` if ``url`` equals one of the collected text entries,
        ``False`` otherwise.
    """
    text_entries = parse(xml)['data']
    return url in text_entries
---|
Note: See
TracBrowser
for help on using the repository browser.