Last change
on this file since 2116 was
1,
checked in by myroslav, 19 years ago
|
Building directory structure
|
-
Property svn:eol-style set to
native
|
File size:
613 bytes
|
Rev | Line | |
---|
[1] | 1 | from xml.parsers.expat import ParserCreate |
---|
| 2 | import re |
---|
| 3 | |
---|
def parse(data):
    """Parse an XML document and collect its element attributes and text.

    expat may report a single run of text through several
    ``CharacterDataHandler`` calls (it always splits at entity references
    such as ``&amp;``).  The fragments are therefore buffered and joined
    at element boundaries, so a value like ``http://e.com/?a=1&amp;b=2``
    is stored as one entry instead of three.

    Args:
        data: The XML document, handed to expat in a single ``Parse`` call.

    Returns:
        A dict with three keys:

        * ``'start'`` -- maps each element name to the attributes of the
          most recently opened element with that name.
        * ``'end'`` -- always an empty list; kept so the shape of the
          result does not change for existing callers.
        * ``'data'`` -- every line of character data that contains at
          least one non-whitespace character, in document order.

    Raises:
        xml.parsers.expat.ExpatError: If expat rejects the document.
    """
    parsed = {'start': {}, 'end': [], 'data': []}
    # Raw string: '\S' in a plain literal is an invalid escape sequence.
    # Compiled once per call rather than once per expat callback.
    non_blank = re.compile(r'\S+', re.UNICODE)
    pending = []  # fragments of the text run currently being read

    def flush_text():
        # Join the buffered fragments and keep the non-blank lines.
        if not pending:
            return
        text = ''.join(pending)
        del pending[:]
        # Splitting on newlines keeps the line-by-line entries this
        # function has always produced for multi-line text.
        parsed['data'].extend(
            line for line in text.split('\n') if non_blank.search(line))

    def start_el(name, attrs):
        flush_text()
        parsed['start'][name] = attrs

    def end_el(name):
        # Registered only so text never runs across a closing tag.
        flush_text()

    def char_handler(chunk):
        pending.append(chunk)

    parser = ParserCreate()
    parser.StartElementHandler = start_el
    parser.EndElementHandler = end_el
    parser.CharacterDataHandler = char_handler
    parser.Parse(data)
    # Text that was not followed by any tag is still buffered here.
    flush_text()
    return parsed
---|
| 19 | |
---|
def hasURL(xml, url):
    """Report whether *url* is one of the text entries found in *xml*.

    The document is run through ``parse`` and *url* is compared for exact
    equality against each entry of the resulting ``'data'`` list.
    """
    return url in parse(xml)['data']
---|
Note: See
TracBrowser
for help on using the repository browser.