Changeset 1958 in products for quintagroup.seoptimizer/branches/refactoring2.3.0/quintagroup/seoptimizer/browser/keywords.py
- Timestamp: Mar 19, 2010 2:59:57 PM (14 years ago)
- File: 1 edited
Legend:
- Unmodified
- Added
- Removed
-
quintagroup.seoptimizer/branches/refactoring2.3.0/quintagroup/seoptimizer/browser/keywords.py
r1918 r1958
    1       import urllib, re, os, commands
    2       from xml.dom import minidom,Node
          1 import re, commands
          2 from xml.dom import Node
    3     3
    4     4 from zope.interface import implements
    …     …
   51    51                 mapping={'result':'\n'.join(result)}),
   52    52                 context=self.context)
   53
   54           def walkTextNodes(self, parent, page_words=[]):
   55               for node in parent.childNodes:
   56                   if node.nodeType == Node.ELEMENT_NODE:
   57                       self.walkTextNodes(node, page_words)
   58                   elif node.nodeType == Node.TEXT_NODE:
   59                       value = node.nodeValue
   60                       if value is not None:
   61                           page_words.extend(map(lambda x: x.lower(), value.split()))
   62
   63           def strip_tags(self, in_text):
   64               s_list = list(in_text)
   65               i,j = 0,0
   66
   67               while i < len(s_list):
   68                   if s_list[i] == '<':
   69                       while s_list[i] != '>':
   70                           # pop everything from the the left-angle bracket until the right-angle bracket
   71                           s_list.pop(i)
   72
   73                       # pops the right-angle bracket, too
   74                       s_list.pop(i)
   75                   else:
   76                       i=i+1
   77
   78               # convert the list back into text
   79               join_char=''
   80               return join_char.join(s_list)
Note: See TracChangeset for help on using the changeset viewer.