view pyikriam/lazy/www/work/find.py @ 246:60c4b4b78a01

code clean
author "Hisn Yi, Chen <ossug.hychen@gmail.com>"
date Mon, 01 Dec 2008 00:25:07 +0800
parents a4c364888197
children
line wrap: on
line source

from lxml import etree
from cStringIO import StringIO

class Finder:

    dom_tree = None
    xpath = None

    def __init__(self, working_product):
        self.working_prodcut = working_product

        self.encoding = 'utf8'
    
    def find(self, express , callback = None):
        
        if self.dom_tree is None:   self.set_dom_tree(self.working_prodcut.content)
 
        xpath = self.dom_tree.xpath(express)
        
        if callback:    return self.callback(xpath)
        return xpath

    def set_dom_tree(self, content):
        stream = StringIO(content)

        parser = etree.HTMLParser(encoding=self.encoding)
        self.dom_tree = etree.parse(stream, parser)