将文字转成网页

import sys, re
from handlers import HTMLRenderer
from util import blocks
from rules import rule_list

#将文本转成网页
class Parser:
    
    def __init__(self, handler):
        self.handler = handler
        self.rules = []     
        self.filters = []   

    def addRule(self, rule):
       
        self.rules.append(rule)

    def addFilter(self, pattern, name):
       
        def filter(block, handler):
          
            return re.sub(pattern, handler.sub(name), block)
        self.filters.append(filter)

    def parse(self, file):
       
        self.handler.start('document')
      
        for block in blocks(file):
         
            for filter in self.filters:
                block = filter(block, self.handler)
           
            for rule in self.rules:
              
                if rule.condition(block):
                    last = rule.action(block, self.handler)
                  
                    if last: 
                        break
      
        self.handler.end('document')


class BasicTextParser(Parser):
  

    def __init__(self, handler):
        super().__init__(handler)
        for rule in rule_list:
            self.addRule(rule)
        self.addFilter(r'\*(.+?)\*', 'emphasis')
        self.addFilter(r'(http://[\.a-zA-Z/]+)', 'url')
        self.addFilter(r'([\.a-zA-Z]+@[\.a-zA-Z]+[a-zA-Z]+)', 'mail')


def main():
    handler = HTMLRenderer()
    parser = BasicTextParser(handler)
    parser.parse(sys.stdin)


if __name__ == '__main__':
    main()


    $ cd ~/Code
$ wget http://labfile.oss.aliyuncs.com/courses/70/python_markup.zip
$ unzip python_markup.zip
$ cp unzip python_markup/test.txt .

 

posted @ 2020-05-18 16:52  王者2  阅读(804)  评论(0编辑  收藏  举报