squirrel2300

导航

using python to compute production rules

#coding=utf8

import logging
import itertools
import re
import sys

logger = logging.getLogger()
root_format = "[%(filename)s:%(lineno)s \t- %(funcName)-10s() ]: %(message)s"
logging.basicConfig(format=root_format)
logger.setLevel(logging.DEBUG)


branch_production_dict = [["pat1",["<suba1><subb1>","<suba2><subb2>"]],
       ["pat2",["<suba2.1><subb2.1>","<suba2.2><subb2.2>"]],
       ["pat3",["<suba3.1><subb3.1>","<suba3.2><subb3.2>"]]
      ]
leaf_production_dict_0 = {"suba1":['a1.1','a1.2'],
       'subb1':['b1.1','b1.2'],
       'suba2':['a2.1','a2.2'],
       'subb2':['b2.1','b2.2'],
       "suba2.1":['a1.1','a1.2'],
       'subb2.1':['b1.1','b1.2'],
       'suba2.2':['a2.1','a2.2'],
       'subb2.2':['b2.1','b2.2'],
       "suba3.1":['a1.1','a1.2'],
       'subb3.1':['b1.1','b1.2'],
       'suba3.2':['a2.1','a2.2'],
       'subb3.2':['b2.1','b2.2'],
       }
leaf_production_dict = {}
for i in leaf_production_dict_0.keys():
    val = []
    for j in leaf_production_dict_0[i]:
        val.append('<'+i+'>'+'('+j+')')
    leaf_production_dict[i]= val

        

dt3 = {}
dt4 = {}
logging.debug(str(branch_production_dict))

def prod_and_link(list_vec):
    res = []
    for i in itertools.product(*list_vec):
        tmp = list(i)
        one = ""
        for j in tmp:
            one += j
        #print(one)
        res.append(one)
        #print(res)
    return res
for ii in branch_production_dict:
    i=ii[0]
    #sys.stdout.write('for ')
    #print(i)
    logging.debug('for '+str(i))
    val = ii[1]
    ttt = []
    nttt = []
    for j in val:
        tmp_segs = re.split('>|<',j)
        segs=[]
        nt_segs=[]
        for k in tmp_segs:
            if len(k) > 0:
                segs.append(leaf_production_dict[k])
                nt_segs.append(['<'+k+'>'])
            #get a seg
        prod_res = prod_and_link(segs)
        logging.debug(str(nt_segs))
        nt_prod_res = prod_and_link(nt_segs)
        ttt += prod_res
        nttt += nt_prod_res
    logging.debug(str(ttt))
    dt3[i]=ttt
    dt4[i]=nttt

logging.debug(str(dt3))
dt4 = {}
for i in dt3.keys():
    dt4_val= []
    for j in dt3[i]:
        split_res = re.split('(>\()|(\)<)',j)
        split_res = list(split_res)
        logging.debug("split_res : "+str(split_res))
        #print(split_res)
        #print(type(split_res))
        n=0
        p = ''
        q = ''
        for k in [kk for kk in split_res if all([kk != None, kk!=')<',kk!='>('])]:
            logging.debug("kk in " + str([kk for kk in split_res if all([kk != None, kk!=')<',kk!='>('])]))
            if n == 0:
                p += '<'+k+'>'
                n = 1
            elif n == 1:
                q += '('+k+')'
                n = 0
            logging.debug("p:"+p+',q:'+q)

            
        p = p[1:]
        q = q[:-1]
        dt4_val.append(p+'='+q)
    dt4[i] = dt4_val

logging.debug(str(dt4))
link_res = prod_and_link([['a','b'],['c','d']])
#print( link_res )
#[test2.py:110     - <module>  () ]: {'pat2': ['<suba2.1><subb2.1>=(a1.1)(b1.1)', '<suba2.1><subb2.1>=(a1.1)(b1.2)', '<suba2.1><subb2.1>=(a1.2)(b1.1)', '<suba2.1><subb2.1>=(a1.2)(b1.2)', '<suba2.2><subb2.2>=(a2.1)(b2.1)', '<suba2.2><subb2.2>=(a2.1)(b2.2)', '<suba2.2><subb2.2>=(a2.2)(b2.1)', '<suba2.2><subb2.2>=(a2.2)(b2.2)'], 'pat1': ['<suba1><subb1>=(a1.1)(b1.1)', '<suba1><subb1>=(a1.1)(b1.2)', '<suba1><subb1>=(a1.2)(b1.1)', '<suba1><subb1>=(a1.2)(b1.2)', '<suba2><subb2>=(a2.1)(b2.1)', '<suba2><subb2>=(a2.1)(b2.2)', '<suba2><subb2>=(a2.2)(b2.1)', '<suba2><subb2>=(a2.2)(b2.2)'], 'pat3': ['<suba3.1><subb3.1>=(a1.1)(b1.1)', '<suba3.1><subb3.1>=(a1.1)(b1.2)', '<suba3.1><subb3.1>=(a1.2)(b1.1)', '<suba3.1><subb3.1>=(a1.2)(b1.2)', '<suba3.2><subb3.2>=(a2.1)(b2.1)', '<suba3.2><subb3.2>=(a2.1)(b2.2)', '<suba3.2><subb3.2>=(a2.2)(b2.1)', '<suba3.2><subb3.2>=(a2.2)(b2.2)']}


posted on 2017-04-13 01:51  squirrel2300  阅读(128)  评论(0编辑  收藏  举报