hdoj 2222 Keywords Search(AC自动机)

题目链接:http://acm.hdu.edu.cn/showproblem.php?pid=2222

思路分析:该问题为多模式匹配问题,使用AC自动机解决;需要注意的问题是如何统计该待查询的字符串包含的关键字:

假设待查找的字符串为str[0..n],则任意子串str[i..j]都可能是某一个关键字;假设当前正在匹配字符str[k],则所有以str[k]结尾的子串str[i..k](i ≤ k)都可能是关键字。

因此,在到达str[k]对应的结点后,使用fail指针进行跳转,并判断途中经过的每个结点是否为某个关键字的最后一个结点,

重复进行该操作,直到回溯到根节点(或遇到已经统计过的结点)为止。

 

代码如下:

#include <cstdio>
#include <cstring>
#include <iostream>
using namespace std;

// Number of outgoing edges per trie node; characters are mapped to an edge
// index by subtracting 'a'.
const int KIND = 26;
// Capacity of the buffer that holds one keyword read from input.
const int LEN_STR = 50 + 10;
// Capacity of the text buffer and of the BFS queue used when building the
// automaton.
const int MAX_N = 1000000 + 10;

struct Node;
// Array-backed FIFO queue of trie nodes used by BuildAcAutomation.
Node *q[MAX_N];
// Scratch buffer for the keyword currently being inserted.
char insert_str[LEN_STR];
// Buffer for the text that is searched for keywords.
char str[MAX_N];

// One state of the Aho-Corasick automaton (a trie node plus a failure link).
struct Node {
    Node *fail;        // failure link; NULL until the automaton is built
    Node *next[KIND];  // child for each letter, NULL when absent
    int count;         // number of keywords ending at this node;
                       // Query overwrites it with -1 once the node is counted

    // Creates a node with no children, no failure link and a zero count.
    Node()
    {
        fail = NULL;
        count = 0;
        // Assign null pointers explicitly: NULL is a pointer constant and is
        // not a valid fill value for memset's int parameter.
        for (int i = 0; i < KIND; ++i)
            next[i] = NULL;
    }
};

void Insert(char *str, Node *root)
{
    Node *p = root;
    int i = 0, index = 0;

    while (str[i]) {
        index = str[i++] - 'a';
        if (p->next[index] == NULL)
            p->next[index] = new Node();
        p = p->next[index];
    }
    p->count++; // 单词的末尾会被标记为1
}

// Computes the failure link of every node in the trie rooted at `root`.
//
// Nodes are visited breadth-first using the global array `q` as a queue, so
// the failure links of a node's ancestors are already set when it is reached.
// The root's failure link is NULL; children of the root fail to the root.
void BuildAcAutomation(Node *root)
{
    int front = 0, back = 0;

    root->fail = NULL;
    q[back++] = root;

    while (front < back) {
        Node *cur = q[front++];

        for (int c = 0; c < KIND; ++c) {
            Node *child = cur->next[c];
            if (child == NULL)
                continue;

            // Default target when no node on the parent's failure chain has
            // an edge labelled c (and for direct children of the root).
            Node *link = root;
            if (cur != root) {
                for (Node *f = cur->fail; f != NULL; f = f->fail) {
                    if (f->next[c] != NULL) {
                        link = f->next[c];
                        break;
                    }
                }
            }

            child->fail = link;
            q[back++] = child;
        }
    }
}

int Query(char *str, Node *root)
{
    int i = 0, cnt = 0, index = 0;
    Node *p = root;

    while (str[i]) {
        index = str[i] - 'a';
        while (!p->next[index] && p != root)
            p = p->fail;
        p = p->next[index];
        p = (p == NULL) ? root : p;

        Node *temp = p;
        while (temp != root && temp->count != -1) {
            cnt += temp->count;
            temp->count = -1;
            temp = temp->fail;
        }
        ++i;
    }
    return cnt;
}

int main()
{
    int case_times = 0;
    int ans = 0, n = 0;

    scanf("%d", &case_times);
    while (case_times--) {
        Node *root = new Node();
        scanf("%d", &n);
        while (n--) {
            scanf("%s", insert_str);
            Insert(insert_str, root);
        }
        BuildAcAutomation(root);

        scanf("%s", &str);
        ans = Query(str, root);
        printf("%d\n", ans);
    }
    return 0;
}
posted @ 2015-07-17 23:17  Leptus  阅读(261)  评论(0)  编辑  收藏  举报