基于rust 编写的高性能全文检索服务
sonic 是基于 Rust 编写的高性能全文检索后端,可以作为 Elasticsearch(ES)的轻量级替代方案。它没有提供 HTTP 接口,而是使用基于 TCP 的自有协议,目前已经有了多种语言的客户端封装库,可以方便地使用
参考使用
- 环境准备
version: "3"
services:
  # Sonic search backend; the Go example connects to it on localhost:1491.
  sonic:
    image: valeriansaliou/sonic:v1.3.0
    ports:
      - "1491:1491"
    volumes:
      # Mounts the local config.cfg as the container's /etc/sonic.cfg.
      - "./config.cfg:/etc/sonic.cfg"
  # MeiliSearch server; the Go example connects to it on http://127.0.0.1:7700.
  meilisearch:
    image: getmeili/meilisearch
    ports:
      - "7700:7700"
- golang 代码
package main
import (
"fmt"
"os"
"github.com/expectedsh/go-sonic/sonic"
"github.com/meilisearch/meilisearch-go"
)
// main runs the sonic demo followed by the MeiliSearch demo. The first error
// returned by either demo is printed to stderr and the process exits with
// status 1.
func main() {
	if err := sonicDemo(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
	if err := meiliDemo(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

// sonicDemo pushes three batches of records into the "movies"/"general"
// bucket of the sonic server on localhost:1491 and prints the result of
// querying that bucket for "测".
//
// Per-record ingest failures are reported on stderr but do not abort the demo;
// connection and query failures are returned to the caller.
func sonicDemo() error {
	ingester, err := sonic.NewIngester("localhost", 1491, "dalong")
	if err != nil {
		return fmt.Errorf("connecting sonic ingester: %w", err)
	}
	// Close the ingest channel on return; a failure to quit is not actionable
	// here, so its error is deliberately dropped.
	defer func() { _ = ingester.Quit() }()

	// The batches share most records and differ only in the record carrying
	// the Chinese text (object id and text).
	batches := [][]sonic.IngestBulkRecord{
		{
			{Object: "id:6ab56b4kk3", Text: "Star wars"},
			{Object: "id:5hg67f8dg5", Text: "Spider man"},
			{Object: "id:1m2n3b4vf6", Text: "Batman"},
			{Object: "id:1111111", Text: "荣锋亮 测试应用 技术测试"},
			{Object: "id:68d96h5h9d0", Text: "This is another movie"},
		},
		{
			{Object: "id:6ab56b4kk3", Text: "Star wars"},
			{Object: "id:5hg67f8dg5", Text: "Spider man"},
			{Object: "id:1m2n3b4vf6", Text: "Batman"},
			{Object: "id:1111112", Text: "111荣锋亮 测试应用 技术测试"},
			{Object: "id:68d96h5h9d0", Text: "This is another movie"},
		},
		{
			{Object: "id:6ab56b4kk3", Text: "Star wars"},
			{Object: "id:5hg67f8dg5", Text: "Spider man"},
			{Object: "id:1m2n3b4vf6", Text: "Batman"},
			{Object: "id:1111113", Text: "111荣锋亮 测试应用 技术测试"},
			{Object: "id:68d96h5h9d0", Text: "This is another movie"},
		},
	}
	for i, batch := range batches {
		// BulkPush reports failures per record; surface them instead of
		// silently discarding the returned slice, but keep going so the
		// records that were accepted can still be searched.
		if errs := ingester.BulkPush("movies", "general", 3, batch); len(errs) > 0 {
			fmt.Fprintf(os.Stderr, "sonic bulk push, batch %d: %v\n", i+1, errs)
		}
	}

	search, err := sonic.NewSearch("localhost", 1491, "dalong")
	if err != nil {
		return fmt.Errorf("connecting sonic search: %w", err)
	}
	defer func() { _ = search.Quit() }()

	results, err := search.Query("movies", "general", "测", 10, 0)
	if err != nil {
		return fmt.Errorf("querying sonic: %w", err)
	}
	fmt.Println(results)
	return nil
}

// meiliDemo makes sure the "books" index exists on the MeiliSearch server at
// http://127.0.0.1:7700, adds or updates a fixed set of documents, and prints
// the update id followed by the hits of a search for "使用".
func meiliDemo() error {
	client := meilisearch.NewClient(meilisearch.Config{
		Host: "http://127.0.0.1:7700",
	})

	// Create the index if it does not already exist. A failed lookup is
	// treated the same as a missing index; index is only inspected when Get
	// succeeded, so a failed lookup can no longer cause a nil dereference.
	index, err := client.Indexes().Get("books")
	if err != nil || index.UID == "" {
		fmt.Println("create index")
		_, err = client.Indexes().Create(meilisearch.CreateIndexRequest{
			UID: "books",
		})
		if err != nil {
			return fmt.Errorf("creating index %q: %w", "books", err)
		}
	} else {
		fmt.Println("index is created")
	}

	documents := []map[string]interface{}{
		{"book_id": 123, "title": "Pride and Prejudice"},
		{"book_id": 456, "title": "Le Petit Prince"},
		{"book_id": 1, "title": "Alice In Wonderland"},
		{"book_id": 1344, "title": "The Hobbit"},
		{"book_id": 1345, "title": "荣锋亮 测试 应用"},
		{"book_id": 1346, "title": "荣锋亮 测试 应用"},
		{"book_id": 1347, "title": "荣锋亮 测试 使用应用"},
		{"book_id": 1348, "title": `摘要:johnfercher/maroto 借鉴了bootstrap 的网格模式,使用了gofpdf 生成pdf,是一个很不错的golang pdf 工具 有一个问题是不支持中文(因为配置写的的原因)看到网上有一个中国人fork添加了AddUTF8Font 支持,这样 中文就可以显示了,以下是一个参考的使 `},
		{"book_id": 4, "title": "Harry Potter and the Half-Blood Prince"},
		{"book_id": 42, "title": "The Hitchhiker's Guide to the Galaxy"},
	}

	updateRes, err := client.Documents("books").AddOrUpdate(documents) // => { "updateId": 0 }
	if err != nil {
		return fmt.Errorf("adding documents: %w", err)
	}
	fmt.Println(updateRes.UpdateID)

	searchRes, err := client.Search("books").Search(meilisearch.SearchRequest{
		Query: "使用",
		Limit: 10,
	})
	if err != nil {
		return fmt.Errorf("searching index %q: %w", "books", err)
	}
	fmt.Println(searchRes.Hits)
	return nil
}
说明
基于 Rust 开发的全文检索引擎还是比较多的,MeiliSearch 就是类似的一个,项目比较活跃,提供的功能也更丰富;上面的代码同时演示了 sonic 和 MeiliSearch 的基本用法
参考资料
https://github.com/valeriansaliou/sonic
https://github.com/expectedsh/go-sonic
https://github.com/tantivy-search/tantivy
https://github.com/meilisearch/MeiliSearch