【2024.01.19】用 Huginn 爬取「什么值得买」排行榜
部署只需下面这一条 Docker 命令(服务监听 3000 端口),主要是搭配 RSS 阅读器使用:
docker run -d -p 3000:3000 ghcr.io/yhdsl/huginn:latest
这次用 Huginn 主要是为了自定义爬取内容,
筛选掉一些我用不上的商品(比如奶粉之类)。下面是导出的 Huginn 场景(Scenario)JSON:
{
"schema_version": 1,
"name": "什么值得买榜单",
"description": "抓取什么值得买榜单并输出为 RSS;要屏蔽的关键词请在「什么值得买-筛选数据(关键词)」的正则规则里自行修改",
"source_url": false,
"guid": "3038bbb808e3628363d6d97ea85b50d5",
"tag_fg_color": "#ffffff",
"tag_bg_color": "#f33535",
"icon": "gear",
"exported_at": "2024-01-23T00:23:15Z",
"agents": [
{
"type": "Agents::TriggerAgent",
"name": "什么值得买-筛选数据(关键词)",
"disabled": false,
"guid": "0635876a2d42933095f5463f1b0d95bc",
"options": {
"expected_receive_period_in_days": "2",
"keep_event": "true",
"rules": [
{
"type": "!regex",
"value": "酒|咖啡|手机|收藏|窖|过期|水饺|抽纸|老抽|生抽|牛|鸭|话费|奶粉|生蚝|羊|海鲜|螺[狮蛳]粉|镜片|火锅|移动|电信|联通|券|油|大米|显卡|红包|鸡蛋|童装|洁厕|罐头|保温杯|饭|华为|猫粮|苹果|手表|轮胎|酱|料理|糕|人参|宝宝|橙|味精",
"path": "title"
}
]
},
"keep_events_for": 259200,
"propagate_immediately": true
},
{
"type": "Agents::TriggerAgent",
"name": "什么值得买-筛选数据(评论数、值数)",
"disabled": false,
"guid": "c2d97ac7c7a30c36dcd6f59752e5b735",
"options": {
"expected_receive_period_in_days": "2",
"keep_event": "true",
"rules": [
{
"type": "field>=value",
"value": "5",
"path": "$.worth"
},
{
"type": "field>=value",
"value": "5",
"path": "$.comment"
}
]
},
"keep_events_for": 0,
"propagate_immediately": false
},
{
"type": "Agents::WebsiteAgent",
"name": "什么值得买-获取数据",
"disabled": false,
"guid": "c693a156bc391111f3bd6ff08fb1ced2",
"options": {
"expected_update_period_in_days": "2",
"url": "{{ url }}",
"type": "html",
"mode": "all",
"extract": {
"title": {
"xpath": "//*[@id=\"feed-main\"]/div[2]/div/div[1]/h1",
"value": "normalize-space(.) "
},
"content": {
"xpath": "//*[@id=\"feed-main\"]/div[3]/article/div[1]",
"value": "normalize-space(.) "
},
"photo": {
"xpath": "//*[@id=\"feed-main\"]/div[2]/a/img",
"value": "@src"
},
"worth": {
"xpath": "//*[@id=\"rating_worthy_num\"]",
"value": "normalize-space(.) "
},
"worth_percent": {
"xpath": "//*[@id=\"rating_all_num\"]",
"value": "normalize-space(.) "
},
"comment": {
"xpath": "//*[@id=\"content\"]/div/div[1]/div[3]/a/span",
"value": "normalize-space(.) "
},
"not_worth": {
"xpath": "//*[@id=\"rating_unworthy_num\"]",
"value": "normalize-space(.) "
},
"link_to_buy": {
"xpath": "//*[@id=\"feed-main\"]/div[2]/a",
"value": "@href"
},
"price": {
"xpath": "//*[@id=\"feed-main\"]/div[2]/div/div[1]/div/span/div/span[1]",
"value": "normalize-space(.) "
}
}
},
"schedule": "every_12h",
"keep_events_for": 259200,
"propagate_immediately": true
},
{
"type": "Agents::WebsiteAgent",
"name": "什么值得买-源数据",
"disabled": false,
"guid": "c7c2f2cd1fff9b75c390fb6d1a3f0d54",
"options": {
"expected_update_period_in_days": "2",
"url": "https://faxian.smzdm.com/h2s0t0f0c0p1/",
"type": "html",
"mode": "on_change",
"extract": {
"url": {
"xpath": "//*[@id=\"feed-main-list\"]/li/div/div[1]/a[1]",
"value": "@href"
},
"title": {
"xpath": "//*[@id=\"feed-main-list\"]/li/div/h5/a",
"value": "normalize-space(.)"
}
}
},
"schedule": "every_10m",
"keep_events_for": 259200,
"propagate_immediately": true
},
{
"type": "Agents::DataOutputAgent",
"name": "什么值得买-RSS",
"disabled": false,
"guid": "cc405cd989e17453bb9f5aacb0ab7ab3",
"options": {
"secrets": [
"smzdm"
],
"expected_receive_period_in_days": 2,
"template": {
"title": "什么值得买-热门榜",
"description": "什么值得买热门",
"item": {
"title": "{{title}}",
"description": "<p>{{price}} 值{{worth}} 不值{{not_worth}} {{worth_percent}}</p><p>{{content}}</p><div class=\"img_description\"></div><p></p><img src=\"{{photo}}\" referrerpolicy=\"no-referrer\"><div class=\"img_description\"></div><p><a href=\"{{link_to_buy}}\">购买链接</a></p>",
"link": "{{link_to_buy}}"
},
"link": "{{link_to_buy}}",
"icon": "https://post.smzdm.com/favicon.ico?v=2023091316",
"ttl": "120"
},
"ns_media": "true"
},
"propagate_immediately": true
}
],
"links": [
{
"source": 0,
"receiver": 2
},
{
"source": 1,
"receiver": 4
},
{
"source": 2,
"receiver": 1
},
{
"source": 3,
"receiver": 0
}
],
"control_links": [
]
}