-- ====================================================
-- 定时任务元数据初始化脚本
-- ====================================================

-- 插入人民日报新闻爬取任务的元数据

-- 1. People's Daily: keyword-search crawl (task metadata row, id '1').
-- Takes two parameters via param_schema: "query" (required string) and
-- "total" (required integer, default 10).
-- NOTE(review): meta_id is spelled 'rmbr_...' while script_path uses 'rmrb';
-- left unchanged because other rows/code may reference this key — confirm.
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '1',
    'rmbr_keyword_search',
    '关键字搜索爬取',
    '根据关键字搜索人民日报新闻内容',
    '人民日报新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/rmrb/RmrbSearch.py',
    -- param_schema: JSON array, one object per task parameter
    '[
    {
        "name": "query",
        "description": "搜索关键字",
        "type": "Input",
        "valueType": "String",
        "value": "",
        "required": true
    },
    {
        "name": "total",
        "description": "总新闻数量",
        "type": "InputNumber",
        "valueType": "Integer",
        "value": 10,
        "required": true
    }
]',
    1,          -- auto_publish
    1,          -- sort_order
    'system',
    NOW()
);

-- 2. People's Daily: hot-ranking crawl (task metadata row, id '2').
-- param_schema is an empty JSON array: the task declares no parameters.
-- NOTE(review): meta_id is spelled 'rmbr_...' while script_path uses 'rmrb';
-- left unchanged because other rows/code may reference this key — confirm.
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '2',
    'rmbr_hotpoint',
    '排行榜爬取',
    '爬取人民日报热门排行榜新闻',
    '人民日报新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/rmrb/RmrbHotPoint.py',
    '[]',       -- param_schema: no parameters
    1,          -- auto_publish
    2,          -- sort_order
    'system',
    NOW()
);

-- 3. People's Daily: past-headlines crawl (task metadata row, id '3').
-- Takes two optional parameters via param_schema: "dateRange" (string, with
-- startKey/endKey naming the two range fields) and "yesterday" (boolean,
-- default true).
-- NOTE(review): meta_id is spelled 'rmbr_...' while script_path uses 'rmrb';
-- left unchanged because other rows/code may reference this key — confirm.
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '3',
    'rmbr_trending',
    '往日精彩头条爬取',
    '爬取人民日报往日精彩头条新闻',
    '人民日报新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/rmrb/RmrbTrending.py',
    -- param_schema: JSON array, one object per task parameter
    '[
    {
        "name": "dateRange",
        "description": "日期范围",
        "type": "DateRangePicker",
        "valueType": "String",
        "value": "",
        "required": false,
        "startKey": "startDate",
        "endKey": "endDate"
    },
    {
        "name": "yesterday",
        "description": "是否是昨天",
        "type": "Switch",
        "valueType": "Boolean",
        "value": true,
        "required": false
    }
]',
    1,          -- auto_publish
    3,          -- sort_order
    'system',
    NOW()
);

-- 4. Xinhua Net: keyword-search crawl (task metadata row, id '4').
-- Takes two parameters via param_schema: "query" (required string) and
-- "total" (required integer, default 10).
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '4',
    'xhw_keyword_search',
    '关键字搜索爬取',
    '根据关键字搜索新华网新闻内容',
    '新华网新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/xhw/XhwSearch.py',
    -- param_schema: JSON array, one object per task parameter
    '[
    {
        "name": "query",
        "description": "搜索关键字",
        "type": "Input",
        "valueType": "String",
        "value": "",
        "required": true
    },
    {
        "name": "total",
        "description": "抓取数量",
        "type": "InputNumber",
        "valueType": "Integer",
        "value": 10,
        "required": true
    }
]',
    1,          -- auto_publish
    4,          -- sort_order
    'system',
    NOW()
);

-- 5. Xinhua Net: hot-news crawl (task metadata row, id '5').
-- param_schema is an empty JSON array: the task declares no parameters.
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '5',
    'xhw_hot_point',
    '热点新闻爬取',
    '爬取新华网热点新闻',
    '新华网新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/xhw/XhwHotPoint.py',
    '[]',       -- param_schema: no parameters
    1,          -- auto_publish
    5,          -- sort_order
    'system',
    NOW()
);

-- 6. Xinhua Net: recommended-news crawl (task metadata row, id '6').
-- param_schema is an empty JSON array: the task declares no parameters.
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '6',
    'xhw_commend',
    '推荐新闻爬取',
    '爬取新华网推荐新闻',
    '新华网新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/xhw/XhwCommend.py',
    '[]',       -- param_schema: no parameters
    1,          -- auto_publish
    6,          -- sort_order
    'system',
    NOW()
);

-- 7. Xuexi Qiangguo: keyword-search crawl (task metadata row, id '7').
-- Takes two parameters via param_schema: "query" (required string) and
-- "total" (required integer, default 10).
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '7',
    'xxqg_keyword_search',
    '关键字搜索爬取',
    '根据关键字搜索学习强国新闻内容',
    '学习强国新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/xxqg/XxqgSearch.py',
    -- param_schema: JSON array, one object per task parameter
    '[
    {
        "name": "query",
        "description": "搜索关键字",
        "type": "Input",
        "valueType": "String",
        "value": "",
        "required": true
    },
    {
        "name": "total",
        "description": "抓取数量",
        "type": "InputNumber",
        "valueType": "Integer",
        "value": 10,
        "required": true
    }
]',
    1,          -- auto_publish
    7,          -- sort_order
    'system',
    NOW()
);

-- 8. Xuexi Qiangguo: column (section) news crawl (task metadata row, id '8').
-- Takes three parameters via param_schema: "column" (required select with four
-- options, default "important"), "yesterday" (optional boolean, default true)
-- and "dateRange" (optional string with startKey/endKey).
-- NOTE(review): startKey/endKey here are "start"/"end", whereas the
-- rmbr_trending row uses "startDate"/"endDate" — confirm each matches what
-- its script expects.
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '8',
    'xxqg_column_crawl',
    '栏目新闻爬取',
    '爬取学习强国指定栏目的新闻内容',
    '学习强国新闻爬取',
    'newsCrewerTask',
    'execute',
    'crawler/xxqg/XxqgColumn.py',
    -- param_schema: JSON array, one object per task parameter
    '[
    {
        "name": "column",
        "description": "栏目名称",
        "type": "Select",
        "valueType": "String",
        "value": "important",
        "required": true,
        "options": [
            {"label": "重要新闻", "value": "important"},
            {"label": "学习时评", "value": "xuexishiping"},
            {"label": "综合新闻", "value": "zonghexinwen"},
            {"label": "中宣部发布", "value": "zhongxuanbu"}
        ]
    },
    {
        "name": "yesterday",
        "description": "是否抓取昨天的数据",
        "type": "Switch",
        "valueType": "Boolean",
        "value": true,
        "required": false
    },
    {
        "name": "dateRange",
        "description": "日期范围",
        "type": "DateRangePicker",
        "valueType": "String",
        "value": "",
        "required": false,
        "startKey": "start",
        "endKey": "end"
    }
]',
    1,          -- auto_publish
    8,          -- sort_order
    'system',
    NOW()
);

-- 9. Top-recommended-resources task (task metadata row, id '9').
-- Unlike the crawler rows above, this one uses bean 'topRecommendTask', has an
-- empty script_path and sets auto_publish to 0.
-- Takes two required integer parameters via param_schema, both defaulting
-- to 10: "viewNum" and "timeNum".
INSERT INTO `tb_crontab_task_meta` (
    `id`, `meta_id`, `name`, `description`, `category`,
    `bean_name`, `method_name`, `script_path`, `param_schema`, `auto_publish`,
    `sort_order`, `creator`, `create_time`
) VALUES (
    '9',
    'top_recommend_task',
    '热门资源推荐',
    '每天凌晨1点自动更新热门推荐资源(浏览量TOP10+最新发布TOP10)',
    '系统内部任务',
    'topRecommendTask',
    'execute',
    '',         -- script_path: empty for this row
    -- param_schema: JSON array, one object per task parameter
    '[
    {
        "name": "viewNum",
        "description": "按浏览量取多少条",
        "type": "InputNumber",
        "valueType": "Integer",
        "value": 10,
        "required": true
    },
    {
        "name": "timeNum",
        "description": "按时间取多少条",
        "type": "InputNumber",
        "valueType": "Integer",
        "value": 10,
        "required": true
    }
]',
    0,          -- auto_publish
    9,          -- sort_order
    'system',
    NOW()
);

-- Create the task instance for the top-recommended-resources job.
-- It links to the metadata row through meta_id 'top_recommend_task' and passes
-- method_params as a JSON object with the same keys (viewNum, timeNum) that the
-- metadata row's param_schema declares.
INSERT INTO `tb_crontab_task` (
    `id`, `task_id`, `meta_id`, `task_name`, `task_group`, `description`, `bean_name`,
    `cron_expression`, `method_name`, `method_params`, `status`, `creator`, `create_time`
) VALUES (
    '9',
    'task_top_recommend_daily',
    'top_recommend_task',
    '每日热门资源推荐更新',
    '系统内部任务',
    '每天凌晨1点自动更新热门推荐资源列表',
    'topRecommendTask',
    -- Assuming a seconds-first six-field cron format, this is 01:00:00 every
    -- day, which matches the "1 AM daily" wording of the description.
    '0 0 1 * * ?',
    'execute',
    '{"viewNum":10,"timeNum":10}',
    1,          -- status (NOTE(review): presumably 1 = enabled — confirm)
    'system',
    NOW()
);

-- Grant read, write and execute (1, 1, 1) on resource
-- 'task_top_recommend_daily' to dept 'root_department' with role 'superadmin'.
-- NOTE(review): resource_type 7 is presumably the code for crontab tasks —
-- confirm against the resource-type definition.
INSERT INTO `tb_resource_permission` (
    `id`, `resource_type`, `resource_id`, `dept_id`,
    `role_id`, `can_read`, `can_write`, `can_execute`, `creator`, `updater`,
    `create_time`, `update_time`, `delete_time`, `deleted`
) VALUES (
    '671f0c40642e6a69c2be9b6d7a4e986e', 7, 'task_top_recommend_daily', 'root_department',
    'superadmin', 1, 1, 1, '1', NULL,
    '2025-11-25 13:57:16', '2025-11-25 13:57:16', NULL, 0
);

-- Permission row on 'task_top_recommend_daily' with dept_id and role_id both
-- NULL: read is allowed (1), write and execute are not (0, 0).
-- NOTE(review): a NULL dept/role presumably means "applies to everyone" —
-- confirm how the permission check treats NULL.
INSERT INTO `tb_resource_permission` (
    `id`, `resource_type`, `resource_id`, `dept_id`,
    `role_id`, `can_read`, `can_write`, `can_execute`, `creator`, `updater`,
    `create_time`, `update_time`, `delete_time`, `deleted`
) VALUES (
    'c365853b6a0e38a9c504962de4403e57', 7, 'task_top_recommend_daily', NULL,
    NULL, 1, 0, 0, '1', NULL,
    '2025-11-25 13:57:16', '2025-11-25 13:57:16', NULL, 0
);