!19 魔改版合并

Merge pull request !19 from 我是D/dev
This commit is contained in:
小东 2019-12-24 15:19:35 +08:00 committed by Gitee
commit cdac7d2e73
10 changed files with 69 additions and 30 deletions

View File

@ -5,12 +5,9 @@ import java.util.HashMap;
import java.util.Map;
import org.apache.commons.lang3.time.DateFormatUtils;
import org.quartz.JobDataMap;
import org.quartz.JobExecutionContext;
import org.quartz.JobExecutionException;
import org.quartz.*;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.slf4j.MDC;
import org.spiderflow.context.SpiderContext;
import org.spiderflow.context.SpiderContextHolder;
import org.spiderflow.core.Spider;
@ -65,14 +62,15 @@ public class SpiderJob extends QuartzJobBean {
}
public void run(SpiderFlow spiderFlow, Date nextExecuteTime) {
SpiderJobContext context = null;
Date now = new Date();
SpiderJobContext context = SpiderJobContext.create(this.spiderLogPath, spiderFlow.getId() + ".log");
SpiderContextHolder.set(context);
Task task = new Task();
task.setFlowId(spiderFlow.getId());
task.setBeginTime(new Date());
try {
taskService.save(task);
context = SpiderJobContext.create(this.spiderLogPath, spiderFlow.getId() + task.getId() + ".log");
SpiderContextHolder.set(context);
contextMap.put(task.getId(), context);
logger.info("开始执行任务{}", spiderFlow.getName());
spider.run(spiderFlow, context);
@ -80,7 +78,9 @@ public class SpiderJob extends QuartzJobBean {
} catch (Exception e) {
logger.error("执行任务{}出错", spiderFlow.getName(), e);
} finally {
context.close();
if (context != null) {
context.close();
}
task.setEndTime(new Date());
taskService.saveOrUpdate(task);
contextMap.remove(task.getId());

View File

@ -15,6 +15,8 @@ import org.spiderflow.core.model.SpiderFlow;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.stereotype.Component;
import java.util.Date;
/**
* 爬虫定时执行管理
* @author Administrator
@ -51,7 +53,7 @@ public class SpiderJobManager {
* @param spiderFlow 爬虫流程图
* @return boolean true/false
*/
public boolean addJob(SpiderFlow spiderFlow){
public Date addJob(SpiderFlow spiderFlow){
try {
JobDetail job = JobBuilder.newJob(SpiderJob.class).withIdentity(getJobKey(spiderFlow.getId())).build();
job.getJobDataMap().put(JOB_PARAM_NAME, spiderFlow);
@ -60,12 +62,10 @@ public class SpiderJobManager {
CronTrigger trigger = TriggerBuilder.newTrigger().withIdentity(getTriggerKey(spiderFlow.getId())).withSchedule(cronScheduleBuilder).build();
scheduler.scheduleJob(job,trigger);
return true;
return scheduler.scheduleJob(job,trigger);
} catch (SchedulerException e) {
logger.error("创建定时任务出错",e);
return false;
return null;
}
}

View File

@ -54,10 +54,16 @@ public interface SpiderFlowMapper extends BaseMapper<SpiderFlow>{
@Update("update sp_flow set enabled = #{enabled} where id = #{id}")
int resetSpiderStatus(@Param("id") String id, @Param("enabled") String enabled);
@Update("update sp_flow set next_execute_time = null where id = #{id}")
int resetNextExecuteTime(@Param("id") String id);
@Select("select id,name from sp_flow")
List<SpiderFlow> selectFlows();
@Select("select id,name from sp_flow where id != #{id}")
List<SpiderFlow> selectOtherFlows(@Param("id") String id);
@Select("select max(a.id) from `sp_task` a left join sp_flow b on a.flow_id = b.id where b.id = #{id}")
int getFlowMaxTaskId(@Param("id")String id);
}

View File

@ -43,10 +43,14 @@ public class SpiderFlowService extends ServiceImpl<SpiderFlowMapper, SpiderFlow>
@PostConstruct
private void initJobs(){
List<SpiderFlow> spiderFlows = sfMapper.selectList(new QueryWrapper<SpiderFlow>().eq("enabled", "1"));
if(spiderFlows != null){
if(spiderFlows != null && !spiderFlows.isEmpty()){
for (SpiderFlow sf : spiderFlows) {
if(StringUtils.isNotEmpty(sf.getCron())){
spiderJobManager.addJob(sf);
Date nextExecuteTimt = spiderJobManager.addJob(sf);
if (nextExecuteTimt != null) {
sf.setNextExecuteTime(nextExecuteTimt);
sfMapper.updateById(sf);
}
}
}
}
@ -110,14 +114,19 @@ public class SpiderFlowService extends ServiceImpl<SpiderFlowMapper, SpiderFlow>
public void stop(String id){
sfMapper.resetSpiderStatus(id,"0");
sfMapper.resetNextExecuteTime(id);
spiderJobManager.remove(id);
}
public void start(String id){
spiderJobManager.remove(id);
SpiderFlow spiderFlow = getById(id);
spiderJobManager.addJob(spiderFlow);
sfMapper.resetSpiderStatus(id,"1");
Date nextExecuteTime = spiderJobManager.addJob(spiderFlow);
if (nextExecuteTime != null) {
spiderFlow.setNextExecuteTime(nextExecuteTime);
sfMapper.updateById(spiderFlow);
sfMapper.resetSpiderStatus(id, "1");
}
}
public void run(String id){
@ -164,4 +173,8 @@ public class SpiderFlowService extends ServiceImpl<SpiderFlowMapper, SpiderFlow>
}
return list;
}
public Integer getFlowMaxTaskId(String flowId){
return sfMapper.getFlowMaxTaskId(flowId);
}
}

View File

@ -156,8 +156,12 @@ public class SpiderFlowController {
}
@RequestMapping("/log")
public JsonBean<List<Line>> log(String id, String keywords, Long index, Integer count, Boolean reversed,Boolean matchcase,Boolean regx){
try (RandomAccessFileReader reader = new RandomAccessFileReader(new RandomAccessFile(new File(spiderLogPath,id + ".log"),"r"), index == null ? -1 : index, reversed == null || reversed)){
public JsonBean<List<Line>> log(String id, String taskId, String keywords, Long index, Integer count, Boolean reversed, Boolean matchcase, Boolean regx) {
if (StringUtils.isBlank(taskId)) {
Integer maxId = spiderFlowService.getFlowMaxTaskId(id);
taskId = maxId == null ? "" : maxId.toString();
}
try (RandomAccessFileReader reader = new RandomAccessFileReader(new RandomAccessFile(new File(spiderLogPath,id + taskId +".log"),"r"), index == null ? -1 : index, reversed == null || reversed)){
return new JsonBean<>(reader.readLine(count == null ? 10 : count,keywords,matchcase != null && matchcase,regx != null && regx));
} catch(FileNotFoundException e){
return new JsonBean<>(0,"日志文件不存在");

View File

@ -495,35 +495,43 @@ $(function(){
},{
name : 'request',
image : '',
title : '开始抓取'
title : '开始抓取',
desc : '抓取静态HTML页面或者API接口抓取结果存为resp变量中。<br/>支持方法参考命令提示。'
},{
name : 'variable',
image : '',
title : '定义变量'
title : '定义变量',
desc : '定义流程变量。<br/>定义变量有先后顺序,先定义变量后续可以使用,拖动可以交换变量顺序。'
},{
name : 'loop',
image : '',
title : '循环'
title : '循环',
desc : ''
},{
name : 'loopJoin',
image : '',
title : '循环结束'
title : '循环结束',
desc : ''
},{
name : 'output',
image : '',
title : '输出'
title : '输出',
desc : '输出流程中的变量结果(仅测试下有用)'
},{
name : 'executeSql',
image : '',
title : '执行SQL'
title : '执行SQL',
desc : '执行sql需配置数据源sql执行结果存于变量rs中。<br/>语句类型为select返回:List&lt;Map&lt;String,Object&gt;&gt;<br/>语句类型为selectOne返回:Map&lt;String,Object&gt;<br/>语句类型为selectInt返回:Integer<br/>语句类型为insert、update、delete返回:int批量操作返回int数组<br/>sql中变量必须用 # # 包裹,如:#${title}#'
},{
name : 'function',
image : '',
title : '执行函数'
title : '执行函数',
desc : '单独执行函数方法,结果不保存为变量'
},{
name : 'process',
image : '',
title : '子流程'
title : '子流程',
desc : '执行其他spiderFlow流程父子流程变量共享'
}];
var addShape = function(shape){
var image = new Image();
@ -532,7 +540,11 @@ $(function(){
image.id = shape.name;
image.onclick = function (ev) {
if(shape.desc){
layer.tips("(" + shape.name + ")" + shape.title + "<hr/>" + shape.desc, '#' + shape.name);
layer.tips("(" + shape.name + ")" + shape.title + "<hr/>" + shape.desc, '#' + shape.name,{
tips: [1, '#3595CC'],
area: ['auto', 'auto'],
time: 4000
});
}
}
if(!shape.hidden){

View File

@ -5,6 +5,7 @@ function LogViewer(options){
this.onSearchFinish = options.onSearchFinish || function(){};
this.bufferSize = this.maxLines * 10;
this.logId = options.logId;
this.taskId = options.taskId;
this.url = options.url;
this.buffer = [];
this.displayIndex = -1;
@ -148,6 +149,7 @@ LogViewer.prototype.loadLines = function(count,callback,async){
reversed : this.reversed,
count : this.bufferSize,
id : this.logId,
taskId: this.taskId,
index : _this.index,
keywords : this.keywords,
matchcase : this.matchcase,

View File

@ -170,10 +170,12 @@
<script type="text/javascript">
$(function(){
var logId = getQueryString('id');
var taskId = getQueryString('taskId');
var viewer = new LogViewer({
url: 'spider/log',
maxLines : parseInt(($('.log-container').height() - 8) / 14),
logId : logId,
taskId: taskId,
element : $('.log-container'),
onSearchFinish : function(hasData){
if(hasData){

View File

@ -187,7 +187,7 @@
</script>
<script type="text/html" id="buttons">
<a class="layui-btn layui-btn-sm btn-run" data-id="{{d.id}}">手动运行</a>
<a class="layui-btn layui-btn-sm btn-log" data-name="{{d.name}}" data-id="{{d.id}}">查看日志</a>
<a class="layui-btn layui-btn-sm btn-log" data-name="{{d.name}}" data-id="{{d.id}}">最新日志</a>
<a class="layui-btn layui-btn-sm btn-remove" data-id="{{d.id}}">删除</a>
</script>
</body>

View File

@ -90,14 +90,14 @@
layui.layer.close(index);
})
}).on('click','.btn-log',function(){
parent.openTab(decodeURIComponent(decodeURIComponent(getQueryString('name'))) + '-日志',$(this).data('id') + '-log','log.html?id=' + $(this).data('id'));
parent.openTab(decodeURIComponent(decodeURIComponent(getQueryString('name'))) + '-日志',$(this).data('id') + '-log','log.html?id=' + $(this).data('id') + "&taskId=" + $(this).data("task"));
})
</script>
<script type="text/html" id="buttons">
{{# if(!d.endTime){ }}
<a class="layui-btn layui-btn-sm btn-stop" data-id="{{d.id}}">停止</a>
{{# } }}
<a class="layui-btn layui-btn-sm btn-log" data-id="{{d.flowId}}">查看日志</a>
<a class="layui-btn layui-btn-sm btn-log" data-id="{{d.flowId}}" data-task="{{d.id}}">查看日志</a>
<a class="layui-btn layui-btn-sm btn-remove" data-id="{{d.id}}">删除记录</a>
</script>
</body>