|
@@ -197,8 +197,7 @@ func (t *Task) StartJob() {
|
|
|
tmp["iscompete"] = sp.IsCompete //2021-11-01以后新增的爬虫不在展示原文链接(保存服务判断)
|
|
|
//spider.Store(sp.StoreMode, sp.StoreToMsgEvent, sp.Collection, sp.CoverAttr, result, true)
|
|
|
}
|
|
|
- tmp["state"] = 1
|
|
|
- result := t.CheckField(tmp) //校验字段
|
|
|
+ result := t.CheckField(tmp, sp) //校验字段
|
|
|
//下载成功
|
|
|
update = append(update, query)
|
|
|
update = append(update, map[string]interface{}{"$set": result})
|
|
@@ -221,7 +220,7 @@ func (t *Task) StartJob() {
|
|
|
}
|
|
|
|
|
|
//字段校验
|
|
|
-func (t *Task) CheckField(tmp map[string]interface{}) map[string]interface{} {
|
|
|
+func (t *Task) CheckField(tmp map[string]interface{}, sp *spider.Spider) map[string]interface{} {
|
|
|
defer qu.Catch()
|
|
|
result := map[string]interface{}{}
|
|
|
if len(t.CheckFields) > 0 {
|
|
@@ -251,17 +250,20 @@ func (t *Task) CheckField(tmp map[string]interface{}) map[string]interface{} {
|
|
|
}
|
|
|
}
|
|
|
if !fieldOk { //字段值下载出错,该条数据下载失败
|
|
|
- result["state"] = -1
|
|
|
- return result
|
|
|
+ return map[string]interface{}{"state": -1}
|
|
|
} else if fieldOk && t.IsBidding { //bidding数据指定更新某字段
|
|
|
result[field] = tmp[field]
|
|
|
}
|
|
|
}
|
|
|
- if t.IsBidding {
|
|
|
- result["state"] = 1
|
|
|
- return result
|
|
|
- }
|
|
|
}
|
|
|
+ if t.IsBidding { //bidding数据
|
|
|
+ result["state"] = 1
|
|
|
+ return result
|
|
|
+ }
|
|
|
+ //非bidding信息
|
|
|
+ tmp["state"] = 1
|
|
|
+ tmp["T"] = sp.Collection
|
|
|
+ tmp["infoformat"] = sp.Infoformat
|
|
|
return tmp
|
|
|
}
|
|
|
|
|
@@ -303,7 +305,7 @@ func (t *Task) SendNotBiddingData() {
|
|
|
id := tmp["_id"]
|
|
|
delete(tmp, "_id")
|
|
|
tmp["dataging"] = 0 //补充dataging字段
|
|
|
- tmp["T"] = "bidding"
|
|
|
+ //tmp["T"] = "bidding"
|
|
|
ok, id, coll := SaveObj(4002, "title", tmp)
|
|
|
update := []map[string]interface{}{
|
|
|
map[string]interface{}{"_id": id},
|