|
@@ -0,0 +1,124 @@ |
|
|
|
|
|
package svc |
|
|
|
|
|
|
|
|
|
|
|
import ( |
|
|
|
|
|
"applet/app/es/md" |
|
|
|
|
|
md2 "applet/app/task/md" |
|
|
|
|
|
"applet/app/utils" |
|
|
|
|
|
"code.fnuoos.com/go_rely_warehouse/zyos_go_es.git/es" |
|
|
|
|
|
"code.fnuoos.com/go_rely_warehouse/zyos_go_third_party_api.git/gzmiyuan" |
|
|
|
|
|
"fmt" |
|
|
|
|
|
"github.com/syyongx/php2go" |
|
|
|
|
|
"strings" |
|
|
|
|
|
"time" |
|
|
|
|
|
) |
|
|
|
|
|
|
|
|
|
|
|
func DataCollectCronMiyuanRealNews(types int) { |
|
|
|
|
|
key := md.ZhiosRealNewsData |
|
|
|
|
|
//es.CreateIndexIfNotExists(key, md.ZhiosRealNewsDataField) |
|
|
|
|
|
ids := []string{"MC", "TM", "JD", "PDD", "CD", "ZD", "MS", "QYH"} |
|
|
|
|
|
ids = []string{"JD"} |
|
|
|
|
|
num := 10 |
|
|
|
|
|
if types == 0 { |
|
|
|
|
|
ids = []string{""} |
|
|
|
|
|
num = 3 |
|
|
|
|
|
} |
|
|
|
|
|
size := 10 |
|
|
|
|
|
now := time.Now() |
|
|
|
|
|
fmt.Println("============", time.Since(now)) |
|
|
|
|
|
for _, v := range ids { |
|
|
|
|
|
for i := 1; i <= num; i++ { |
|
|
|
|
|
newsData, err := gzmiyuan.GetGzmiRealData(utils.IntToStr(size), utils.IntToStr(i), v) |
|
|
|
|
|
if newsData == nil || err != nil { |
|
|
|
|
|
continue |
|
|
|
|
|
} |
|
|
|
|
|
platformMap := map[string]string{"MC": "10001", "TM": "10003", "JD": "10004", "PDD": "10005", "CD": "10006", "ZD": "10002", "MS": "10007", "QYH": "10000"} |
|
|
|
|
|
for _, item := range newsData { |
|
|
|
|
|
var tmp = md2.RealNewsData{ |
|
|
|
|
|
Id: item.Id, |
|
|
|
|
|
CateId: utils.SerializeStr([]string{platformMap[item.OpenType]}), |
|
|
|
|
|
Images: utils.SerializeStr(strings.Split(item.XianbaoImageUrl, ",")), |
|
|
|
|
|
Platform: "my", |
|
|
|
|
|
StartTime: utils.TimeStdParseUnix(item.CreateTime), |
|
|
|
|
|
OldContent: item.XianbaoContent, |
|
|
|
|
|
} |
|
|
|
|
|
tmp.Key = php2go.Md5("hdk_real_news_my_" + utils.IntToStr(item.Id)) |
|
|
|
|
|
var uniqueId = tmp.Key |
|
|
|
|
|
doc, _ := es.FirstDoc(key, uniqueId) |
|
|
|
|
|
if doc == nil { |
|
|
|
|
|
goodsList := ToContent(item.XianbaoContent) |
|
|
|
|
|
|
|
|
|
|
|
tmp.Content = utils.SerializeStr(goodsList) |
|
|
|
|
|
fmt.Println(tmp) |
|
|
|
|
|
createDocRet, err := es.CreateDoc(key, uniqueId, tmp) |
|
|
|
|
|
if err != nil { |
|
|
|
|
|
return |
|
|
|
|
|
} |
|
|
|
|
|
fmt.Printf("CreateDoc ==> %+v \n\n", createDocRet) |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
} |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
} |
|
|
|
|
|
fmt.Println("==========================end", time.Since(now)) |
|
|
|
|
|
} |
|
|
|
|
|
func To(str, str1, str2 string) string { |
|
|
|
|
|
tmp := strings.Split(str, str1) |
|
|
|
|
|
if len(tmp) > 0 { |
|
|
|
|
|
tmp1 := strings.Split(tmp[1], str2) |
|
|
|
|
|
if len(tmp1) > 0 { |
|
|
|
|
|
return tmp1[0] |
|
|
|
|
|
} |
|
|
|
|
|
} |
|
|
|
|
|
return "" |
|
|
|
|
|
} |
|
|
|
|
|
func ToContent(str string) []map[string]string { |
|
|
|
|
|
platformTypeList := map[string]string{ |
|
|
|
|
|
"JD": "jd", |
|
|
|
|
|
"PDD": "pdd", |
|
|
|
|
|
"TB": "taobao", |
|
|
|
|
|
"TM": "tmall", |
|
|
|
|
|
} |
|
|
|
|
|
str = strings.ReplaceAll(str, "<br>", "\n") |
|
|
|
|
|
strs := strings.Split(str, "<div ") |
|
|
|
|
|
fmt.Println(strs) |
|
|
|
|
|
var goodsList = make([]map[string]string, 0) |
|
|
|
|
|
for _, v := range strs { |
|
|
|
|
|
goodsListTmp := map[string]string{ |
|
|
|
|
|
"is_click": "0", |
|
|
|
|
|
"content": v, |
|
|
|
|
|
"gid": "", |
|
|
|
|
|
"url": "", |
|
|
|
|
|
"platform_type": "", |
|
|
|
|
|
} |
|
|
|
|
|
if strings.Contains(v, "href=") { |
|
|
|
|
|
var tmps = strings.Split(v, "</div>") |
|
|
|
|
|
for _, v1 := range tmps { |
|
|
|
|
|
if strings.Contains(v1, "href=") { |
|
|
|
|
|
url := To(v1, "href=\"", "\"") |
|
|
|
|
|
gid := To(v1, "item_id=\"", "\"") |
|
|
|
|
|
platformType := To(v1, "open_type=\"", "\"") |
|
|
|
|
|
goodsListTmp = map[string]string{ |
|
|
|
|
|
"is_click": "1", |
|
|
|
|
|
"content": "去购买>\n", |
|
|
|
|
|
"gid": gid, |
|
|
|
|
|
"url": "", |
|
|
|
|
|
"platform_type": platformTypeList[platformType], |
|
|
|
|
|
} |
|
|
|
|
|
if platformType == "JD" && gid == "" { |
|
|
|
|
|
goodsListTmp = map[string]string{ |
|
|
|
|
|
"is_click": "0", |
|
|
|
|
|
"content": url, |
|
|
|
|
|
"gid": "", |
|
|
|
|
|
"url": "", |
|
|
|
|
|
"platform_type": platformTypeList[platformType], |
|
|
|
|
|
} |
|
|
|
|
|
} |
|
|
|
|
|
} |
|
|
|
|
|
} |
|
|
|
|
|
} |
|
|
|
|
|
goodsList = append(goodsList, goodsListTmp) |
|
|
|
|
|
|
|
|
|
|
|
} |
|
|
|
|
|
return goodsList |
|
|
|
|
|
} |