intimate/extractor/twitcasting_extractor/twitcasting_extractor.go

153 lines
4.4 KiB
Go
Raw Normal View History

2020-08-11 10:26:17 +00:00
package main
import (
"database/sql"
"intimate"
"log"
"regexp"
"strconv"
"strings"
"time"
"github.com/474420502/extractor"
"github.com/474420502/requests"
)
// sstore 源存储实例, 为存储源数据的实现. 表格具体参考sql/intimate_source.sql
var sstore *intimate.StoreSource = intimate.NewStoreSource(string(intimate.STOpenrec))
// estore 解析存储连接实例
var estore *intimate.StoreExtractor = intimate.NewStoreExtractor()
type LiveData struct {
UserName string `exp:"//span[@class='tw-live-author__info-username']" method:"Text"`
Follower string `exp:"(//span[@class='tw-user-nav-list-count'])[2]" method:"Text"`
MaxViews string `exp:"//span[@id='max_viewer_count']" method:"Text"`
LiveTitle string `exp:"//meta[@property='og:title']" method:"AttributeValue,content"`
2020-08-12 04:22:46 +00:00
LiveStart string `exp:"//time[@data-kind='relative']" method:"AttributeValue,datetime"`
2020-08-11 10:26:17 +00:00
LiveDuration string `exp:"//span[@id='updatetimer']" method:"AttributeValue,data-duration"`
2020-08-12 04:22:46 +00:00
Tags []string `exp:"//div[@class='tw-live-author__commandbox--tags']//a[@class='tag tag-info']" method:"Text"`
2020-08-11 10:26:17 +00:00
}
func main() {
ps := intimate.NewPerfectShutdown()
2020-08-12 04:22:46 +00:00
ses := requests.NewSession()
2020-08-11 10:26:17 +00:00
for !ps.IsClose() {
streamer, err := estore.Pop(intimate.Ptwitcasting)
if err != nil {
2020-08-12 04:22:46 +00:00
log.Println(err, streamer.UserId)
2020-08-11 10:26:17 +00:00
}
2020-08-12 04:22:46 +00:00
streamer.LiveUrl = sql.NullString{String: "https://twitcasting.tv/" + streamer.UserId, Valid: true}
resp, err := ses.Get(streamer.LiveUrl.String).Execute()
2020-08-11 10:26:17 +00:00
if err != nil {
2020-08-12 04:22:46 +00:00
estore.UpdateError(streamer, err)
log.Println(err, streamer.UserId)
continue
2020-08-11 10:26:17 +00:00
}
var ldata *LiveData
2020-08-12 09:42:27 +00:00
etor := extractor.ExtractHtml(resp.Content())
2020-08-11 10:26:17 +00:00
ldata = etor.GetObjectByTag(LiveData{}).(*LiveData)
ldata.MaxViews = regexp.MustCompile("\\d+").FindString(ldata.MaxViews)
coincount := 0
for i := 0; ; i++ {
2020-08-12 04:22:46 +00:00
giverurl := streamer.LiveUrl.String + "/backers/" + strconv.Itoa(i)
2020-08-11 10:26:17 +00:00
resp, err = ses.Get(giverurl).Execute()
if err != nil {
2020-08-12 09:42:27 +00:00
estore.UpdateError(streamer, err)
2020-08-11 10:26:17 +00:00
log.Panic(err)
}
2020-08-12 09:42:27 +00:00
etor := extractor.ExtractHtml(resp.Content())
2020-08-11 10:26:17 +00:00
xp, err := etor.XPaths("//td[@class='tw-memorial-table-recent-point']")
if err != nil {
2020-08-12 09:42:27 +00:00
estore.UpdateError(streamer, err)
2020-08-11 10:26:17 +00:00
log.Panic(err)
}
coins := xp.GetTexts()
for _, cointxt := range coins {
scointxt := strings.Split(cointxt, "/")
if len(scointxt) == 2 {
coin := strings.Trim(scointxt[1], " ")
c, err := strconv.Atoi(coin)
if err == nil {
coincount += c
}
2020-08-12 04:22:46 +00:00
// log.Println(coin, coincount)
2020-08-11 10:26:17 +00:00
} else {
log.Println("coin error: ", cointxt)
}
}
if len(coins) < 20 {
break
}
}
streamer.Platform = intimate.Ptwitcasting
streamer.UpdateTime = sql.NullTime{Time: time.Now(), Valid: true}
streamer.UserName = sql.NullString{String: ldata.UserName, Valid: true}
2020-08-12 04:22:46 +00:00
streamer.Operator = 10
// streamer.UpdateInterval = 60
2020-08-11 10:26:17 +00:00
clog := &intimate.CollectLog{}
clog.UserId = streamer.UserId
clog.Gratuity = sql.NullInt64{Int64: int64(coincount), Valid: true}
clog.Platform = streamer.Platform
clog.UpdateTime = streamer.UpdateTime
clog.LiveTitle = sql.NullString{String: ldata.LiveTitle, Valid: true}
2020-08-12 04:22:46 +00:00
fl, err := intimate.ParseNumberEx(ldata.Follower)
2020-08-11 10:26:17 +00:00
if err == nil {
clog.Followers = sql.NullInt64{Int64: int64(fl), Valid: true}
2020-08-12 04:22:46 +00:00
switch {
case fl <= 100:
streamer.UpdateInterval = 360
case fl <= 1000:
streamer.UpdateInterval = 240
case fl <= 100:
streamer.UpdateInterval = 120
default:
streamer.UpdateInterval = 60
}
2020-08-11 10:26:17 +00:00
} else {
log.Println(err)
}
views, err := strconv.Atoi(ldata.MaxViews)
if err == nil {
clog.Views = sql.NullInt64{Int64: int64(views), Valid: true}
} else {
2020-08-12 04:22:46 +00:00
clog.Views = sql.NullInt64{Int64: int64(0), Valid: true}
// log.Println(err, streamer.UserId)
2020-08-11 10:26:17 +00:00
}
2020-08-12 04:22:46 +00:00
// st, err := strconv.Atoi(ldata.LiveStart)
st, err := time.Parse("Mon, 02 Jan 2006 15:04:05 -0700", ldata.LiveStart)
2020-08-11 10:26:17 +00:00
if err == nil {
2020-08-12 04:22:46 +00:00
startTime := st
2020-08-11 10:26:17 +00:00
clog.LiveStartTime = sql.NullTime{Time: startTime, Valid: true}
dt, err := strconv.Atoi(ldata.LiveDuration)
2020-08-12 04:22:46 +00:00
if time.Now().Sub(startTime) >= time.Hour*24*90 {
streamer.Operator = 5
}
2020-08-11 10:26:17 +00:00
2020-08-12 04:22:46 +00:00
if err == nil {
endTime := startTime.Add((time.Duration)(dt) * time.Millisecond)
2020-08-11 10:26:17 +00:00
clog.LiveEndTime = sql.NullTime{Time: endTime, Valid: true}
} else {
2020-08-12 04:22:46 +00:00
log.Println(err, streamer.UserId)
2020-08-11 10:26:17 +00:00
}
} else {
2020-08-12 04:22:46 +00:00
log.Println(err, streamer.UserId)
2020-08-11 10:26:17 +00:00
}
streamer.LatestLogUid = estore.InsertClog(clog)
estore.UpdateStreamer(streamer)
}
}