优化爬虫执行逻辑

This commit is contained in:
fantasticbin 2024-04-04 08:35:20 +08:00
parent ef7891de9c
commit 4c8838846a
2 changed files with 19 additions and 14 deletions

View File

@ -9,7 +9,7 @@ var rootCmd = &cobra.Command{
Use: "anime",
Short: "Anime crawler written by go",
Run: func(cmd *cobra.Command, args []string) {
start()
NewCrawler().Start()
fmt.Println("抓取完成")
},
}

View File

@ -12,11 +12,17 @@ import (
"sync"
)
var wg sync.WaitGroup
type Crawler struct {
wg sync.WaitGroup
path string
}
// start 开始执行
func start() {
path := output
func NewCrawler() *Crawler {
return &Crawler{}
}
func (c *Crawler) Start() {
c.path = output
if folderTitleUrl != "" {
chapterTitle := FindChapterTitle(folderTitleUrl, chapter)
title := strings.Join([]string{
@ -25,26 +31,25 @@ func start() {
"话-",
chapterTitle,
}, "")
path = filepath.Join(output, title) // 组装章节路径
c.path = filepath.Join(output, title) // 组装章节路径
}
err := IfPathNotExistDoMkdir(path)
err := IfPathNotExistDoMkdir(c.path)
if err != nil {
fmt.Println("输出目录创建失败:", err)
return
}
c.wg.Add(max)
for i := 1; i <= max; i++ {
wg.Add(1)
go get(i, path)
go c.do(i)
}
wg.Wait()
c.wg.Wait()
}
// get 获取漫画图片
func get(num int, path string) {
defer wg.Done()
func (c *Crawler) do(num int) {
defer c.wg.Done()
// 兼容未携带斜杆的地址
if url[0] != '/' {
@ -88,7 +93,7 @@ func get(num int, path string) {
}(resp.Body)
reader := bufio.NewReaderSize(resp.Body, 32*1024)
file, err := os.Create(path + "/" + fileName)
file, err := os.Create(c.path + "/" + fileName)
if err != nil {
fmt.Println(fileName, "图片创建失败:", err)
return