go - 我怎样才能使这个脚本多线程
问题描述
我使用代码的方式是从文件中传递一个 url 列表并用我的代码运行每个 url,代码使用 bufio,所以我可以从文件中传递 url。
命令:猫 test2.txt | ./mygofile
https://beap.adss.yahoo.com/
https://id.answers.yahoo.com/search
https://brokenurl
https://id.answers.yahoo.com/KnowledgeSearchService
https://id.answers.yahoo.com/question/nextQuestion
示例 URL 的内容
package main
import (
"log"
"bufio"
"bytes"
"fmt"
"net/http"
"os"
"strings"
"crypto/tls"
)
func main() {
tr := http.DefaultTransport.(*http.Transport).Clone()
tr.TLSClientConfig = &tls.Config{InsecureSkipVerify: true}
client := &http.Client{Transport: tr}
passedUrl := bufio.NewScanner(os.Stdin)
var pUrl string
for passedUrl.Scan() {
fmt.Println(passedUrl.Text())
if strings.Contains(passedUrl.Text(), "://"){
pUrl = passedUrl.Text()
} else {
pUrl = "https://" + passedUrl.Text()
}
body := "<?xml version=\"1.0\"?>"
req, err := http.NewRequest("POST", pUrl, bytes.NewBuffer([]byte(body)))
if err != nil {
log.Println(err)
}
req.Header.Add("Content-Type", "application/xml; charset=utf-8")
resp, err := client.Do(req)
if err != nil {
log.Println(err)
continue // stop here and process next item
}
defer resp.Body.Close()
}
}
问题是当我提供大量 url 时代码非常慢。有什么方法可以让代码以简单的方式多线程或更快
解决方案
创建工作者 goroutine 池。worker goroutine 从通道获取要处理的 url,并在通道关闭时退出。主 goroutine 将 url 提供给通道并在完成后关闭通道。
tr := http.DefaultTransport.(*http.Transport).Clone()
tr.TLSClientConfig = &tls.Config{InsecureSkipVerify: true}
client := &http.Client{Transport: tr}
var wg sync.WaitGroup
work := make(chan string)
for i := 0; i < 10; i++ {
wg.Add()
go func() {
defer wg.Done()
for pUrl := range work {
fmt.Println(purl)
if !strings.Contains(purl, "://") {
pUrl = "https://" + passedUrl.Text()
}
body := "<?xml version=\"1.0\"?>"
req, err := http.NewRequest("POST", pUrl, strings.NewReader(body))
if err != nil {
log.Println(err)
continue
}
req.Header.Add("Content-Type", "application/xml; charset=utf-8")
resp, err := client.Do(req)
if err != nil {
log.Println(err)
continue // stop here and process next item
}
// do something with resp
resp.Body.Close()
}
}()
}
passedUrl := bufio.NewScanner(os.Stdin)
for passedUrl.Scan() {
work <- passedUrl.Text()
}
close(work) // signal workers to exit
wg.Wait() // wait for workers to exit