一般图片的地址都藏在html中img标签的src属性里,所以我们可以遍历html的img标签,获取地址并保存图片。我采用了goquery,一个很不错的解析html的库。
下面上代码,爬的是新浪的。主线程sleep是为了防止goroutine泄漏,当然也可以通过通道(channel)来避免。
package main
import (
"github.com/PuerkitoBio/goquery"
"fmt"
"os"
// "log"
"path"
"strings"
"regexp"
"math/rand"
"io"
"net/http"
"time"
)
func randFileName(dirPath string,suffix string) (fileName string) {
var randChar string = "abcdefghimnjkqzxyt0123456789ioedkaldncalew0129387iue"
var name string
size :=