Skip to content

Instantly share code, notes, and snippets.

@7yan00
Last active August 29, 2015 14:13
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 1 You must be signed in to fork a gist
  • Save 7yan00/ee98ac0eeb07ce5fff4c to your computer and use it in GitHub Desktop.
Save 7yan00/ee98ac0eeb07ce5fff4c to your computer and use it in GitHub Desktop.
hoge
package main
import (
"fmt"
"io"
"net/http"
"net/url"
"os"
"strings"
"sync"
"github.com/PuerkitoBio/goquery"
)
var stock = []string{}
var base string = "http://blog.golang.org/"
var i int = 0
var wg = new(sync.WaitGroup)
func main() {
doc, _ := goquery.NewDocument(base)
result := makeUrl(doc)
results := GetUrl(result)
for len(results) > 0 {
results = GetUrl(results)
}
fmt.Println(results)
wg.Wait()
}
func GetUrl(urls []*url.URL) []*url.URL {
sorceUrl := []*url.URL{}
L:
for _, item := range urls {
url_string := item.String()
if !strings.Contains(url_string, base) {
continue L
}
for e := 0; e < len(stock); e++ {
if url_string == stock[e] {
continue L
}
}
fmt.Println(url_string)
stock = append(stock, url_string)
doc, _ := goquery.NewDocument(base)
results := makeUrl(doc)
wg.Add(1)
go GetImage(doc)
sorceUrl = append(sorceUrl, results...)
}
fmt.Println("hohohohohohohohohoho")
return sorceUrl
}
func makeUrl(doc *goquery.Document) []*url.URL {
var result []*url.URL
doc.Find("a").Each(func(_ int, s *goquery.Selection) {
target, _ := s.Attr("href")
base, _ := url.Parse(base)
targets, _ := url.Parse(target)
result = append(result, base.ResolveReference(targets))
})
return result
}
func GetImage(doc *goquery.Document) {
var result []*url.URL
doc.Find("img").Each(func(_ int, s *goquery.Selection) {
target, _ := s.Attr("src")
base, _ := url.Parse(base)
targets, _ := url.Parse(target)
result = append(result, base.ResolveReference(targets))
})
for _, imageUrl := range result {
imageUrl_String := imageUrl.String()
response, err := http.Get(imageUrl_String)
if err != nil {
panic(err)
}
defer response.Body.Close()
file, err := os.Create(fmt.Sprintf("hoge%d.jpg", i))
i++
if err != nil {
panic(err)
}
defer file.Close()
io.Copy(file, response.Body)
}
wg.Done()
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment