walker/scrape_test.go
2022-06-02 11:17:56 +02:00

34 lines
650 B
Go

package walker
import (
"bytes"
_ "embed"
"fmt"
"testing"
"github.com/PuerkitoBio/goquery"
"github.com/davecgh/go-spew/spew"
)
// testDoc holds the raw bytes of test.html, embedded into the test binary at
// compile time. It is the input document parsed by TestScrape.
//
//go:embed "test.html"
var testDoc []byte
// TestScrape parses the embedded test document, re-parses the text content of
// every <noscript> element as a standalone HTML document, and prints each
// anchor found inside it (its index, whether an href attribute exists, and the
// href value).
//
// The test makes no assertions about the extracted links; it fails only when
// one of the documents cannot be parsed.
func TestScrape(t *testing.T) {
	doc, err := goquery.NewDocumentFromReader(bytes.NewReader(testDoc))
	if err != nil {
		// Stop here: continuing with the document from a failed parse would
		// panic in doc.Find rather than report a test failure.
		t.Fatalf("parsing embedded test document: %v\n%s", err, spew.Sdump(err))
	}

	doc.Find("noscript").Each(func(_ int, noscript *goquery.Selection) {
		content := noscript.Text()
		fmt.Println(content)

		// The <noscript> content is taken as text and parsed again so that the
		// markup inside it can be queried.
		// NOTE(review): presumably the parser exposes noscript bodies as raw
		// text rather than child elements — confirm against test.html.
		inner, err := goquery.NewDocumentFromReader(bytes.NewBufferString(content))
		if err != nil {
			// Report the failure instead of silently skipping this element.
			t.Errorf("parsing noscript content: %v", err)
			return
		}

		inner.Find("a").Each(func(i int, anchor *goquery.Selection) {
			href, exists := anchor.Attr("href")
			fmt.Println(i, exists, href)
		})
	})
}