12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182 |
- package goquery_test
- import (
- "fmt"
- "log"
- "net/http"
- "os"
- "strings"
- "github.com/PuerkitoBio/goquery"
- )
- // This example scrapes the reviews shown on the home page of metalsucks.net.
- func Example() {
- // Request the HTML page.
- res, err := http.Get("http://metalsucks.net")
- if err != nil {
- log.Fatal(err)
- }
- defer res.Body.Close()
- if res.StatusCode != 200 {
- log.Fatalf("status code error: %d %s", res.StatusCode, res.Status)
- }
- // Load the HTML document
- doc, err := goquery.NewDocumentFromReader(res.Body)
- if err != nil {
- log.Fatal(err)
- }
- // Find the review items
- doc.Find(".sidebar-reviews article .content-block").Each(func(i int, s *goquery.Selection) {
- // For each item found, get the band and title
- band := s.Find("a").Text()
- title := s.Find("i").Text()
- fmt.Printf("Review %d: %s - %s\n", i, band, title)
- })
- // To see the output of the Example while running the test suite (go test), simply
- // remove the leading "x" before Output on the next line. This will cause the
- // example to fail (all the "real" tests should pass).
- // xOutput: voluntarily fail the Example output.
- }
- // This example shows how to use NewDocumentFromReader from a file.
- func ExampleNewDocumentFromReader_file() {
- // create from a file
- f, err := os.Open("some/file.html")
- if err != nil {
- log.Fatal(err)
- }
- defer f.Close()
- doc, err := goquery.NewDocumentFromReader(f)
- if err != nil {
- log.Fatal(err)
- }
- // use the goquery document...
- _ = doc.Find("h1")
- }
- // This example shows how to use NewDocumentFromReader from a string.
- func ExampleNewDocumentFromReader_string() {
- // create from a string
- data := `
- <html>
- <head>
- <title>My document</title>
- </head>
- <body>
- <h1>Header</h1>
- </body>
- </html>`
- doc, err := goquery.NewDocumentFromReader(strings.NewReader(data))
- if err != nil {
- log.Fatal(err)
- }
- header := doc.Find("h1").Text()
- fmt.Println(header)
- // Output: Header
- }
|