goquery实现了类似于jQuery的功能,包括可链接的语法,用于操作和查询HTML文档。
它为Go语言带来了类似于jQuery的语法和一组功能。它基于Go的net/html包和CSS选择器库cascadia。在语法方面,它尽可能接近jQuery,尽可能使用相同的方法名称。
安装软件包:
go get github.com/PuerkitoBio/goquery
示例代码1:
package main
import (
"fmt"
"log"
"net/http"
"github.com/PuerkitoBio/goquery"
)
func ExampleScrape() {
// http请求res, err := http.Get("https://stackoverflow.com/questions/tagged/javascript")
if err != nil {
log.Fatal(err)
}
defer res.Body.Close()
if res.StatusCode != 200 {
log.Fatalf("status code error: %d %s", res.StatusCode, res.Status)
}
// 加载html内容doc, err := goquery.NewDocumentFromReader(res.Body)
if err != nil {
log.Fatal(err)
}
// 查找目标元素doc.Find(".question-summary .summary").Each(func(i int, s *goquery.Selection) {
title := s.Find("H3").Text()
fmt.Println(i, title)
})
}
func main() {
ExampleScrape()
}
示例代码2:
package main
import (
"fmt"
"log"
"github.com/PuerkitoBio/goquery"
)
type Earthquake struct {
Timestamp string
Latitide string
Longitude string
Magnitudo string
Depth string
Territory string
}
var arrayEarthquake []Earthquake
func postScrape() {
doc, err := goquery.NewDocument("http://www.bmkg.go.id/gempabumi/gempabumi-terkini.bmkg")
if err != nil {
log.Fatal(err)
}
doc.Find("tbody tr").Each(func(_ int, tr *goquery.Selection) {
e := Earthquake{}
tr.Find("td").Each(func(ix int, td *goquery.Selection) {
switch ix {
case 1:
e.Timestamp = td.Text()
case 2:
e.Latitide = td.Text()
case 3:
e.Longitude = td.Text()
case 4:
e.Magnitudo = td.Text()
case 5:
e.Depth = td.Text()
case 6:
e.Territory = td.Text()
}
})
arrayEarthquake = append(arrayEarthquake, e)
})
fmt.Println(arrayEarthquake)
}
func main() {
postScrape()
}