forked from ernesto-jimenez/scraperboard
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgoogle-cli.go
49 lines (40 loc) · 1009 Bytes
/
google-cli.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
package main
import (
"flag"
"fmt"
"github.com/ernesto-jimenez/scraperboard"
"net/url"
"strings"
)
func main() {
flag.Parse()
query := strings.Join(flag.Args(), " ")
searchURL := fmt.Sprintf("https://www.google.com/search?q=%s", url.QueryEscape(query))
scraper, _ := scraperboard.NewScraperFromString(scraperXML)
var response Response
scraper.ExtractFromURL(searchURL, &response)
for _, result := range response.Results {
fmt.Printf("%s:\n\t%s\n", result.Title, result.URL)
}
}
// Response contains an array of google results (Result)
type Response struct {
Results []Result
}
// Result has a Title and URL
type Result struct {
Title string
URL string
}
var scraperXML = `
<Scraper>
<Each name="results" selector="#search ol > li">
<Property name="title" selector="h3 a"/>
<Property name="url" selector="h3 a">
<Filter type="first"/>
<Filter type="attr" argument="href"/>
<Filter type="regex" argument="q=([^&]+)"/>
</Property>
</Each>
</Scraper>
`