Search/text-google.go

95 lines
2.1 KiB
Go
Raw Normal View History

2024-05-17 14:26:28 +02:00
// text-google.go
2024-04-15 08:35:17 +02:00
package main
import (
	"fmt"
	"log"
	"net/http"
	"net/url"
	"strconv"
	"strings"
	"time"

	"github.com/PuerkitoBio/goquery"
)
func PerformGoogleTextSearch(query, safe, lang string, page int) ([]TextSearchResult, error) {
const resultsPerPage = 10
2024-04-15 08:35:17 +02:00
var results []TextSearchResult
client := &http.Client{}
safeParam := "&safe=off"
if safe == "active" {
safeParam = "&safe=active"
}
langParam := ""
if lang != "" {
langParam = "&lr=" + lang
}
// Calculate the start index based on the page number
startIndex := (page - 1) * resultsPerPage
searchURL := "https://www.google.com/search?q=" + url.QueryEscape(query) + safeParam + langParam + "&udm=14&start=" + strconv.Itoa(startIndex)
2024-04-15 08:35:17 +02:00
req, err := http.NewRequest("GET", searchURL, nil)
if err != nil {
return nil, fmt.Errorf("failed to create request: %v", err)
2024-04-15 08:35:17 +02:00
}
req.Header.Set("User-Agent", "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/107.0.0.0 Safari/537.36")
resp, err := client.Do(req)
if err != nil {
return nil, fmt.Errorf("making request: %v", err)
2024-04-15 08:35:17 +02:00
}
defer resp.Body.Close()
if resp.StatusCode != http.StatusOK {
return nil, fmt.Errorf("unexpected status code: %d", resp.StatusCode)
}
2024-04-15 08:35:17 +02:00
doc, err := goquery.NewDocumentFromReader(resp.Body)
if err != nil {
return nil, fmt.Errorf("loading HTML document: %v", err)
2024-04-15 08:35:17 +02:00
}
doc.Find(".yuRUbf").Each(func(i int, s *goquery.Selection) {
link := s.Find("a")
href, exists := link.Attr("href")
if !exists {
if debugMode {
log.Printf("No href attribute found for result %d\n", i)
}
return
}
2024-04-15 08:35:17 +02:00
header := link.Find("h3").Text()
header = strings.TrimSpace(strings.TrimSuffix(header, ""))
descSelection := doc.Find(".VwiC3b").Eq(i)
description := ""
if descSelection.Length() > 0 {
description = descSelection.Text()
}
2024-05-18 01:59:29 +02:00
result := TextSearchResult{
2024-04-15 08:35:17 +02:00
URL: href,
Header: header,
Description: description,
2024-05-18 01:59:29 +02:00
}
results = append(results, result)
if debugMode {
log.Printf("Google result: %+v\n", result)
}
2024-04-15 08:35:17 +02:00
})
if len(results) == 0 {
if debugMode {
log.Println("No results found from Google")
}
}
2024-04-15 08:35:17 +02:00
return results, nil
}