Search/text-duckduckgo.go

71 lines
1.7 KiB
Go
Raw Normal View History

2024-05-18 01:59:29 +02:00
package main
import (
"fmt"
"log"
"net/http"
"net/url"
"strings"
"time"
2024-05-18 01:59:29 +02:00
"github.com/PuerkitoBio/goquery"
)
func PerformDuckDuckGoTextSearch(query, safe, lang string, page int) ([]TextSearchResult, time.Duration, error) {
startTime := time.Now() // Start the timer
2024-05-18 01:59:29 +02:00
var results []TextSearchResult
2024-06-09 21:44:49 +02:00
searchURL := buildDuckDuckGoSearchURL(query, page)
2024-05-18 01:59:29 +02:00
2024-06-09 12:43:46 +02:00
resp, err := http.Get(searchURL)
2024-05-18 01:59:29 +02:00
if err != nil {
return nil, 0, fmt.Errorf("making request: %v", err)
2024-05-18 01:59:29 +02:00
}
defer resp.Body.Close()
if resp.StatusCode != http.StatusOK {
return nil, 0, fmt.Errorf("unexpected status code: %d", resp.StatusCode)
2024-05-18 01:59:29 +02:00
}
doc, err := goquery.NewDocumentFromReader(resp.Body)
if err != nil {
return nil, 0, fmt.Errorf("loading HTML document: %v", err)
2024-05-18 01:59:29 +02:00
}
doc.Find(".result__body").Each(func(i int, s *goquery.Selection) {
header := s.Find(".result__a").Text()
description := s.Find(".result__snippet").Text()
rawURL, exists := s.Find(".result__a").Attr("href")
if exists {
parsedURL, err := url.Parse(rawURL)
if err == nil {
queryParams := parsedURL.Query()
uddg := queryParams.Get("uddg")
if uddg != "" {
result := TextSearchResult{
URL: uddg,
Header: strings.TrimSpace(header),
Description: strings.TrimSpace(description),
}
results = append(results, result)
if debugMode {
log.Printf("Processed DuckDuckGo result: %+v\n", result)
}
}
}
}
})
duration := time.Since(startTime) // Calculate the duration
return results, duration, nil
2024-05-18 01:59:29 +02:00
}
2024-06-09 21:44:49 +02:00
// buildDuckDuckGoSearchURL returns the DuckDuckGo HTML endpoint URL for query.
// For page values greater than 1 it appends an "s" offset parameter equal to
// (page-1)*10; for any other page value no offset is sent.
func buildDuckDuckGoSearchURL(query string, page int) string {
	params := url.Values{}
	params.Set("q", query)
	if page > 1 {
		params.Set("s", fmt.Sprint((page-1)*10))
	}
	// Encode sorts keys, so "q" is always emitted before "s".
	return "https://duckduckgo.com/html/?" + params.Encode()
}