2024-05-18 01:59:29 +02:00
|
|
|
// text-duckduckgo.go
|
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
"log"
|
|
|
|
"net/http"
|
|
|
|
"net/url"
|
|
|
|
"strings"
|
2024-05-19 22:57:23 +02:00
|
|
|
"time"
|
2024-05-18 01:59:29 +02:00
|
|
|
|
|
|
|
"github.com/PuerkitoBio/goquery"
|
|
|
|
)
|
|
|
|
|
2024-05-19 22:57:23 +02:00
|
|
|
func PerformDuckDuckGoTextSearch(query, safe, lang string, page int) ([]TextSearchResult, error) {
|
|
|
|
const resultsPerPage = 10
|
2024-05-18 01:59:29 +02:00
|
|
|
var results []TextSearchResult
|
|
|
|
|
2024-05-19 22:57:23 +02:00
|
|
|
client := &http.Client{Timeout: 10 * time.Second}
|
|
|
|
searchURL := fmt.Sprintf("https://duckduckgo.com/html/?q=%s&s=%d", url.QueryEscape(query), (page-1)*resultsPerPage)
|
|
|
|
|
|
|
|
req, err := http.NewRequest("GET", searchURL, nil)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to create request: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
req.Header.Set("User-Agent", "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/107.0.0.0 Safari/537.36")
|
|
|
|
|
|
|
|
resp, err := client.Do(req)
|
2024-05-18 01:59:29 +02:00
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("making request: %v", err)
|
|
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
|
|
return nil, fmt.Errorf("unexpected status code: %d", resp.StatusCode)
|
|
|
|
}
|
|
|
|
|
|
|
|
doc, err := goquery.NewDocumentFromReader(resp.Body)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("loading HTML document: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
doc.Find(".result__body").Each(func(i int, s *goquery.Selection) {
|
|
|
|
header := s.Find(".result__a").Text()
|
|
|
|
description := s.Find(".result__snippet").Text()
|
|
|
|
rawURL, exists := s.Find(".result__a").Attr("href")
|
|
|
|
if exists {
|
|
|
|
parsedURL, err := url.Parse(rawURL)
|
|
|
|
if err == nil {
|
|
|
|
queryParams := parsedURL.Query()
|
|
|
|
uddg := queryParams.Get("uddg")
|
|
|
|
if uddg != "" {
|
|
|
|
result := TextSearchResult{
|
|
|
|
URL: uddg,
|
|
|
|
Header: strings.TrimSpace(header),
|
|
|
|
Description: strings.TrimSpace(description),
|
|
|
|
}
|
|
|
|
results = append(results, result)
|
|
|
|
if debugMode {
|
|
|
|
log.Printf("Processed DuckDuckGo result: %+v\n", result)
|
|
|
|
}
|
2024-05-19 22:57:23 +02:00
|
|
|
} else {
|
|
|
|
if debugMode {
|
|
|
|
log.Printf("Missing 'uddg' parameter in URL: %s\n", rawURL)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if debugMode {
|
|
|
|
log.Printf("Error parsing URL: %s, error: %v\n", rawURL, err)
|
2024-05-18 01:59:29 +02:00
|
|
|
}
|
|
|
|
}
|
2024-05-19 22:57:23 +02:00
|
|
|
} else {
|
|
|
|
if debugMode {
|
|
|
|
log.Printf("Missing 'href' attribute in result anchor tag\n")
|
|
|
|
}
|
2024-05-18 01:59:29 +02:00
|
|
|
}
|
|
|
|
})
|
|
|
|
|
2024-05-19 22:57:23 +02:00
|
|
|
if len(results) == 0 {
|
|
|
|
if debugMode {
|
|
|
|
log.Println("No results found from DuckDuckGo")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-05-18 01:59:29 +02:00
|
|
|
return results, nil
|
|
|
|
}
|