Fixed Brave Meta search starting at page 2 instead of 1
Some checks failed
Run Integration Tests / test (push) Has been cancelled

This commit is contained in:
partisan 2025-03-15 11:42:32 +01:00
parent fa825d54a7
commit 9420810092

View file

@ -17,7 +17,10 @@ func PerformBraveTextSearch(query, safe, lang string, offset int) ([]TextSearchR
var results []TextSearchResult var results []TextSearchResult
// Build the search URL // Build the search URL
searchURL := fmt.Sprintf("https://search.brave.com/search?q=%s&offset=%d", url.QueryEscape(query), offset) searchURL := fmt.Sprintf("https://search.brave.com/search?q=%s", url.QueryEscape(query))
if offset > 1 {
searchURL += fmt.Sprintf("&offset=%d&spellcheck=0", offset-1)
}
req, err := http.NewRequest("GET", searchURL, nil) req, err := http.NewRequest("GET", searchURL, nil)
if err != nil { if err != nil {
@ -50,34 +53,47 @@ func PerformBraveTextSearch(query, safe, lang string, offset int) ([]TextSearchR
// Parse the response body // Parse the response body
doc, err := goquery.NewDocumentFromReader(strings.NewReader(string(body))) doc, err := goquery.NewDocumentFromReader(strings.NewReader(string(body)))
if err != nil { if err != nil {
printErr("Error parsing response body: %v", err) return nil, 0, fmt.Errorf("parsing HTML: %v", err)
return nil, 0, fmt.Errorf("parsing response body: %v", err)
} }
// Extract search results // Only grab .snippet blocks that have data-type="web"
doc.Find(".snippet").Each(func(i int, s *goquery.Selection) { doc.Find(`.snippet[data-type="web"]`).Each(func(i int, s *goquery.Selection) {
title := s.Find(".title").Text()
description := s.Find(".snippet-description").Text()
url, exists := s.Find("a").Attr("href")
// Add to results only if all components are present // The main clickable link is <a ... class="heading-serpresult">
if title != "" && description != "" && exists && url != "" { anchor := s.Find("a.heading-serpresult").First()
link, ok := anchor.Attr("href")
if !ok || link == "" {
return
}
// Title is inside <div class="title">
title := strings.TrimSpace(anchor.Find(".title").Text())
if title == "" {
// fallback if the .title is slightly off in the DOM
title = strings.TrimSpace(s.Find(".title").Text())
}
// Description is inside <div class="snippet-description">
desc := strings.TrimSpace(s.Find(".snippet-description").Text())
// Add only if everything is non-empty
if title != "" && desc != "" {
results = append(results, TextSearchResult{ results = append(results, TextSearchResult{
Header: title, Header: title,
URL: url, URL: link,
Description: description, Description: desc,
}) })
} }
}) })
duration := time.Since(startTime) // Calculate the duration duration := time.Since(startTime)
// Return an error if no results are found // Return an error if no results are found
if len(results) == 0 { if len(results) == 0 {
printDebug("No results found for query: %s", query) printDebug("No results found for query")
return nil, duration, fmt.Errorf("no results found") return nil, duration, fmt.Errorf("no results found")
} }
printDebug("Search completed successfully for query: %s, found %d results", query, len(results)) printDebug("Search completed successfully found %d results", len(results))
return results, duration, nil return results, duration, nil
} }