MCPcopy
hub / github.com/edoardottt/cariddi / visitHTMLLink

Function visitHTMLLink

pkg/crawler/colly.go:433–440  ·  view source on GitHub ↗

visitHTMLLink checks if the collector should visit a link or not.

(link string, event *Event, e *colly.HTMLElement, c *colly.Collector)

Source from the content-addressed store, hash-verified

431
432// visitHTMLLink checks if the collector should visit a link or not.
433func visitHTMLLink(link string, event *Event, e *colly.HTMLElement, c *colly.Collector) {
434 if len(link) != 0 && !strings.HasPrefix(link, "data:image") {
435 absoluteURL := urlUtils.AbsoluteURL(event.ProtocolTemp, event.TargetTemp, e.Request.AbsoluteURL(link))
436 // Visit link found on page
437 // Only those links are visited which are in AllowedDomains
438 visitLink(event, c, absoluteURL)
439 }
440}
441
442// visitXMLLink checks if the collector should visit a link or not.
443func visitXMLLink(link string, event *Event, e *colly.XMLElement, c *colly.Collector) {

Callers 1

registerHTMLEvents (Function) · 0.85

Calls 1

visitLink (Function) · 0.85

Tested by

no test coverage detected