crawl

package
v0.0.0-...-6782837 (Latest)
Warning

This package is not in the latest version of its module.

Go to latest
Published: Feb 13, 2023 | License: Apache-2.0 | Imports: 8 | Imported by: 0

Documentation

Index

Constants

This section is empty.

Variables

This section is empty.

Functions

This section is empty.

Types

type LinkExtractor

type LinkExtractor struct {
}

func NewLinkExtractor

func NewLinkExtractor() LinkExtractor

type Scraper

type Scraper struct {
	// contains filtered or unexported fields
}

func NewScraper

func NewScraper() *Scraper

func (*Scraper) ScrapeUrl

func (s *Scraper) ScrapeUrl(baseUrl string) ([]string, error)

type WebPageExtractor

type WebPageExtractor struct {
}

func NewWebPageExtractor

func NewWebPageExtractor() *WebPageExtractor

func (*WebPageExtractor) ExtractWebPage

func (w *WebPageExtractor) ExtractWebPage(webPageUrl string, webPageResponse chan *http.Response, errorChannel chan error)

type WebPageParser

type WebPageParser struct {
	// contains filtered or unexported fields
}

func NewWebPageParser

func NewWebPageParser(linkExtractor LinkExtractor) *WebPageParser

func (*WebPageParser) Parse

func (w *WebPageParser) Parse(response *http.Response, urlChannel chan string, wg *sync.WaitGroup,
	urlCache *sync.Map, baseUrl string)

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL