crawl

package
v0.0.0-...-435ca04 Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Oct 19, 2020 | License: Apache-2.0 | Imports: 9 | Imported by: 0

Documentation

Index

Constants

This section is empty.

Variables

This section is empty.

Functions

func Crawl

func Crawl(url string, external bool, delay int, maxVisits int)

Types

type Ext

type Ext struct {
	*gocrawl.DefaultExtender
}

func (*Ext) ComputeDelay

func (e *Ext) ComputeDelay(host string, di *gocrawl.DelayInfo, lastFetch *gocrawl.FetchInfo) time.Duration

func (*Ext) End

func (e *Ext) End(err error)

func (*Ext) Error

func (e *Ext) Error(err *gocrawl.CrawlError)

func (*Ext) Filter

func (e *Ext) Filter(ctx *gocrawl.URLContext, isVisited bool) bool

func (*Ext) Visit

func (e *Ext) Visit(ctx *gocrawl.URLContext, res *http.Response, doc *goquery.Document) (interface{}, bool)

type ResultSummary

type ResultSummary struct {
	Http200 int
	Errors  int
}

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL