gopdynamiccrawler

package
v0.0.0-...-37b0e48 Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Apr 27, 2024 | License: MIT | Imports: 15 | Imported by: 0

Documentation

Index

Constants

This section is empty.

Variables

View Source
// Exported package-level state of the crawler.
// NOTE(review): the purposes noted below are inferred from identifier names
// and types only; confirm against the implementation.
var (
	// Internal_ressources and External_ressources are slices of pointers to
	// gopstaticcrawler.Ressource; presumably resources found on the crawled
	// site versus on other hosts — TODO confirm.
	Internal_ressources []*gopstaticcrawler.Ressource
	External_ressources []*gopstaticcrawler.Ressource
	// URLVisited is a URLVisitedStruct, a type that embeds sync.RWMutex.
	// Presumably it records already-visited URLs — TODO confirm.
	URLVisited          URLVisitedStruct
	// ScreenshotList is a slice of gopchromedp.Item values.
	ScreenshotList      []gopchromedp.Item
	// ScreenshotChan carries empty structs, i.e. it is a pure signalling
	// channel with no payload.
	ScreenshotChan      chan struct{}
	// UrlChan carries strings; presumably URLs to process — TODO confirm.
	UrlChan             chan string
)

Functions

func InitCrawler

func InitCrawler()

func NewOptions

func NewOptions(url *string, logFileOption *os.File, report *bool, recursive *bool, screenshot *bool, cookie *string, proxy *string, delay *int, concurrency *int)

func PrintOptions

func PrintOptions(options *Options)

func RunCrawlerCmd

func RunCrawlerCmd()

RunCrawlerCmd runs the crawler.

func TreatA

func TreatA(doc *goquery.Document) []string

func TreatLinkHref

func TreatLinkHref(doc *goquery.Document) []string

func TreatScriptSrc

func TreatScriptSrc(doc *goquery.Document) []string

Types

type Options

// Options groups the crawler's settings. Every field is a pointer, and the
// field set mirrors the parameter list of NewOptions (url, logFileOption,
// report, recursive, screenshot, cookie, proxy, delay, concurrency).
// NOTE(review): per-field meanings are inferred from names — confirm.
type Options struct {
	UrlPtr         *string  // presumably the start URL — TODO confirm
	LogFile        *os.File // file handle, presumably the log destination
	ReportPtr      *bool
	RecursivePtr   *bool
	ScreenshotPtr  *bool
	CookiePtr      *string
	ProxyPtr       *string
	DelayPtr       *int // unit is not visible here — TODO confirm
	ConcurrencyPtr *int
}
// GoCrawlerOptions is a package-level Options value. NewOptions returns
// nothing, so it presumably stores its arguments here — TODO confirm.
var GoCrawlerOptions Options

type URLVisitedStruct

type URLVisitedStruct struct {
	sync.RWMutex
	// contains filtered or unexported fields
}

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL