Documentation ¶
Index ¶
- Constants
- Variables
- func Any2AnyList(data interface{}) []interface{}
- func Any2Float64(data interface{}) float64
- func Any2Int(data interface{}) int
- func Any2Map(data interface{}) map[string]interface{}
- func Any2String(data interface{}) string
- func Any2Strings(data interface{}) []string
- func Any2int64(data interface{}) int64
- func Base64Decode(str string) (string, error)
- func Base64Encode(str string) string
- func Base64UrlDecode(str string) (string, error)
- func Base64UrlEncode(str string) string
- func BeginDayUnix() int64
- func Byte2Str(b []byte) string
- func ByteToBinaryString(data byte) (str string)
- func CleaningStr(str string) string
- func ConvertByte2String(byte []byte, charset Charset) string
- func Daydiff(beginDay string, endDay string) int
- func EndDayUnix() int64
- func FileMd5(path string) (string, error)
- func FileSizeFormat(fileSize int64) (size string)
- func GetAgent(agentType UserAgentType) string
- func GetNowPath() string
- func IsContainStr(items []string, item string) bool
- func Json2Map(str string) map[string]interface{}
- func MD5(str string) string
- func MongoConn()
- func MongoConn1()
- func NewGoquery(html string) (*goquery.Document, error)
- func NewMysqlDB(host string, port int, user, password, database string) (err error)
- func PanicToError(fn func()) (err error)
- func PathExists(path string)
- func Ping(ip string)
- func ReadCsvFile(filename string) [][]string
- func RedisDELKeys(rds *Rds, keys string, jobNumber int)
- func RegFindAll(regStr, rest string) [][]string
- func RegHtmlA(str string) []string
- func RegHtmlATxt(str string) []string
- func RegHtmlH(str, typeH string) []string
- func RegHtmlHTxt(str, typeH string) []string
- func RegHtmlHref(str string) []string
- func RegHtmlHrefTxt(str string) []string
- func RegHtmlInput(str string) []string
- func RegHtmlInputTxt(str string) []string
- func RegHtmlP(str string) []string
- func RegHtmlPTxt(str string) []string
- func RegHtmlSpan(str string) []string
- func RegHtmlSpanTxt(str string) []string
- func RegHtmlSrc(str string) []string
- func RegHtmlSrcTxt(str string) []string
- func RegHtmlTd(str string) []string
- func RegHtmlTdTxt(str string) []string
- func RegHtmlTitle(str string) []string
- func RegHtmlTitleTxt(str string) []string
- func RegHtmlTr(str string) []string
- func RegHtmlTrTxt(str string) []string
- func SSHClient(user string, pass string, addr string) (*ssh.Client, error)
- func SearchDomain(ip string)
- func SearchPort(ipStr string, vs ...interface{})
- func SetStatusCodeFailEvent(code int)
- func SetStatusCodeRetryEvent(code int)
- func SetStatusCodeSuccessEvent(code int)
- func StartJob()
- func StartJobGet(jobNumber int, queue TodoQueue, vs ...interface{})
- func StartJobPost(jobNumber int, queue TodoQueue, vs ...interface{})
- func Str2Float64(str string) float64
- func Str2Int64(str string) int64
- func StrDeleteSpace(str string) string
- func StringValue(i interface{}) string
- func StrsDuplicates(a []string) []string
- func Struct2Map(obj interface{}, hasValue bool) (map[string]interface{}, error)
- func TickerRun(t time.Duration, f func())
- func Timestamp() string
- func Uint82Str(bs []uint8) string
- func UnescapeUnicode(raw []byte) ([]byte, error)
- func Upload(url, savePath string, vs ...interface{}) error
- type Charset
- type Context
- func Delete(url string, vs ...interface{}) (*Context, error)
- func Get(url string, vs ...interface{}) (*Context, error)
- func GetRun(url string, vs ...interface{}) (ctx *Context, err error)
- func Options(url string, vs ...interface{}) (*Context, error)
- func Post(url string, data []byte, contentType string, vs ...interface{}) (*Context, error)
- func PostJson(url string, jsonStr string, vs ...interface{}) (*Context, error)
- func Put(url string, data []byte, contentType string, vs ...interface{}) (*Context, error)
- func Req(request *http.Request, vs ...interface{}) (*Context, error)
- func Request(url, method string, data []byte, contentType string, vs ...interface{}) (*Context, error)
- func (c *Context) AddCookie(cookie *http.Cookie)
- func (c *Context) AddHeader(k, v string)
- func (c *Context) CloseLog()
- func (c *Context) CookieNext() error
- func (c *Context) Do() func()
- func (c *Context) OpenFail2Retry()
- func (c *Context) SetFailedFunc(failedFunc func(c *Context))
- func (c *Context) SetRetryFunc(retryFunc func(c *Context))
- func (c *Context) SetRetryTimes(times int)
- func (c *Context) SetSucceedFunc(successFunc func(c *Context))
- func (c *Context) Upload(filePath string) func()
- type Csv
- type EndFunc
- type FailedFunc
- type Header
- type Mongo
- type Mysql
- func (m *Mysql) CloseLog()
- func (m *Mysql) Conn() (err error)
- func (m *Mysql) Delete(sql string) error
- func (m *Mysql) Describe(table string) (map[string]string, error)
- func (m *Mysql) Exec(sql string) error
- func (m *Mysql) Insert(table string, fieldData map[string]interface{}) error
- func (m *Mysql) NewTable(table string, fields map[string]string) error
- func (m *Mysql) Select(sql string) ([]map[string]string, error)
- func (m *Mysql) Update(sql string) error
- type Queue
- type Rds
- type ReqTimeOut
- type ReqTimeOutMs
- type ReqUrl
- type RetryFunc
- type RetryTimes
- type SSHConnInfo
- type Set
- type Stack
- type StartFunc
- type StressUrl
- type SucceedFunc
- type TableInfo
- type Task
- type TodoQueue
- type UploadQueue
- type UserAgentType
Constants ¶
const ( UTF8 = Charset("UTF-8") GB18030 = Charset("GB18030") GBK = Charset("GBK") GB2312 = Charset("GB2312") )
Variables ¶
var CookiePool = &cookiePool{}
var MysqlDB = &Mysql{}
开放的mysql对象
var StatusCodeMap map[int]string = map[int]string{
200: "success",
201: "success",
202: "success",
203: "success",
204: "fail",
300: "success",
301: "success",
302: "success",
400: "fail",
401: "retry",
402: "retry",
403: "retry",
404: "fail",
405: "retry",
406: "retry",
407: "retry",
408: "retry",
500: "fail",
501: "fail",
502: "retry",
503: "retry",
504: "retry",
}
StatusCodeMap 状态码处理映射 success 该状态码对应执行成功函数 fail 该状态码对应执行失败函数 retry 该状态码对应需要重试前执行的函数
var (
UrlBad error = errors.New("url is bad.") // 错误的url
)
var UserAgentMap map[int]string = map[int]string{
1: "Mozilla/5.0 (Windows NT 6.2; WOW64; rv:21.0) Gecko/20100101 Firefox/21.0",
2: "Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/27.0.1453.94 Safari/537.36",
3: "Mozilla/5.0 (compatible; WOW64; MSIE 10.0; Windows NT 6.2)",
4: "Opera/9.80 (Windows NT 6.1; WOW64; U; en) Presto/2.10.229 Version/11.62",
5: "Mozilla/5.0 (Windows; U; Windows NT 6.1; en-US) AppleWebKit/533.20.25 (KHTML, like Gecko) Version/5.0.4 Safari/533.20.27",
6: "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:21.0) Gecko/20130331 Firefox/21.0",
7: "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/535.11 (KHTML, like Gecko) Ubuntu/11.10 Chromium/27.0.1453.93 Chrome/27.0.1453.93 Safari/537.36",
8: "Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10_6_6; en-US) AppleWebKit/533.20.25 (KHTML, like Gecko) Version/5.0.4 Safari/533.20.27",
9: "Opera/9.80 (Macintosh; Intel Mac OS X 10.6.8; U; en) Presto/2.9.168 Version/11.52",
10: "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/27.0.1453.93 Safari/537.36",
11: "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.8; rv:21.0) Gecko/20100101 Firefox/21.0",
12: "Mozilla/5.0 (Linux; Android 4.1.1; Nexus 7 Build/JRO03D) AppleWebKit/535.19 (KHTML, like Gecko) Chrome/18.0.1025.166 Safari/535.19",
13: "Mozilla/5.0 (Linux; U; Android 4.0.4; en-gb; GT-I9300 Build/IMM76D) AppleWebKit/534.30 (KHTML, like Gecko) Version/4.0 Mobile Safari/534.30",
14: "Mozilla/5.0 (Linux; U; Android 2.2; en-gb; GT-P1000 Build/FROYO) AppleWebKit/533.1 (KHTML, like Gecko) Version/4.0 Mobile Safari/533.1",
15: "Mozilla/5.0 (Android; Mobile; rv:14.0) Gecko/14.0 Firefox/14.0",
16: "Mozilla/5.0 (Android; Tablet; rv:14.0) Gecko/14.0 Firefox/14.0",
17: "Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/535.19 (KHTML, like Gecko) Chrome/18.0.1025.133 Mobile Safari/535.19",
18: "Mozilla/5.0 (Linux; Android 4.1.2; Nexus 7 Build/JZ054K) AppleWebKit/535.19 (KHTML, like Gecko) Chrome/18.0.1025.166 Safari/535.19",
19: "Mozilla/5.0 (iPhone; CPU iPhone OS 5_0 like Mac OS X) AppleWebKit/534.46 (KHTML, like Gecko) Version/5.1 Mobile/9A334 Safari/7534.48.3",
20: "Mozilla/5.0 (iPad; CPU OS 5_0 like Mac OS X) AppleWebKit/534.46 (KHTML, like Gecko) Version/5.1 Mobile/9A334 Safari/7534.48.3",
21: "Mozilla/5.0 (iPhone; CPU iPhone OS 5_0 like Mac OS X) AppleWebKit/534.46 (KHTML, like Gecko) Version/5.1 Mobile/9A334 Safari/7534.48.3",
22: "Mozilla/5.0 (iPad; CPU OS 5_0 like Mac OS X) AppleWebKit/534.46 (KHTML, like Gecko) Version/5.1 Mobile/9A334 Safari/7534.48.3",
23: "Mozilla/5.0 (iPhone; CPU iPhone OS 6_1_4 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) CriOS/27.0.1453.10 Mobile/10B350 Safari/8536.25",
24: "Mozilla/5.0 (compatible; MSIE 10.0; Windows Phone 8.0; Trident/6.0; IEMobile/10.0; ARM; Touch; NOKIA; Lumia 920)",
25: "Mozilla/5.0 (compatible; MSIE 9.0; Windows Phone OS 7.5; Trident/5.0; IEMobile/9.0; SAMSUNG; SGH-i917)",
26: "User-Agent, UCWEB7.0.2.37/28/999",
27: "User-Agent, NOKIA5700/ UCWEB7.0.2.37/28/999",
28: "User-Agent, Openwave/ UCWEB7.0.2.37/28/999",
29: "User-Agent, Mozilla/4.0 (compatible; MSIE 6.0; ) Opera/UCWEB7.0.2.37/28/999",
30: "Mozilla/5.0 (Windows; U; Windows NT 6.1; ) AppleWebKit/534.12 (KHTML, like Gecko) Maxthon/3.0 Safari/534.12",
31: "Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; WOW64; Trident/5.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; InfoPath.3; .NET4.0C; .NET4.0E)",
32: "Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; WOW64; Trident/5.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; InfoPath.3; .NET4.0C; .NET4.0E; SE 2.X MetaSr 1.0)",
33: "Mozilla/5.0 (Windows; U; Windows NT 6.1; en-US) AppleWebKit/534.3 (KHTML, like Gecko) Chrome/6.0.472.33 Safari/534.3 SE 2.X MetaSr 1.0",
34: "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; WOW64; Trident/5.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; InfoPath.3; .NET4.0C; .NET4.0E)",
35: "Mozilla/5.0 (Windows NT 6.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/13.0.782.41 Safari/535.1 QQBrowser/6.9.11079.201",
}
Functions ¶
func Any2AnyList ¶ added in v0.0.10
func Any2AnyList(data interface{}) []interface{}
interface{} -> []interface{}
func Any2Float64 ¶ added in v0.0.10
func Any2Float64(data interface{}) float64
interface{} -> float64
func Any2Map ¶ added in v0.0.10
func Any2Map(data interface{}) map[string]interface{}
interface{} -> map[string]interface{}
func Any2Strings ¶ added in v0.0.10
func Any2Strings(data interface{}) []string
interface{} -> []string
func Base64UrlDecode ¶ added in v0.1.4
base64 url 解码
func ByteToBinaryString ¶ added in v0.1.4
ByteToBinaryString 字节 -> 二进制字符串
func CleaningStr ¶ added in v0.0.11
CleaningStr 清理字符串前后空白 和回车 换行符号
func ConvertByte2String ¶ added in v0.1.4
编码转换
func FileSizeFormat ¶ added in v0.1.1
字节的单位转换 保留两位小数
func GetAgent ¶ added in v0.0.4
func GetAgent(agentType UserAgentType) string
GetAgent 随机获取那种类型的 user-agent
func IsContainStr ¶ added in v0.1.4
IsContainStr 字符串是否等于items中的某个元素
func MongoConn1 ¶ added in v0.1.4
func MongoConn1()
func NewMysqlDB ¶ added in v0.0.11
给mysql对象进行连接
func ReadCsvFile ¶ added in v0.1.4
csv file -> [][]string 行列
func RegFindAll ¶ added in v0.1.1
func RegHtmlATxt ¶ added in v0.1.4
func RegHtmlHTxt ¶ added in v0.1.4
func RegHtmlHref ¶ added in v0.1.4
func RegHtmlHrefTxt ¶ added in v0.1.4
func RegHtmlInput ¶ added in v0.1.1
func RegHtmlInputTxt ¶ added in v0.1.4
func RegHtmlPTxt ¶ added in v0.1.4
func RegHtmlSpan ¶ added in v0.1.1
func RegHtmlSpanTxt ¶ added in v0.1.4
func RegHtmlSrc ¶ added in v0.1.4
func RegHtmlSrcTxt ¶ added in v0.1.4
func RegHtmlTdTxt ¶ added in v0.1.4
func RegHtmlTitle ¶ added in v0.1.1
func RegHtmlTitleTxt ¶ added in v0.1.4
func RegHtmlTrTxt ¶ added in v0.1.4
func SSHClient ¶ added in v0.1.1
SSHClient 连接ssh addr : 主机地址, 如: 127.0.0.1:22 user : 用户 pass : 密码 返回 ssh连接
func SearchDomain ¶ added in v0.1.4
func SearchDomain(ip string)
func SetStatusCodeRetryEvent ¶ added in v0.1.5
func SetStatusCodeRetryEvent(code int)
将指定状态码设置为执行重试事件
func SetStatusCodeSuccessEvent ¶ added in v0.1.5
func SetStatusCodeSuccessEvent(code int)
将指定状态码设置为执行成功事件
func StartJobGet ¶ added in v0.0.7
StartJobGet 并发执行Get,直到队列任务为空 @jobNumber 并发数, @queue 全局队列, @client 单个并发任务的client, @SucceedFunc 成功方法, @ RetryFunc重试方法, @FailedFunc 失败方法
func StartJobPost ¶ added in v0.0.7
TODO: StartJobPost 开始运行并发Post
func StrDeleteSpace ¶ added in v0.0.11
StrDeleteSpace 删除字符串前后的空格
func Struct2Map ¶ added in v0.1.3
Struct -> map hasValue=true表示字段值不管是否存在都转换成map hasValue=false表示字段为空或者不为0则转换成map
Types ¶
type Context ¶ added in v0.0.7
type Context struct { // Token Token string // client Client *http.Client // Request Req *http.Request // Response Resp *http.Response // Error Err error // Ctx context.Context Ctx context.Context // 最大允许重试次数 MaxTimes RetryTimes // 请求成功了需要处理的事件 SucceedFunc SucceedFunc // 请求失败了需要做的事 FailedFunc FailedFunc // 请求状态码设置了重试,在重试前的事件 RetryFunc RetryFunc // 请求开始前的方法 StartFunc StartFunc // 请求完成后的方法 EndFunc EndFunc // 本次请求的任务 // 用于有步骤的请求和并发执行请求 Task *Task // 请求返回的结果 RespBody []byte // job编号 // 在执行多并发执行抓取任务,每个并发都有一个编号 // 这个编号是递增分配的 JobNumber int // 请求的响应时间 单位ms Ms time.Duration // 是否显示日志, 默认是显示的 IsLog bool // contains filtered or unexported fields }
请求上下文
func Req ¶
Req 初始化请求 @url 请求链接 @maxTimes 重试次数 @sf 请求成功后做的事情, 200等 @ff 请求失败后做的事情, 403等,502等 @vs 可变参数 @vs UserAgentType 设置指定类型 user agent 如 AndroidAgent
func Request ¶ added in v0.0.7
func Request(url, method string, data []byte, contentType string, vs ...interface{}) (*Context, error)
Request 请求
func (*Context) SetFailedFunc ¶ added in v0.0.7
SetFailed 设置错误后的方法
func (*Context) SetRetryFunc ¶ added in v0.0.7
SetRetryFunc 设置重试,在重试前的方法
func (*Context) SetRetryTimes ¶ added in v0.0.7
SetRetryTimes 设置重试次数
func (*Context) SetSucceedFunc ¶ added in v0.0.7
SetSucceedFunc 设置成功后的方法
type Mongo ¶ added in v0.1.4
type Mongo struct { User string Password string Host string Port string Conn *mongo.Client Database *mongo.Database Collection *mongo.Collection MaxPoolSize int TimeOut time.Duration }
func (*Mongo) GetCollection ¶ added in v0.1.4
连接mongodb 的db的集合 @dbname DB名 @name 集合名
type Mysql ¶ added in v0.0.9
type Mysql struct { Host string Port int User string Password string DataBase string MaxOpenConn int MaxIdleConn int DB *sql.DB Log bool }
type Rds ¶ added in v0.1.2
type Rds struct { SSHUser string SSHPassword string SSHAddr string RedisHost string RedisPost string RedisPassword string // redis DB RedisDB int // 单个连接 Conn redis.Conn // 最大闲置数,用于redis连接池 RedisMaxIdle int // 最大连接数 RedisMaxActive int // 单条连接Timeout RedisIdleTimeoutSec int // 连接池 Pool *redis.Pool }
func NewRedisPool ¶ added in v0.1.2
type ReqTimeOut ¶ added in v0.0.7
type ReqTimeOut int
type ReqTimeOutMs ¶ added in v0.0.7
type ReqTimeOutMs int
type SSHConnInfo ¶ added in v0.1.2
func NewSSHInfo ¶ added in v0.1.2
func NewSSHInfo(addr, user, password string) *SSHConnInfo
type Stack ¶ added in v0.1.4
type Stack struct {
// contains filtered or unexported fields
}
======== Stack
type StressUrl ¶ added in v0.0.7
type StressUrl struct { Url string Method string Sum int64 Total int TQueue TodoQueue // 接口传入的json JsonData string // contains filtered or unexported fields }
StressUrl 压力测试一个url
func NewTestUrl ¶ added in v0.0.7
NewTestUrl 实例化一个新的url压测
type TableInfo ¶ added in v0.0.9
type TableInfo struct { Field string Type string Null string Key string Default interface{} Extra string }
表信息
type Task ¶ added in v0.0.5
type Task struct { Url string JsonParam string HeaderMap *http.Header // 上下文传递的数据 Data map[string]interface{} Urls []*ReqUrl // 多步骤使用 Type string // "", "upload", "do" SavePath string SaveDir string FileName string }
任务对象
func CrawlerTask ¶ added in v0.1.3
CrawlerTask
type TodoQueue ¶ added in v0.0.4
type UploadQueue ¶ added in v0.1.1
type UploadQueue struct {
// contains filtered or unexported fields
}
下载队列
func (*UploadQueue) Clear ¶ added in v0.1.1
func (q *UploadQueue) Clear() bool
func (*UploadQueue) IsEmpty ¶ added in v0.1.1
func (q *UploadQueue) IsEmpty() bool
func (*UploadQueue) Print ¶ added in v0.1.1
func (q *UploadQueue) Print()
func (*UploadQueue) Size ¶ added in v0.1.1
func (q *UploadQueue) Size() int
type UserAgentType ¶ added in v0.0.4
type UserAgentType int
const ( PCAgent UserAgentType = iota + 1 WindowsAgent LinuxAgent MacAgent AndroidAgent IosAgent PhoneAgent WindowsPhoneAgent UCAgent )