spray/internal/pool.go

324 lines
7.6 KiB
Go
Raw Normal View History

2022-09-08 15:57:17 +08:00
package internal
import (
"context"
"github.com/chainreactors/logs"
"github.com/chainreactors/spray/pkg"
"github.com/chainreactors/spray/pkg/ihttp"
2022-09-15 19:27:07 +08:00
"github.com/chainreactors/words"
2022-09-08 15:57:17 +08:00
"github.com/panjf2000/ants/v2"
"github.com/valyala/fasthttp"
"net/http"
2022-09-08 15:57:17 +08:00
"sync"
2022-09-15 19:27:07 +08:00
"time"
2022-09-08 15:57:17 +08:00
)
// Response filters consulted by (*Pool).PreCompare. They are declared here
// without a value; Init installs CheckRedirect when the baseline redirects,
// and the others are expected to be assigned outside this block.
var (
	// CheckStatusCode receives the response status code; a false result
	// makes PreCompare reject the response with ErrBadStatus.
	CheckStatusCode func(int) bool

	// CheckRedirect receives the response's Location header; a false result
	// makes PreCompare reject the response with ErrRedirect.
	CheckRedirect func(string) bool

	// CheckWaf is the hook for WAF detection; a false result makes
	// PreCompare reject the response with ErrWaf.
	CheckWaf func([]byte) bool
)

// breakThreshold is the failedCount value above which the periodic check
// gives up and cancels the task.
var breakThreshold = 20
2022-09-23 01:47:24 +08:00
2022-09-15 19:27:07 +08:00
func NewPool(ctx context.Context, config *pkg.Config, outputCh chan *baseline) (*Pool, error) {
2022-09-19 14:42:29 +08:00
pctx, cancel := context.WithCancel(ctx)
2022-09-08 15:57:17 +08:00
pool := &Pool{
Config: config,
ctx: pctx,
2022-09-23 01:47:24 +08:00
cancel: cancel,
client: ihttp.NewClient(config.Thread, 2, config.ClientType),
worder: words.NewWorder(config.Wordlist),
outputCh: outputCh,
tempCh: make(chan *baseline, config.Thread),
2022-09-23 11:20:41 +08:00
wg: sync.WaitGroup{},
initwg: sync.WaitGroup{},
checkPeriod: 100,
errPeriod: 10,
reqCount: 1,
failedCount: 1,
2022-09-08 15:57:17 +08:00
}
switch config.Mod {
case pkg.PathSpray:
pool.genReq = func(s string) (*ihttp.Request, error) {
2022-09-23 11:20:41 +08:00
return pool.buildPathRequest(s)
2022-09-08 15:57:17 +08:00
}
pool.check = func() {
pool.wg.Add(1)
_ = pool.pool.Invoke(newUnit(pkg.RandPath(), CheckSource))
if pool.failedCount > breakThreshold {
// 当报错次数超过上限是, 结束任务
pool.Recover()
pool.cancel()
}
}
2022-09-08 15:57:17 +08:00
case pkg.HostSpray:
pool.genReq = func(s string) (*ihttp.Request, error) {
2022-09-23 11:20:41 +08:00
return pool.buildHostRequest(s)
2022-09-08 15:57:17 +08:00
}
pool.check = func() {
pool.wg.Add(1)
_ = pool.pool.Invoke(newUnit(pkg.RandHost(), CheckSource))
if pool.failedCount > breakThreshold {
// 当报错次数超过上限是, 结束任务
pool.Recover()
pool.cancel()
}
}
2022-09-08 15:57:17 +08:00
}
p, _ := ants.NewPoolWithFunc(config.Thread, func(i interface{}) {
unit := i.(*Unit)
req, err := pool.genReq(unit.path)
if err != nil {
logs.Log.Error(err.Error())
return
}
var bl *baseline
2022-09-23 11:20:41 +08:00
resp, reqerr := pool.client.Do(pctx, req)
if pool.ClientType == ihttp.FAST {
defer fasthttp.ReleaseResponse(resp.FastResponse)
defer fasthttp.ReleaseRequest(req.FastRequest)
}
2022-09-23 11:20:41 +08:00
if reqerr != nil && reqerr != fasthttp.ErrBodyTooLarge {
2022-10-19 16:38:23 +08:00
pool.failedCount++
bl = &baseline{Url: pool.BaseURL + unit.path, Err: reqerr}
pool.failedBaselines = append(pool.failedBaselines, bl)
2022-09-08 15:57:17 +08:00
} else {
2022-11-09 16:05:17 +08:00
if err = pool.PreCompare(resp); err == nil || unit.source == CheckSource || unit.source == InitSource {
2022-09-08 15:57:17 +08:00
// 通过预对比跳过一些无用数据, 减少性能消耗
bl = NewBaseline(req.URI(), req.Host(), resp)
2022-09-08 15:57:17 +08:00
} else {
bl = NewInvalidBaseline(req.URI(), req.Host(), resp)
2022-09-08 15:57:17 +08:00
}
}
switch unit.source {
2022-10-27 23:40:15 +08:00
case InitSource:
pool.base = bl
pool.initwg.Done()
logs.Log.Important("[baseline] " + bl.String())
2022-10-27 23:40:15 +08:00
return
2022-09-20 18:09:06 +08:00
case CheckSource:
2022-10-27 23:40:15 +08:00
if bl.Err != nil {
logs.Log.Warnf("[check.error] maybe ip had banned by waf, break (%d/%d), error: %s", pool.failedCount, breakThreshold, bl.Err.Error())
pool.failedBaselines = append(pool.failedBaselines, bl)
} else if i := pool.base.Compare(bl); i < 1 {
if i == 0 {
logs.Log.Debug("[check.fuzzy] maybe trigger risk control, " + bl.String())
} else {
logs.Log.Warn("[check.failed] maybe trigger risk control, " + bl.String())
}
pool.failedBaselines = append(pool.failedBaselines, bl)
} else {
pool.ResetFailed() // 如果后续访问正常, 重置错误次数
logs.Log.Debug("[check.pass] " + bl.String())
}
2022-09-08 15:57:17 +08:00
case WordSource:
// 异步进行性能消耗较大的深度对比
pool.tempCh <- bl
2022-09-23 11:20:41 +08:00
if pool.reqCount%pool.checkPeriod == 0 {
go pool.check()
2022-11-09 17:28:51 +08:00
} else if pool.failedCount%pool.errPeriod == 0 {
2022-09-23 11:20:41 +08:00
go pool.check()
}
pool.bar.Done()
2022-09-08 15:57:17 +08:00
}
2022-10-19 16:38:23 +08:00
2022-09-08 15:57:17 +08:00
pool.wg.Done()
})
pool.pool = p
2022-09-26 17:19:08 +08:00
go pool.comparing()
2022-09-08 15:57:17 +08:00
return pool, nil
}
type Pool struct {
*pkg.Config
client *ihttp.Client
2022-09-08 15:57:17 +08:00
pool *ants.PoolWithFunc
bar *pkg.Bar
2022-09-19 14:42:29 +08:00
ctx context.Context
2022-09-23 01:47:24 +08:00
cancel context.CancelFunc
2022-09-08 15:57:17 +08:00
//baseReq *http.Request
base *baseline
outputCh chan *baseline // 输出的chan, 全局统一
tempCh chan *baseline // 待处理的baseline
reqCount int
failedCount int
checkPeriod int
errPeriod int
failedBaselines []*baseline
analyzeDone bool
genReq func(s string) (*ihttp.Request, error)
check func()
worder *words.Worder
wg sync.WaitGroup
initwg sync.WaitGroup // 初始化用, 之后改成锁
2022-09-08 15:57:17 +08:00
}
func (p *Pool) Init() error {
2022-09-23 11:20:41 +08:00
p.initwg.Add(1)
2022-10-28 00:46:54 +08:00
p.pool.Invoke(newUnit(pkg.RandPath(), InitSource))
2022-09-23 11:20:41 +08:00
p.initwg.Wait()
2022-09-08 15:57:17 +08:00
// todo 分析baseline
// 检测基本访问能力
2022-10-27 23:40:15 +08:00
if p.base.Err != nil {
2022-09-23 01:47:24 +08:00
p.cancel()
2022-09-23 11:20:41 +08:00
return p.base.Err
2022-09-08 15:57:17 +08:00
}
2022-09-23 11:20:41 +08:00
p.base.Collect()
if p.base.RedirectURL != "" {
CheckRedirect = func(redirectURL string) bool {
2022-09-23 11:20:41 +08:00
if redirectURL == p.base.RedirectURL {
2022-09-08 15:57:17 +08:00
// 相同的RedirectURL将被认为是无效数据
return false
} else {
// path为3xx, 且与baseline中的RedirectURL不同时, 为有效数据
return true
2022-09-08 15:57:17 +08:00
}
}
}
return nil
}
2022-11-10 15:48:38 +08:00
func (p *Pool) Run(ctx context.Context, offset, limit int) {
maxreq := offset + limit
2022-09-15 19:27:07 +08:00
Loop:
for {
select {
case u, ok := <-p.worder.C:
if !ok {
break Loop
}
2022-11-10 15:48:38 +08:00
if p.reqCount < offset {
p.reqCount++
continue
}
if p.reqCount > maxreq {
break Loop
}
for _, fn := range p.Fns {
u = fn(u)
}
2022-11-10 04:48:07 +08:00
if u == "" {
continue
}
2022-11-10 15:48:38 +08:00
p.reqCount++
p.wg.Add(1)
_ = p.pool.Invoke(newUnit(u, WordSource))
2022-09-15 19:27:07 +08:00
case <-ctx.Done():
break Loop
2022-09-19 14:42:29 +08:00
case <-p.ctx.Done():
break Loop
2022-09-15 19:27:07 +08:00
}
2022-09-08 15:57:17 +08:00
}
2022-09-23 11:20:41 +08:00
p.Close()
2022-09-08 15:57:17 +08:00
}
func (p *Pool) PreCompare(resp *ihttp.Response) error {
if !CheckStatusCode(resp.StatusCode()) {
2022-09-15 19:27:07 +08:00
return ErrBadStatus
2022-09-08 15:57:17 +08:00
}
if CheckRedirect != nil && !CheckRedirect(string(resp.GetHeader("Location"))) {
2022-09-15 19:27:07 +08:00
return ErrRedirect
2022-09-08 15:57:17 +08:00
}
2022-09-26 17:19:08 +08:00
if CheckWaf != nil && !CheckWaf(nil) {
// todo check waf
return ErrWaf
}
2022-09-08 15:57:17 +08:00
2022-09-15 19:27:07 +08:00
return nil
2022-09-08 15:57:17 +08:00
}
2022-09-26 17:19:08 +08:00
func (p *Pool) comparing() {
for bl := range p.tempCh {
2022-11-09 16:05:17 +08:00
if p.base.Compare(bl) == 1 {
// 如果是同一个包则设置为无效包
bl.IsValid = false
p.outputCh <- bl
continue
}
if !bl.IsValid {
// 已经时被precompare过滤的项目, 跳过collect, 直接认为是无效数据
p.outputCh <- bl
continue
}
bl.Collect()
2022-09-23 11:20:41 +08:00
if p.EnableFuzzy && p.base.FuzzyEqual(bl) {
bl.IsValid = false
p.outputCh <- bl
continue
}
p.outputCh <- bl
}
2022-09-23 11:20:41 +08:00
p.analyzeDone = true
}
2022-09-26 17:19:08 +08:00
// ResetFailed clears the failure bookkeeping after a check succeeded.
//
// The counter goes back to 1, the value NewPool starts it with, rather than
// to 0: the worker schedules a check whenever failedCount%errPeriod == 0,
// and a zero counter would satisfy that on every single request.
func (p *Pool) ResetFailed() {
	p.failedCount = 1
	p.failedBaselines = nil
}
// Recover logs that the failure threshold was exceeded, together with the
// current request counter as the breakpoint, and then logs every collected
// failed baseline.
func (p *Pool) Recover() {
	logs.Log.Errorf("failed request exceeds the threshold , task will exit. Breakpoint %d", p.reqCount)
	logs.Log.Error("collecting failed check")

	failed := p.failedBaselines
	for idx := 0; idx < len(failed); idx++ {
		logs.Log.Errorf("[failed.%d] %s", idx, failed[idx].String())
	}
}
2022-09-23 11:20:41 +08:00
// Close waits for all in-flight units, closes the progress bar and tempCh,
// and then polls every 100ms until comparing reports, through analyzeDone,
// that it has finished.
func (p *Pool) Close() {
	const pollInterval = 100 * time.Millisecond

	p.wg.Wait()
	p.bar.Close()
	close(p.tempCh)

	for {
		if p.analyzeDone {
			return
		}
		time.Sleep(pollInterval)
	}
}
2022-09-26 17:19:08 +08:00
func (p *Pool) buildPathRequest(path string) (*ihttp.Request, error) {
if p.Config.ClientType == ihttp.FAST {
req := fasthttp.AcquireRequest()
req.SetRequestURI(p.BaseURL + path)
2022-10-27 23:40:15 +08:00
return &ihttp.Request{FastRequest: req, ClientType: p.ClientType}, nil
} else {
req, err := http.NewRequest("GET", p.BaseURL+path, nil)
2022-10-27 23:40:15 +08:00
return &ihttp.Request{StandardRequest: req, ClientType: p.ClientType}, err
}
}
func (p *Pool) buildHostRequest(host string) (*ihttp.Request, error) {
if p.Config.ClientType == ihttp.FAST {
req := fasthttp.AcquireRequest()
req.SetRequestURI(p.BaseURL)
req.SetHost(host)
2022-10-27 23:40:15 +08:00
return &ihttp.Request{FastRequest: req, ClientType: p.ClientType}, nil
} else {
req, err := http.NewRequest("GET", p.BaseURL, nil)
req.Host = host
2022-10-27 23:40:15 +08:00
return &ihttp.Request{StandardRequest: req, ClientType: p.ClientType}, err
}
}