mirror of
https://github.com/httprunner/httprunner.git
synced 2026-05-31 21:39:41 +08:00
324 lines
7.7 KiB
Go
324 lines
7.7 KiB
Go
package uixt
|
|
|
|
import (
|
|
"bytes"
|
|
"fmt"
|
|
"image"
|
|
"io/ioutil"
|
|
"mime/multipart"
|
|
"net/http"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/pkg/errors"
|
|
"github.com/rs/zerolog/log"
|
|
|
|
"github.com/httprunner/httprunner/v4/hrp/internal/builtin"
|
|
"github.com/httprunner/httprunner/v4/hrp/internal/code"
|
|
"github.com/httprunner/httprunner/v4/hrp/internal/env"
|
|
"github.com/httprunner/httprunner/v4/hrp/internal/json"
|
|
)
|
|
|
|
// client is the HTTP client used by getOCRResult to call the OCR service.
// Its 10-second timeout limits each request so that an unresponsive
// endpoint cannot block the caller indefinitely.
var client = &http.Client{
	Timeout: 10 * time.Second,
}
|
|
|
|
type OCRResult struct {
|
|
Text string `json:"text"`
|
|
Points []PointF `json:"points"`
|
|
}
|
|
|
|
type ResponseOCR struct {
|
|
Code int `json:"code"`
|
|
Message string `json:"message"`
|
|
OCRResult []OCRResult `json:"ocrResult"`
|
|
}
|
|
|
|
// OCRText is a single recognized text together with the rectangle it
// occupies.
type OCRText struct {
	Text string
	Rect image.Rectangle
}

// OCRTexts is a list of recognized texts.
type OCRTexts []OCRText

// texts returns the Text of every entry, in order. It returns nil when the
// list is empty.
func (t OCRTexts) texts() (texts []string) {
	if len(t) == 0 {
		return nil
	}
	// The final length is known, so allocate once instead of growing.
	texts = make([]string, 0, len(t))
	for _, text := range t {
		texts = append(texts, text.Text)
	}
	return texts
}
|
|
|
|
func (t OCRTexts) FindText(text string, options ...ActionOption) (
|
|
point PointF, err error) {
|
|
|
|
actionOptions := NewActionOptions(options...)
|
|
|
|
var rects []image.Rectangle
|
|
for _, ocrText := range t {
|
|
rect := ocrText.Rect
|
|
|
|
// not contains text
|
|
if !strings.Contains(ocrText.Text, text) {
|
|
continue
|
|
}
|
|
|
|
// check if text in scope
|
|
if rect.Min.X < actionOptions.AbsScope[0] || rect.Min.Y < actionOptions.AbsScope[1] ||
|
|
rect.Max.X > actionOptions.AbsScope[2] || rect.Max.Y > actionOptions.AbsScope[3] {
|
|
// not in scope
|
|
continue
|
|
}
|
|
|
|
rects = append(rects, rect)
|
|
|
|
// contains text while not match exactly
|
|
if ocrText.Text != text {
|
|
continue
|
|
}
|
|
|
|
// match exactly, and not specify index, return the first one
|
|
if actionOptions.Index == 0 {
|
|
return getRectangleCenterPoint(rect), nil
|
|
}
|
|
}
|
|
|
|
if len(rects) == 0 {
|
|
return PointF{}, errors.Wrap(code.OCRTextNotFoundError,
|
|
fmt.Sprintf("text %s not found in %v", text, t.texts()))
|
|
}
|
|
|
|
// get index
|
|
idx := actionOptions.Index
|
|
if idx > 0 {
|
|
// NOTICE: index start from 1
|
|
idx = idx - 1
|
|
} else if idx < 0 {
|
|
idx = len(rects) + idx
|
|
}
|
|
|
|
// index out of range
|
|
if idx >= len(rects) {
|
|
return PointF{}, errors.Wrap(code.OCRTextNotFoundError,
|
|
fmt.Sprintf("text %s found %d, index %d out of range", text, len(rects), idx))
|
|
}
|
|
|
|
return getRectangleCenterPoint(rects[idx]), nil
|
|
}
|
|
|
|
func (t OCRTexts) FindTexts(texts []string, options ...ActionOption) (points []PointF, err error) {
|
|
for _, text := range texts {
|
|
point, err := t.FindText(text, options...)
|
|
if err != nil {
|
|
continue
|
|
}
|
|
points = append(points, point)
|
|
}
|
|
|
|
if len(points) != len(texts) {
|
|
return nil, errors.Wrap(code.OCRTextNotFoundError,
|
|
fmt.Sprintf("texts %s not found in %v", texts, t.texts()))
|
|
}
|
|
return points, nil
|
|
}
|
|
|
|
func newVEDEMOCRService() (*veDEMOCRService, error) {
|
|
if err := checkEnv(); err != nil {
|
|
return nil, err
|
|
}
|
|
return &veDEMOCRService{}, nil
|
|
}
|
|
|
|
// veDEMOCRService implements IOCRService interface
|
|
type veDEMOCRService struct{}
|
|
|
|
func (s *veDEMOCRService) getOCRResult(imageBuf *bytes.Buffer) ([]OCRResult, error) {
|
|
bodyBuf := &bytes.Buffer{}
|
|
bodyWriter := multipart.NewWriter(bodyBuf)
|
|
bodyWriter.WriteField("withDet", "true")
|
|
// bodyWriter.WriteField("timestampOnly", "true")
|
|
|
|
formWriter, err := bodyWriter.CreateFormFile("image", "screenshot.png")
|
|
if err != nil {
|
|
return nil, errors.Wrap(code.OCRRequestError,
|
|
fmt.Sprintf("create form file error: %v", err))
|
|
}
|
|
size, err := formWriter.Write(imageBuf.Bytes())
|
|
if err != nil {
|
|
return nil, errors.Wrap(code.OCRRequestError,
|
|
fmt.Sprintf("write form error: %v", err))
|
|
}
|
|
|
|
err = bodyWriter.Close()
|
|
if err != nil {
|
|
return nil, errors.Wrap(code.OCRRequestError,
|
|
fmt.Sprintf("close body writer error: %v", err))
|
|
}
|
|
|
|
req, err := http.NewRequest("POST", env.VEDEM_OCR_URL, bodyBuf)
|
|
if err != nil {
|
|
return nil, errors.Wrap(code.OCRRequestError,
|
|
fmt.Sprintf("construct request error: %v", err))
|
|
}
|
|
|
|
token := builtin.Sign("auth-v2", env.VEDEM_OCR_AK, env.VEDEM_OCR_SK, bodyBuf.Bytes())
|
|
req.Header.Add("Agw-Auth", token)
|
|
req.Header.Add("Content-Type", bodyWriter.FormDataContentType())
|
|
|
|
var resp *http.Response
|
|
// retry 3 times
|
|
for i := 1; i <= 3; i++ {
|
|
start := time.Now()
|
|
resp, err = client.Do(req)
|
|
elapsed := time.Since(start)
|
|
var logID string
|
|
if resp != nil {
|
|
logID = getLogID(resp.Header)
|
|
}
|
|
if err == nil && resp.StatusCode == http.StatusOK {
|
|
log.Debug().
|
|
Str("X-TT-LOGID", logID).
|
|
Int("image_bytes", size).
|
|
Float64("elapsed_seconds", elapsed.Seconds()).
|
|
Msg("request OCR service success")
|
|
break
|
|
}
|
|
log.Error().Err(err).
|
|
Str("X-TT-LOGID", logID).
|
|
Int("imageBufSize", size).
|
|
Msgf("request OCR service failed, retry %d", i)
|
|
time.Sleep(1 * time.Second)
|
|
}
|
|
if resp == nil {
|
|
return nil, code.OCRServiceConnectionError
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
results, err := ioutil.ReadAll(resp.Body)
|
|
if err != nil {
|
|
return nil, errors.Wrap(code.OCRResponseError,
|
|
fmt.Sprintf("read response body error: %v", err))
|
|
}
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
return nil, errors.Wrap(code.OCRResponseError,
|
|
fmt.Sprintf("unexpected response status code: %d, results: %v",
|
|
resp.StatusCode, string(results)))
|
|
}
|
|
|
|
var ocrResult ResponseOCR
|
|
err = json.Unmarshal(results, &ocrResult)
|
|
if err != nil {
|
|
return nil, errors.Wrap(code.OCRResponseError,
|
|
fmt.Sprintf("json unmarshal response body error: %v", err))
|
|
}
|
|
|
|
return ocrResult.OCRResult, nil
|
|
}
|
|
|
|
func (s *veDEMOCRService) GetTexts(imageBuf *bytes.Buffer) (
|
|
ocrTexts OCRTexts, err error) {
|
|
|
|
ocrResults, err := s.getOCRResult(imageBuf)
|
|
if err != nil {
|
|
log.Error().Err(err).Msg("getOCRResult failed")
|
|
return
|
|
}
|
|
|
|
for _, ocrResult := range ocrResults {
|
|
rect := image.Rectangle{
|
|
// ocrResult.Points 顺序:左上 -> 右上 -> 右下 -> 左下
|
|
Min: image.Point{
|
|
X: int(ocrResult.Points[0].X),
|
|
Y: int(ocrResult.Points[0].Y),
|
|
},
|
|
Max: image.Point{
|
|
X: int(ocrResult.Points[2].X),
|
|
Y: int(ocrResult.Points[2].Y),
|
|
},
|
|
}
|
|
|
|
ocrTexts = append(ocrTexts, OCRText{
|
|
Text: ocrResult.Text,
|
|
Rect: rect,
|
|
})
|
|
}
|
|
|
|
log.Debug().Interface("texts", ocrTexts).Msg("get screen texts by veDEM OCR")
|
|
return
|
|
}
|
|
|
|
func checkEnv() error {
|
|
if env.VEDEM_OCR_URL == "" {
|
|
return errors.Wrap(code.OCREnvMissedError, "VEDEM_OCR_URL missed")
|
|
}
|
|
if env.VEDEM_OCR_AK == "" {
|
|
return errors.Wrap(code.OCREnvMissedError, "VEDEM_OCR_AK missed")
|
|
}
|
|
if env.VEDEM_OCR_SK == "" {
|
|
return errors.Wrap(code.OCREnvMissedError, "VEDEM_OCR_SK missed")
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// getLogID returns the first value of the X-Tt-Logid header, or an empty
// string when the header set is nil or empty, or the header is absent or
// has no values.
func getLogID(header http.Header) string {
	// Header.Get handles a nil map, a missing key and an empty value list,
	// so no manual map lookup is needed.
	return header.Get("X-Tt-Logid")
}
|
|
|
|
type IOCRService interface {
|
|
GetTexts(imageBuf *bytes.Buffer) (texts OCRTexts, err error)
|
|
}
|
|
|
|
func (dExt *DriverExt) GetScreenTextsByOCR() (texts OCRTexts, err error) {
|
|
var bufSource *bytes.Buffer
|
|
var imagePath string
|
|
if bufSource, imagePath, err = dExt.TakeScreenShot(
|
|
builtin.GenNameWithTimestamp("%d_ocr")); err != nil {
|
|
return
|
|
}
|
|
|
|
ocrTexts, err := dExt.OCRService.GetTexts(bufSource)
|
|
if err != nil {
|
|
log.Error().Err(err).Msg("GetScreenTextsByOCR failed")
|
|
return
|
|
}
|
|
|
|
o, _ := json.Marshal(ocrTexts)
|
|
dExt.cacheStepData.OcrResults[imagePath] = string(o)
|
|
return ocrTexts, nil
|
|
}
|
|
|
|
func (dExt *DriverExt) FindScreenTextByOCR(text string, options ...ActionOption) (point PointF, err error) {
|
|
ocrTexts, err := dExt.GetScreenTextsByOCR()
|
|
if err != nil {
|
|
return
|
|
}
|
|
point, err = ocrTexts.FindText(text, options...)
|
|
if err != nil {
|
|
log.Warn().Msgf("FindText failed: %s", err.Error())
|
|
return
|
|
}
|
|
|
|
log.Info().Str("text", text).
|
|
Interface("point", point).Msgf("FindScreenTextByOCR success")
|
|
return
|
|
}
|
|
|
|
func getRectangleCenterPoint(rect image.Rectangle) (point PointF) {
|
|
x, y := float64(rect.Min.X), float64(rect.Min.Y)
|
|
width, height := float64(rect.Dx()), float64(rect.Dy())
|
|
point = PointF{
|
|
X: x + width*0.5,
|
|
Y: y + height*0.5,
|
|
}
|
|
return point
|
|
}
|