task-processor/internal/parsers/mandarake/service.go

175 lines
4.9 KiB
Go
Raw Normal View History

2025-12-26 16:19:09 +03:00
package mandarake
import (
"context"
"github.com/chromedp/chromedp"
log "github.com/sirupsen/logrus"
"regexp"
"slices"
"strconv"
"strings"
"task-processor/internal/shared"
)
func (s *Parser) getPrice(ctx context.Context, task shared.Task) (int32, error) {
var (
singlePrice string
rangedPrice string
prices []int32
)
if err := chromedp.Run(ctx,
chromedp.Navigate(task.Link),
chromedp.WaitReady("body"),
2025-12-26 16:56:40 +03:00
chromedp.Text(`div.price`, &singlePrice, chromedp.ByQuery, chromedp.AtLeast(0)),
chromedp.Text(`div.price_range`, &rangedPrice, chromedp.ByQuery, chromedp.AtLeast(0)),
2025-12-26 16:19:09 +03:00
); err != nil {
log.WithError(err).Error(logHeader + logGetPrice + "failed to get single price tag")
return zeroPrice, err
}
singlePrice = strings.TrimSpace(singlePrice)
prices = append(prices, s.getSinglePriceWithTax(singlePrice))
rangedPrice = strings.TrimSpace(rangedPrice)
if rangedPrice != "" {
prices = append(prices, s.getMinimalPriceFromRangeWithTax(rangedPrice))
}
minimal := slices.Min(prices)
log.Infof(logHeader+"uuid: %s, price: %d", task.MerchUuid, minimal)
2026-01-04 15:19:21 +03:00
return minimal, nil
}
2026-01-05 17:51:02 +03:00
func (s *Parser) getMinimalPrice(task shared.Task) int32 {
2026-01-04 15:19:21 +03:00
ctx := context.Background()
allocCtx, allocCancel := chromedp.NewRemoteAllocator(ctx, s.externalBrowser)
defer allocCancel()
sessionCtx, sessionCancel := chromedp.NewContext(allocCtx, chromedp.WithLogf(log.Printf))
defer sessionCancel()
var (
singlePrice string
rangedPrice string
)
if err := chromedp.Run(sessionCtx,
chromedp.Navigate(task.Link),
chromedp.WaitVisible("body", chromedp.ByQuery),
chromedp.Evaluate(`(document.querySelector('div.price')?.innerText || '').trim()`, &singlePrice),
chromedp.Evaluate(`(document.querySelector('div.price_range')?.innerText || '').trim()`, &rangedPrice),
); err != nil {
2026-01-05 17:51:02 +03:00
return zeroPrice
2026-01-04 15:19:21 +03:00
}
2026-01-05 17:51:02 +03:00
minimal := s.processPrices(singlePrice, rangedPrice)
log.Infof(logHeader+"uuid: %s, price: %d", task.MerchUuid, minimal)
return minimal
}
func (s *Parser) processPrices(singlePrice, rangedPrice string) int32 {
var prices []int32
//in case of any errors or no price return zeroPrice const
//if success add to prices slice
2026-01-04 15:19:21 +03:00
if singlePrice != "" {
singlePrice = strings.TrimSpace(singlePrice)
2026-01-05 17:51:02 +03:00
counted, err := s.parseSinglePrice(singlePrice)
if err != nil {
log.WithFields(log.Fields{
"err": err.Error(),
"singlePrice": singlePrice,
}).Error(logHeader + logGetPrice + "failed to parse single price, returning zero price")
return zeroPrice
}
prices = append(prices, counted)
2026-01-04 15:19:21 +03:00
} else {
2026-01-05 17:51:02 +03:00
log.Warn(logHeader + logGetPrice + "single price not found")
return zeroPrice
2026-01-04 15:19:21 +03:00
}
2026-01-05 17:51:02 +03:00
//optional, adds price only if no errors and has non zero value
2026-01-04 15:19:21 +03:00
if rangedPrice != "" {
rangedPrice = strings.TrimSpace(rangedPrice)
2026-01-05 17:51:02 +03:00
counted, err := s.parseRangedPrice(rangedPrice)
if err != nil {
log.WithFields(log.Fields{
"err": err.Error(),
"rangedPrice": rangedPrice,
}).Error(logHeader + logGetPrice + "failed to parse ranged price")
} else {
if counted > 0 {
prices = append(prices, counted)
}
}
2026-01-04 15:19:21 +03:00
}
2026-01-05 17:51:02 +03:00
return slices.Min(prices)
2025-12-26 16:19:09 +03:00
}
// singlePriceWithTaxRe captures the run of digits and thousands separators
// that directly precedes the yen sign, allowing whitespace in between.
var singlePriceWithTaxRe = regexp.MustCompile(`([\d,]+)\s*円`)

// getSinglePriceWithTax extracts the first yen amount from rawPrice.
//
// Thousands separators are accepted and stripped, so "1,500円" yields 1500
// rather than the trailing "500". zeroPrice is returned, and an error is
// logged, when no amount is found or when it does not fit into an int32.
//
// NOTE(review): despite the name, no tax multiplier is applied here, unlike
// getMinimalPriceFromRangeWithTax — confirm whether the page text already
// includes tax.
func (s *Parser) getSinglePriceWithTax(rawPrice string) int32 {
	matches := singlePriceWithTaxRe.FindStringSubmatch(rawPrice)
	if len(matches) < 2 {
		log.Error("Mandarake | Single price not found, returning zero price")
		return zeroPrice
	}

	digits := strings.ReplaceAll(matches[1], ",", "")

	// Parsing with a 32-bit size rejects values that would otherwise wrap
	// around in the int32 conversion below.
	price, err := strconv.ParseInt(digits, 10, 32)
	if err != nil {
		log.Error("Mandarake | Failed to convert single price, returning zero price")
		return zeroPrice
	}
	return int32(price)
}
// getMinimalPriceFromRangeWithTax pulls the amount that follows the "他"
// marker and precedes the yen sign out of priceRange, strips its thousands
// separators and multiplies it by taxMultiplier.
//
// zeroPrice is returned, and an error is logged, when the pattern is not found
// or the captured digits cannot be converted to an integer.
func (s *Parser) getMinimalPriceFromRangeWithTax(priceRange string) int32 {
	found := regexp.MustCompile(`他([\d,]+)円`).FindStringSubmatch(priceRange)
	if len(found) < 2 {
		log.Error("Price not found in range, returning zero price")
		return zeroPrice
	}

	base, convErr := strconv.Atoi(strings.ReplaceAll(found[1], ",", ""))
	if convErr != nil {
		log.Error("Failed to convert minimal price in range, returning zero price")
		return zeroPrice
	}

	// The product is truncated toward zero by the integer conversion.
	withTax := float64(base) * taxMultiplier
	return int32(withTax)
}
2026-01-05 17:51:02 +03:00
// parseSinglePrice converts a single price text such as "1,500円" into the
// value countTax produces for it.
//
// Only the part before the first yen sign is used. Thousands separators are
// removed and surrounding whitespace is trimmed, so "1,500 円" parses as well.
// The error from countTax is returned unchanged when the remaining text is not
// a valid integer.
func (s *Parser) parseSinglePrice(rawPrice string) (int32, error) {
	// When rawPrice has no yen sign, Cut hands back the whole string.
	amount, _, _ := strings.Cut(rawPrice, "円")
	amount = strings.TrimSpace(strings.ReplaceAll(amount, ",", ""))
	return s.countTax(amount)
}
// parseRangedPrice converts a ranged price text into the value countTax
// produces for it.
//
// Commas are removed, everything from the first yen sign onward is discarded,
// and the "(" and "他" characters are stripped from what remains before it is
// handed to countTax. A conversion failure is returned together with
// zeroPrice.
func (s *Parser) parseRangedPrice(rawPrice string) (int32, error) {
	withoutCommas := strings.ReplaceAll(rawPrice, ",", "")

	// Keep only the text in front of the first yen sign.
	head, _, _ := strings.Cut(withoutCommas, "円")
	digits := strings.ReplaceAll(strings.ReplaceAll(head, "(", ""), "他", "")

	taxed, err := s.countTax(digits)
	if err != nil {
		return zeroPrice, err
	}
	return taxed, nil
}
// countTax parses priceStr as a base-10 integer and returns it multiplied by
// taxMultiplier, truncated to int32.
//
// When priceStr is not a valid integer, zeroPrice and the strconv error are
// returned.
func (s *Parser) countTax(priceStr string) (int32, error) {
	base, convErr := strconv.Atoi(priceStr)
	if convErr == nil {
		taxed := float64(base) * taxMultiplier
		return int32(taxed), nil
	}
	return zeroPrice, convErr
}