149 lines
3.4 KiB
Go

package crawler
import (
"context"
"fmt"
"log/slog"
"os"
"strings"
"time"
"github.com/maximotejeda/us_dop_scrapper/helpers"
"github.com/maximotejeda/us_dop_scrapper/internal/application/core/domain"
"github.com/maximotejeda/us_dop_scrapper/internal/ports"
"github.com/playwright-community/playwright-go"
)
type bhd struct {
client ports.DollarPort
}
func NewBHD(client ports.DollarPort) ports.APIPorts {
return &bhd{
client: client,
}
}
// Scrape
// needs a mobile User Agent
func (bh bhd) Scrape(ctx context.Context, page playwright.Page, log *slog.Logger) (insts []*domain.History, err error) {
tout := 120000.00
uri := os.Getenv("BHD")
log = log.With("scrapper", "bhd")
if _, err := page.Goto(uri, playwright.PageGotoOptions{
Timeout: &tout,
WaitUntil: playwright.WaitUntilStateLoad,
}); err != nil {
log.Error("could not get info", "error", err)
return nil, err
}
err = page.WaitForLoadState()
if err != nil {
log.Error("waiting for page state", "err", err)
return nil, err
}
err = page.Locator("html body").WaitFor()
if err != nil {
log.Error("waiting for locating body", "err", err)
return nil, err
}
fieldGroupLocator := page.Locator("div.field_group")
fieldGroupLocator.WaitFor()
fieldGroup, err := fieldGroupLocator.All()
//log.Info("divs", "number", len(fieldGroup))
if err != nil {
log.Error("locating field group", "err", err)
return nil, err
}
inst := &domain.History{
Name: "banco hipotecario dominicano",
Parser: "bhd",
Parsed: time.Now().Unix(),
}
for _, it := range fieldGroup {
n, _ := it.AllTextContents()
if n[0] == "CompramosUS$RD$" || n[0] == "VendemosUS$RD$" {
// we work from here in the second div as first is amount of dollars
div := it.Locator("div")
/*input := div.Locator("div > div input")
val, _ := input.InputValue()
if val == "1"{
input := div.Locator("div > div input")
}*/
places, _ := div.Locator("div").All()
for _, x := range places {
//txt, _ := x.TextContent()
input := x.Locator("div input")
if n, _ := input.Count(); n <= 0 {
//log.Info("no input")
continue
}
val, _ := input.InputValue()
if val == "" || val == "1" {
continue
}
place := strings.ReplaceAll(n[0], "US$RD$", "")
place = strings.ToLower(place)
price := helpers.Normalize(val)
if err != nil {
log.Error("parsing value", "where", place, "err", err)
return nil, err
}
switch place {
case "compramos":
inst.Compra = price
case "vendemos":
inst.Venta = price
}
}
}
}
if inst.Compra == 0 || inst.Venta == 0 {
return nil, fmt.Errorf("bhd: institution not parsed: %v", inst)
}
//log.Info(fmt.Sprintf("%v", inst))
return []*domain.History{inst}, nil
}
func (bh bhd) ExecParser(
ctx context.Context,
browser *playwright.Browser,
log *slog.Logger) (err error) {
t := true
ua := helpers.NewMobileUA()
b := *browser
page, err := b.NewPage(playwright.BrowserNewPageOptions{
UserAgent: &ua,
// IsMobile: &t,
HasTouch: &t,
Viewport: &playwright.Size{
Width: 412,
Height: 915,
},
Screen: &playwright.Size{
Width: 412,
Height: 915,
},
})
if err != nil {
log.Error("creating page", "error", err)
os.Exit(1)
}
ctx, cancel := context.WithTimeout(ctx, 6*time.Minute)
defer page.Close()
defer cancel()
inst, err := bh.Scrape(ctx, page, log)
if err != nil {
return err
}
bh.client.NewHistory(inst[0])
return err
}