bazaar/pkg/shop/casadellibro/casadellibro.go

103 lines
2.5 KiB
Go

package casadellibro
import (
"fmt"
"log"
"net/url"
"regexp"
"strconv"
"strings"
"time"
"github.com/PuerkitoBio/goquery"
"github.com/fmartingr/bazaar/pkg/models"
)
const (
releaseDatePropertyName = "Fecha de lanzamiento"
releaseDatePropertyValueFormat = "02/01/2006"
)
var Domains = []string{"www.casadellibro.com"}
type CasaDelLibroShop struct {
models.ShopOptions
domains []string
priceRegexp *regexp.Regexp
}
func (s *CasaDelLibroShop) Get(u *url.URL) (*models.Product, error) {
body, err := s.ShopOptions.Client.Get(u)
if err != nil {
return nil, fmt.Errorf("error during request: %s", err)
}
doc, err := goquery.NewDocumentFromReader(body)
if err != nil {
return nil, fmt.Errorf("error parsing body: %s", err)
}
product := models.Product{
URL: u.String(),
}
// Price
seoJSON := doc.Find(`[vmid="seo"][data-body="true"]`).Text()
priceSubmatch := s.priceRegexp.FindSubmatch([]byte(seoJSON))
if len(priceSubmatch) != 2 {
return nil, fmt.Errorf("error parsing price, expected one match, found %d", len(priceSubmatch)/2)
}
priceNum, _ := strconv.ParseFloat(strings.ReplaceAll(string(priceSubmatch[1]), ",", "."), 64)
product.PriceText = string(priceSubmatch[1])
product.Price = priceNum
// Release date (& meta)
rightBlocks := doc.Find(".border-left.col-md-4.col-12")
if rightBlocks.Length() >= 2 {
rightBlocks.Eq(1).Find(".row").Each(func(i int, s *goquery.Selection) {
cols := s.Find(".col")
propertyNamme := strings.Trim(cols.First().Text(), ":")
if propertyNamme == releaseDatePropertyName {
propertyValue := cols.Eq(1).Text()
releaseDate, err := time.Parse(releaseDatePropertyValueFormat, propertyValue)
if err != nil {
log.Printf("error parsing release date: %s", err)
return
}
product.ReleaseDate = &releaseDate
}
})
}
doc.Find(`main.v-main`).Each(func(i int, s *goquery.Selection) {
imageURL, _ := s.Find(".product-image").Attr("src")
product.Name = strings.TrimSpace(s.Find("h1.text-h5.mb-4").Text())
product.InStock = s.Find("p.stock").HasClass("in-stock")
product.ImageURL = imageURL
product.Description = strings.TrimSpace(s.Find(".resume-body").Text())
})
return &product, nil
}
func NewCasaDelLibroShopFactory() models.ShopFactory {
return func(shopOptions models.ShopOptions) models.Shop {
r, err := regexp.Compile(`Price\"\:\"([\d+\.]+)`)
if err != nil {
log.Println(err)
}
shop := CasaDelLibroShop{
ShopOptions: shopOptions,
domains: Domains,
priceRegexp: r,
}
return &shop
}
}