96 lines
2.6 KiB
JavaScript
96 lines
2.6 KiB
JavaScript
import browser from "../system/browser.js";
|
|
import { extractModelId, extractNumber } from "../system/ultils.js";
|
|
import { ScrapModel } from "./scrap-model.js";
|
|
|
|
export class LawsonsScrapModel extends ScrapModel {
|
|
action = async () => {
|
|
const urlsData = this.extractUrls();
|
|
|
|
for (let item of urlsData) {
|
|
await this.page.goto(item.url);
|
|
|
|
const data = await this.getItemsInHtml(item);
|
|
|
|
const results = this.filterItemByKeyword(item.keyword, data);
|
|
|
|
this.results[item.keyword] = results;
|
|
|
|
console.log({ results: this.results });
|
|
}
|
|
};
|
|
|
|
async getPrice(url) {
|
|
const newPage = await browser.newPage();
|
|
|
|
await newPage.setUserAgent(
|
|
"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/115.0.0.0 Safari/537.36"
|
|
);
|
|
|
|
try {
|
|
await newPage.goto(`${this.web_bid.origin_url}${url}`, {
|
|
waitUntil: "domcontentloaded", // hoặc "networkidle2" nếu cần đợi AJAX
|
|
});
|
|
|
|
await newPage.waitForSelector("#bidPrefix > span.font-weight-bold", {
|
|
timeout: 10000,
|
|
});
|
|
|
|
const priceText = await newPage
|
|
.$eval("#bidPrefix > span.font-weight-bold", (el) =>
|
|
el.textContent.trim()
|
|
)
|
|
.catch(() => null);
|
|
|
|
return extractNumber(priceText) || 0;
|
|
} catch (error) {
|
|
console.error(`Error getting price for ${url}:`, error);
|
|
return 0;
|
|
} finally {
|
|
await newPage.close();
|
|
}
|
|
}
|
|
|
|
getItemsInHtml = async (data) => {
|
|
await this.page.waitForSelector(".row.row-spacing > .lot-container", {
|
|
timeout: 10000,
|
|
});
|
|
|
|
const elements = await this.page.$$(".row.row-spacing > .lot-container");
|
|
const results = [];
|
|
|
|
for (const el of elements) {
|
|
const url = await el
|
|
.$eval("aside.search-lot--content.text-left > a", (el) =>
|
|
el.getAttribute("href")
|
|
)
|
|
.catch(() => null);
|
|
|
|
const image_url = await el
|
|
.$eval("figure.text-center.imgContainer img", (img) =>
|
|
img.getAttribute("src")
|
|
)
|
|
.catch(() => null);
|
|
|
|
const name = await el
|
|
.$eval(".font-weight-normal.text-grey.title", (el) =>
|
|
el.textContent.trim()
|
|
)
|
|
.catch(() => null);
|
|
|
|
const current_price = await this.getPrice(url);
|
|
|
|
results.push({
|
|
url: `${this.web_bid.origin_url}${url}`,
|
|
image_url,
|
|
name,
|
|
keyword: data.keyword,
|
|
model: extractModelId(`${this.web_bid.origin_url}${url}`),
|
|
current_price: current_price,
|
|
scrap_config_id: this.scrap_config_id,
|
|
});
|
|
}
|
|
|
|
return results;
|
|
};
|
|
}
|