mirror of
https://github.com/hempyhemp/hh-auto-reply.git
synced 2026-06-09 02:15:34 +00:00
init
This commit is contained in:
307
src/hh/scraper.ts
Normal file
307
src/hh/scraper.ts
Normal file
@@ -0,0 +1,307 @@
|
||||
import type { Message } from 'node-telegram-bot-api'
|
||||
import bot from '@bot'
|
||||
import prisma from '@prisma'
|
||||
import { type Browser, chromium, type Page } from 'playwright'
|
||||
import { askGPT } from '../openai'
|
||||
|
||||
// const SESSION_FILE = path.resolve('./session.json')
|
||||
|
||||
interface ApplyOptions {
|
||||
query: string
|
||||
area?: number
|
||||
maxApplies?: number
|
||||
}
|
||||
|
||||
interface ApplyResult {
|
||||
applied: string[]
|
||||
skipped: string[]
|
||||
errors: string[]
|
||||
error?: string
|
||||
}
|
||||
|
||||
function randomDelay(min = 300, max = 2000) {
|
||||
return min + Math.random() * (max - min)
|
||||
}
|
||||
|
||||
async function humanDelay(min = 300, max = 2000) {
|
||||
return new Promise(r => setTimeout(r, randomDelay(min, max)))
|
||||
}
|
||||
|
||||
async function randomScroll(page: Page) {
|
||||
await page.mouse.move(100 + Math.random() * 500, 200 + Math.random() * 500)
|
||||
await page.mouse.wheel(0, 300 + Math.random() * 1000)
|
||||
}
|
||||
|
||||
async function getBrowser(): Promise<Browser> {
|
||||
return chromium.launch({ headless: true })
|
||||
}
|
||||
|
||||
async function loadSession(page: Page, telegramId: bigint | number): Promise<boolean> {
|
||||
const user = await prisma.user.findUnique({
|
||||
where: { telegramId },
|
||||
})
|
||||
|
||||
const session = user?.session
|
||||
|
||||
if (!session)
|
||||
return false
|
||||
|
||||
const cookies = JSON.parse(session)
|
||||
await page.context().addCookies(cookies)
|
||||
return true
|
||||
}
|
||||
|
||||
function waitForOtp(chatId: number): Promise<string> {
|
||||
return new Promise((resolve) => {
|
||||
const handler = (msg: Message) => {
|
||||
if (msg.chat.id !== chatId)
|
||||
return
|
||||
|
||||
if (!msg.text)
|
||||
return
|
||||
|
||||
bot.removeListener('message', handler)
|
||||
resolve(msg.text)
|
||||
}
|
||||
|
||||
bot.on('message', handler)
|
||||
})
|
||||
}
|
||||
|
||||
export async function login(
|
||||
email: string,
|
||||
chatId: number,
|
||||
): Promise<void> {
|
||||
const browser = await getBrowser()
|
||||
await bot.sendMessage(chatId, `Browser is connected: ${browser.isConnected()}`)
|
||||
if (!browser.version())
|
||||
return
|
||||
await bot.sendMessage(chatId, `Browser version: ${browser.version()}`)
|
||||
|
||||
const context = await browser.newContext()
|
||||
const page = await context.newPage()
|
||||
|
||||
await page.goto('https://hh.ru/account/login', { waitUntil: 'networkidle' })
|
||||
|
||||
await bot.sendMessage(chatId, `page: ${page.url()}`)
|
||||
|
||||
await page.click('[data-qa="submit-button"]')
|
||||
|
||||
await page.waitForTimeout(randomDelay())
|
||||
|
||||
await bot.sendMessage(chatId, `Клик по "Войти"`)
|
||||
|
||||
await page.click('label:has([data-qa="credential-type-EMAIL"])')
|
||||
|
||||
await page.waitForTimeout(randomDelay())
|
||||
|
||||
await bot.sendMessage(chatId, `Клик по "Email"`)
|
||||
|
||||
await page.waitForTimeout(randomDelay())
|
||||
|
||||
await page.fill('[data-qa="applicant-login-input-email"]', email)
|
||||
|
||||
await page.waitForTimeout(randomDelay())
|
||||
|
||||
await bot.sendMessage(chatId, `Ввод "Email"`)
|
||||
|
||||
await page.click('[data-qa="submit-button"]')
|
||||
|
||||
await bot.sendMessage(chatId, `Клик по "Дальше"`)
|
||||
|
||||
await page.waitForTimeout(randomDelay())
|
||||
|
||||
await bot.sendMessage(chatId, '🔑 Введи код из email')
|
||||
|
||||
await page.waitForTimeout(randomDelay())
|
||||
|
||||
await page.click('[data-qa="applicant-login-input-otp"]')
|
||||
|
||||
const otp = await waitForOtp(chatId)
|
||||
|
||||
await page.fill('[data-qa="applicant-login-input-otp"] input', otp)
|
||||
|
||||
await bot.sendMessage(chatId, `Введён ОТП: ${otp}`)
|
||||
|
||||
await page.waitForTimeout(randomDelay())
|
||||
|
||||
await page.waitForLoadState('networkidle')
|
||||
|
||||
const cookies = await context.cookies()
|
||||
|
||||
await prisma.user.update({
|
||||
where: { telegramId: chatId },
|
||||
data: {
|
||||
session: JSON.stringify(cookies, null, 2),
|
||||
},
|
||||
})
|
||||
|
||||
await bot.sendMessage(chatId, `cookies: ${cookies.length}`)
|
||||
|
||||
await browser.close()
|
||||
|
||||
await getResume(chatId)
|
||||
}
|
||||
|
||||
export async function checkIsAuth(telegramId: bigint | number) {
|
||||
const browser = await getBrowser()
|
||||
const context = await browser.newContext()
|
||||
const page = await context.newPage()
|
||||
|
||||
await loadSession(page, telegramId)
|
||||
|
||||
console.log('Сессия загружена')
|
||||
|
||||
const url = `https://hh.ru/search/vacancy`
|
||||
|
||||
await page.goto(url, { waitUntil: 'networkidle' })
|
||||
|
||||
try {
|
||||
return await page.$('[data-qa="profileAndResumes-button"]')
|
||||
}
|
||||
catch (e) {
|
||||
return e
|
||||
}
|
||||
// return await page.$('[data-qa="mainmenu_createResume"]')
|
||||
}
|
||||
|
||||
export async function getResume(chatId: number) {
|
||||
const browser = await getBrowser()
|
||||
const context = await browser.newContext()
|
||||
const page = await context.newPage()
|
||||
await loadSession(page, chatId)
|
||||
const url = `https://hh.ru/applicant/resumes`
|
||||
await page.goto(url, { waitUntil: 'networkidle' })
|
||||
|
||||
const text = await page
|
||||
.$('[data-qa^="resume-card-link-"]')
|
||||
.then(html => html?.getAttribute('href'))
|
||||
|
||||
const hhUrl = new URL(`https://hh.ru${text}`)
|
||||
|
||||
const id = hhUrl.pathname.split('/').pop()!
|
||||
|
||||
const resumeUrl = `https://hh.ru/resume_converter/resume.txt?hash=${id}&type=txt&hhtmFrom=&hhtmSource=resume`
|
||||
|
||||
await page.goto(resumeUrl, { waitUntil: 'networkidle' })
|
||||
|
||||
let resume
|
||||
try {
|
||||
resume = await page.locator('.resume').innerText()
|
||||
|
||||
await prisma.resume.upsert({
|
||||
where: { id },
|
||||
create: { data: resume, id, telegramId: chatId },
|
||||
update: { data: resume },
|
||||
})
|
||||
}
|
||||
catch (e) {
|
||||
console.log(e)
|
||||
await bot.sendMessage(chatId, 'Нет резюме на ХХ, создайте')
|
||||
}
|
||||
finally {
|
||||
await browser.close()
|
||||
}
|
||||
|
||||
return resume
|
||||
}
|
||||
|
||||
export async function applyToJobs({
|
||||
query,
|
||||
area = 1,
|
||||
maxApplies = 10,
|
||||
}: ApplyOptions, { chatId }: {
|
||||
chatId: number
|
||||
}): Promise<ApplyResult> {
|
||||
const browser = await getBrowser()
|
||||
const context = await browser.newContext()
|
||||
const page = await context.newPage()
|
||||
const results: ApplyResult = { applied: [], skipped: [], errors: [] }
|
||||
|
||||
try {
|
||||
await loadSession(page, chatId)
|
||||
|
||||
const url = `https://hh.ru/search/vacancy?text=${encodeURIComponent(query)}&area=${area}`
|
||||
await page.goto(url, { waitUntil: 'networkidle' })
|
||||
|
||||
const isLoggedIn = await page.$('[data-qa="profileAndResumes-button"]')
|
||||
// await page.$('[data-qa="mainmenu_myResumes"]')
|
||||
if (!isLoggedIn) {
|
||||
return { ...results, error: 'Не авторизован. Выполните login' }
|
||||
}
|
||||
|
||||
await bot.sendMessage(chatId, `✅ Авторизация выполнена`)
|
||||
|
||||
const vacancies = await page.$$eval(
|
||||
'[data-qa="serp-item__title"]',
|
||||
links => links.map(a => ({
|
||||
href: (a as HTMLAnchorElement).href,
|
||||
title: a.textContent?.trim() ?? '',
|
||||
})),
|
||||
)
|
||||
|
||||
await bot.sendMessage(chatId, `✅ Вакансий найдено: ${vacancies.length}`)
|
||||
|
||||
for (const vacancy of vacancies.slice(0, maxApplies)) {
|
||||
try {
|
||||
await bot.sendMessage(chatId, `🔄 Обрабатывается вакансия: ${vacancy.title}`)
|
||||
await page.goto(vacancy.href, { waitUntil: 'networkidle' })
|
||||
|
||||
const description = await page
|
||||
.locator('[data-qa="vacancy-description"]')
|
||||
.innerText()
|
||||
|
||||
if (!description) {
|
||||
await bot.sendMessage(chatId, `😬 Ошибка с получением описания`)
|
||||
continue
|
||||
}
|
||||
|
||||
await bot.sendMessage(chatId, `✅ Описание получено`)
|
||||
|
||||
const resume = await prisma.resume.findFirst({
|
||||
where: { telegramId: chatId },
|
||||
})
|
||||
|
||||
if (!resume?.data) {
|
||||
await getResume(chatId)
|
||||
}
|
||||
|
||||
const user = await prisma.user.findUnique({
|
||||
where: { telegramId: chatId },
|
||||
})
|
||||
|
||||
const letter = await askGPT(resume!.data, description, user!.prompt)
|
||||
|
||||
await bot.sendMessage(chatId, `✅ Сопроводительное письмо отправлено: ${letter}`)
|
||||
|
||||
// const applyBtn = await page.$('[data-qa="vacancy-response-link-top"]')
|
||||
// if (!applyBtn) {
|
||||
// results.skipped.push(vacancy.title)
|
||||
// continue
|
||||
// }
|
||||
//
|
||||
// await randomScroll(page)
|
||||
//
|
||||
// await applyBtn.click()
|
||||
// await page.waitForTimeout(randomDelay())
|
||||
//
|
||||
// const submitBtn = await page.$('[data-qa="vacancy-response-popup-submit"]')
|
||||
// if (submitBtn) {
|
||||
// await submitBtn.click()
|
||||
// await page.waitForTimeout(randomDelay())
|
||||
// }
|
||||
|
||||
results.applied.push(vacancy.title)
|
||||
// await page.waitForTimeout(3000 + Math.random() * 2000)
|
||||
}
|
||||
catch (err) {
|
||||
results.errors.push(`${vacancy.title}: ${(err as Error).message}`)
|
||||
}
|
||||
}
|
||||
}
|
||||
finally {
|
||||
await browser.close()
|
||||
}
|
||||
|
||||
return results
|
||||
}
|
||||
Reference in New Issue
Block a user