-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathindex.js
More file actions
72 lines (60 loc) · 1.7 KB
/
index.js
File metadata and controls
72 lines (60 loc) · 1.7 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
import puppeteer from 'puppeteer';
import { writeFile } from './src/writeFile.js';
import { handleData } from './src/handleData.js';
import { url } from './config.js';
import { changeLink } from './src/handleData.js';
// Options for a visible (non-headless) browser window.
// NOTE(review): the 0x0 default viewport is presumably meant to stop Puppeteer
// from forcing a fixed page size — confirm; `defaultViewport: null` is the
// documented way to disable the default viewport.
const launchOptions = {
  headless: false,
  defaultViewport: { width: 0, height: 0 },
};
const browser = await puppeteer.launch(launchOptions);
const page = await browser.newPage();
// Open the search URL and wait until the job list container is present.
await page.goto(url);
await page.waitForSelector('.job-list-box');
// Read the page count from the text of the second-to-last pagination link.
const parsedPageCount = await page.$eval(
  '.options-pages a:nth-last-child(2)',
  // Explicit radix so the label is always read as a decimal number.
  (anchor) => Number.parseInt(anchor.textContent, 10)
);
// A non-numeric label would otherwise make the listing loop run zero times
// and silently produce an empty result. The job list was found above, so
// fall back to scraping a single page.
const hasValidPageCount =
  Number.isInteger(parsedPageCount) && parsedPageCount >= 1;
if (!hasValidPageCount) {
  console.warn(
    `Could not read the page count (got ${parsedPageCount}); scraping 1 page.`
  );
}
const totalPage = hasValidPageCount ? parsedPageCount : 1;
// Visit each result page in order and collect one record per job card.
const allJobs = [];
let pageNumber = 1;
while (pageNumber <= totalPage) {
  await page.goto(`${url}&page=${pageNumber}`);
  await page.waitForSelector('.job-list-box');
  // The callback runs inside the page, so it may only use DOM APIs and
  // whatever it defines itself.
  const jobsOnPage = await page.$eval('.job-list-box', (listBox) =>
    Array.from(listBox.querySelectorAll('.job-card-wrapper'), (card) => {
      // Text content of the first descendant of this card matching `selector`.
      const textOf = (selector) => card.querySelector(selector).textContent;
      return {
        job: {
          name: textOf('.job-name'),
          area: textOf('.job-area'),
          salary: textOf('.salary'),
        },
        link: card.querySelector('a').href,
        company: {
          name: textOf('.company-name'),
        },
      };
    })
  );
  for (const job of jobsOnPage) {
    allJobs.push(job);
  }
  pageNumber += 1;
}
// Open each job's detail page and attach its description text as `desc`.
for (const job of allJobs) {
  try {
    // Link rewriting and navigation are inside the try so that one broken
    // link or failed page load is logged and skipped, rather than aborting
    // the run and losing every job collected so far.
    await page.goto(changeLink(job.link));
    await page.waitForSelector('.job-sec-text');
    job.desc = await page.$eval('.job-sec-text', (el) => el.textContent);
    console.log(job);
  } catch (e) {
    // Best effort: the job is kept without a `desc` field.
    console.log('🚀 ~ e:', e);
  }
}
// Scraping is finished; close the browser so its process is not left running.
await browser.close();
const result = handleData(allJobs);
// NOTE(review): awaited in case writeFile returns a promise — awaiting a
// non-promise value is harmless. Confirm against ./src/writeFile.js.
await writeFile(result);