-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgetcheguanshuo.js
99 lines (72 loc) · 2.09 KB
/
getcheguanshuo.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
const devices = require('puppeteer/DeviceDescriptors')
const puppeteer = require('puppeteer'),
fs = require('fs'),
$ = require('jquery'),
path = require('path');
const XLSX = require("xlsx");
const WorkBook = require("./workbook");
/**
 * Script entry point.
 *
 * Launches Chrome through Puppeteer, scrapes the anchor list on the
 * cgs.gzjd.gov.cn "contactauthorized" page, writes the result to
 * `车管所.xlsx` and `cheguanshuo.json`, and always closes the browser
 * afterwards so the Node process can exit.
 */
(async () => {
  // Origin prepended to the (site-relative) href of every scraped anchor.
  const SITE_ORIGIN = 'http://cgs.gzjd.gov.cn';
  const LIST_URL = 'http://cgs.gzjd.gov.cn/nsyycms/contactauthorized/index.jhtml';

  const browser = await puppeteer.launch({
    executablePath: '/opt/google/chrome/chrome',
    headless: false,
  });

  /**
   * Writes `data` as JSON to `file`.
   *
   * Best-effort, like the original callback: a write failure is logged and
   * does not abort the run. The returned promise settles once the write has
   * finished, so the caller can wait for it before shutting down.
   *
   * @param {string} file - Destination path.
   * @param {*} data - JSON-serialisable value.
   * @returns {Promise<void>}
   */
  const writeJson = (file, data) =>
    new Promise((resolve) => {
      fs.writeFile(file, JSON.stringify(data), (err) => {
        if (err) {
          console.error(err);
        } else {
          console.log("数据写入成功!");
        }
        resolve();
      });
    });

  /**
   * Scrapes one listing page and exports the records found on it.
   *
   * @param {string} url - Page to open.
   * @returns {Promise<Array<{name: ?string, addr: ?string, link: string}>>}
   *   One record per `#jczgl .stadiv a` anchor, built from its `name`,
   *   `title` and `href` attributes.
   */
  const getOnePage = async (url) => {
    const page = await browser.newPage();
    try {
      // Must be set before navigating: it only applies to later navigations.
      await page.setJavaScriptEnabled(true);
      await page.goto(url, {
        waitUntil: 'networkidle2',
      });
      // Fixed pause after network idle; presumably lets late scripts finish
      // rendering the list — TODO confirm it is still needed.
      await page.waitFor(1200);

      // The callback runs inside the browser, so it cannot close over Node
      // variables; the origin is passed in as an argument instead.
      const records = await page.evaluate((origin) => {
        const anchors = Array.from(document.querySelectorAll('#jczgl .stadiv a'));
        return anchors.map((anchor) => {
          const href = anchor.getAttribute('href');
          return {
            name: anchor.getAttribute('name'),
            addr: anchor.getAttribute('title'),
            // Avoid producing "<origin>null" for anchors without an href.
            link: href ? origin + href : '',
          };
        });
      }, SITE_ORIGIN);
      console.log(records);

      // Header row: name, address, link.
      const header = ['名称', '地址', '链接'];
      const rows = records.map(({ name, addr, link }) => [name, addr, link]);
      const workbook = new WorkBook({
        Sheet1: [header, ...rows],
      });
      // WorkBook is project-local; if writeFile is synchronous the await is a no-op.
      await workbook.writeFile('车管所.xlsx');

      await writeJson('cheguanshuo.json', records);
      return records;
    } finally {
      // Release the tab even when navigation or scraping fails.
      await page.close();
    }
  };

  /**
   * Logs progress and scrapes the listing page.
   *
   * @param {number} i - Current page index (used for the progress log only).
   * @param {number} maxPage - Total number of pages (progress log only).
   * @returns {Promise<void>}
   */
  const getAllPage = async (i, maxPage) => {
    console.log('抓取进度:', `${i}/${maxPage}`);
    await getOnePage(LIST_URL);
  };

  try {
    await getAllPage(1, 1);
    console.log('hehe');
  } finally {
    // Close Chrome on success and on failure; otherwise the process never exits.
    await browser.close();
  }
})().catch((err) => {
  console.error(err);
  process.exitCode = 1;
});