-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathindex.js
73 lines (73 loc) · 2.56 KB
/
index.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
const puppeteer = require('puppeteer')
const {user} = require('./config')
var json2csv = require('json2csv')
var fs = require('fs')
const totalText = []
const getLastPage = async (page) => {
let lastPage = await page.evaluate(() => {
let pages = [...document.querySelectorAll('.WB_cardpage.S_line1 .W_pages a.page.S_txt1')]
// 最后一页在倒数第二个标签
let lastPage = pages[pages.length - 2]
return lastPage.innerText
})
return lastPage
}
const transToCsvFile = (data) => {
const fields = ['name', 'href', 'address']
const fieldNames = ['名称', '链接', '地址']
const csv = json2csv({data, fields, fieldNames})
console.log('csv', csv)
fs.writeFile('file.csv', csv, function(err) {
if (err) throw err;
console.log('file saved')
})
}
const main = async () => {
try {
const browser = await puppeteer.launch({
executablePath: './node_modules/puppeteer/local/chrome-win32/chrome',
headless: false,
userDataDir: 'weibo'
})
const page = await browser.newPage()
page.on('console', console.log)
page.on('dialog', async dialog => {
console.log(dialog.message())
await dialog.dismiss()
})
let totalUserList = []
let fansPage = 1
await page.goto(`https://weibo.com/p/1005051782703161/follow?page=${fansPage}#Pl_Official_HisRelation__60`, {waitUntil: 'networkidle2'})
let lastPage = await getLastPage(page)
// 拿当前页的数据
for (let i = 1; i <= 5; i++) {
let pageSize = i
if (i !== 1) {
await page.goto(`https://weibo.com/p/1005051782703161/follow?page=${pageSize}#Pl_Official_HisRelation__60`, {waitUntil: 'networkidle2'})
}
let userList = await page.evaluate(() => {
let nameAndHrefList = [...document.querySelectorAll('.follow_box .follow_list li.follow_item .info_name a.S_txt1')]
let addressList = [...document.querySelectorAll('.follow_box .follow_list li.follow_item .info_add span')]
let fanList = []
if (nameAndHrefList.length === addressList.length) {
for (var i = 0; i < nameAndHrefList.length; i++) {
let nameAndHref = nameAndHrefList[i]
let address = addressList[i]
fanList.push({
name: nameAndHref.innerText,
href: nameAndHref.href,
address: address.innerText
})
}
}
return fanList
})
// console.log('userList', userList)
totalUserList = [...totalUserList, ...userList]
}
transToCsvFile(totalUserList)
} catch (e) {
console.error('e', e)
}
}
main()