Node.js 爬虫

版权声明:本文为博主原创文章,未经博主允许不得转载。 https://blog.csdn.net/adley_app/article/details/85218165
const request = require('request')
const cheerio = require('cheerio')

const MongoClient = require('mongodb').MongoClient;
const url = 'mongodb://localhost:27017';


/**
 * Scrape https://movie.douban.com/top250 and store one document per list
 * entry in the `movie` collection of the `douban` database.
 *
 * Each stored document has the shape `{ title, imgSrc, rate }`, where the
 * values are read from the first `.title` element, the `<img>` `src`
 * attribute and the `.rating_num` element of every `.grid_view li` node.
 *
 * The MongoDB client is closed on every exit path of the request callback
 * (fetch failure, empty result, insert success, insert failure). It cannot be
 * closed at the end of the connect callback because the request and the
 * insert complete asynchronously, after that callback has already returned.
 */
MongoClient.connect(url, function(err, client) {
	// Without this guard `client` is undefined on failure and `client.db` throws.
	if (err) {
		console.error('Failed to connect to MongoDB:', err);
		return;
	}
	console.log("Connected successfully to server");

	const log = console.log;
	const collection = client.db("douban").collection('movie');

	request.get('https://movie.douban.com/top250', (fetchErr, response) => {
		// On a transport error `response` is undefined, so check before touching it.
		if (fetchErr || !response) {
			console.error('Failed to fetch the movie list:', fetchErr);
			client.close();
			return;
		}
		// A non-2xx answer carries no movie list worth parsing.
		if (response.statusCode < 200 || response.statusCode >= 300) {
			console.error(`Failed to fetch the movie list: HTTP ${response.statusCode}`);
			client.close();
			return;
		}

		const $ = cheerio.load(response.body);
		const items = $('.grid_view li');
		log(items.length);

		const movies = items.toArray().map((item) => {
			const entry = $(item);
			return {
				title: entry.find('.title').eq(0).text(),
				imgSrc: entry.find('img').attr("src"),
				rate: entry.find('.rating_num').text(),
			};
		});

		// The driver rejects an empty batch, so skip the insert entirely.
		if (movies.length === 0) {
			console.error('No movies found on the page; nothing to insert.');
			client.close();
			return;
		}

		// `insertMany` replaces the deprecated `insert` for arrays of documents.
		collection.insertMany(movies, (insertErr, insertResult) => {
			if (insertErr) {
				console.error('Failed to insert movies:', insertErr);
			} else {
				log(insertResult);
			}
			client.close();
		});
	});
});



猜你喜欢

转载自blog.csdn.net/adley_app/article/details/85218165