红糖糍粑
首先要确定待爬取页面的编码。如果页面是 GBK 编码,就需要用 iconv 库把抓取到的内容转换成 UTF-8,再在 Node.js 中处理。注意:opts 里要把 encoding 设为 'binary'(request 默认会按 UTF-8 解码响应体,GBK 字节会在这一步被破坏),这样下面的 new Buffer(body, 'binary') 才能还原出原始字节。比如:

var request = require('request'),
    cheerio = require('cheerio'),
    Iconv = require('iconv').Iconv;
var iconv = new Iconv('GBK', 'UTF-8');
request(opts, function (err, response, body) {
    var result = iconv.convert(new Buffer(body, 'binary')).toString();
    var $ = cheerio.load(result);
    // ......
});