A Node.js library for converting HTML documents of arbitrary encoding to UTF-8.
npm install html-to-utf8
// Usage example: download a page as raw bytes, then convert it to UTF-8.
var request = require('request');
var toUTF8 = require('html-to-utf8');

var requestOptions = {
  url: 'http://www.rakuten.co.jp',
  // A null encoding stops request from decoding the response, so the
  // callback receives the raw body instead of an already-decoded string.
  encoding: null
};

/**
 * Callback for the request above.
 *
 * @param {Error} error - set when the request failed.
 * @param {Object} response - the response; only its `headers` are read here.
 * @param {Buffer} rawBody - the undecoded response body.
 */
function onResponse(error, response, rawBody) {
  if (error) {
    console.error(error.stack);
  } else {
    // The Content-Type header is handed to toUTF8 alongside the raw body
    // (presumably as a hint for the source encoding -- see the library docs).
    var htmlInUTF8 = toUTF8(rawBody, response.headers['content-type']);
  }
}

request(requestOptions, onResponse);
The code is available under the MIT license.