1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586 |
- var should = require('should'),
- needle = require('./../'),
- Q = require('q'),
- chardet = require('jschardet');
- describe('character encoding', function() {
- var url;
- this.timeout(5000);
- describe('test A', function() {
- before(function() {
- url = 'http://www.nina.jp/server/slackware/webapp/tomcat_charset.html';
- })
- describe('with decode = false', function() {
- it('does not decode', function(done) {
- needle.get(url, { decode: false }, function(err, resp) {
- resp.body.should.be.a.String;
- chardet.detect(resp.body).encoding.should.eql('windows-1252');
- resp.body.indexOf('EUCを使う').should.eql(-1);
- done();
- })
- })
- })
- describe('with decode = true', function() {
- it('decodes', function(done) {
- needle.get(url, { decode: true }, function(err, resp) {
- resp.body.should.be.a.String;
- chardet.detect(resp.body).encoding.should.eql('ascii');
- resp.body.indexOf('EUCを使う').should.not.eql(-1);
- done();
- })
- })
- })
- })
- describe('test B', function() {
- it('encodes to UTF-8', function(done) {
- // Our Needle wrapper that requests a chinese website.
- var task = Q.nbind(needle.get, needle, 'http://www.chinesetop100.com/');
- // Different instantiations of this task
- var tasks = [Q.fcall(task, {decode: true}),
- Q.fcall(task, {decode: false})];
- var results = tasks.map(function(task) {
- return task.then(function(obj) {
- return obj[0].body;
- });
- });
- // Execute all requests concurrently
- Q.all(results).done(function(bodies) {
- var charsets = [
- chardet.detect(bodies[0]).encoding,
- chardet.detect(bodies[1]).encoding,
- ]
- // We wanted to decode our first stream.
- charsets[0].should.equal('ascii');
- bodies[0].indexOf('全球中文网站前二十强').should.not.equal(-1);
- // But not our second stream.
- charsets[1].should.equal('windows-1252');
- bodies[1].indexOf('全球中文网站前二十强').should.equal(-1);
- done();
- });
- })
- })
- })
|