summaryrefslogtreecommitdiff
path: root/node_modules/needle/test/decoder_spec.js
diff options
context:
space:
mode:
Diffstat (limited to 'node_modules/needle/test/decoder_spec.js')
-rw-r--r--node_modules/needle/test/decoder_spec.js86
1 files changed, 86 insertions, 0 deletions
diff --git a/node_modules/needle/test/decoder_spec.js b/node_modules/needle/test/decoder_spec.js
new file mode 100644
index 0000000..5225f6f
--- /dev/null
+++ b/node_modules/needle/test/decoder_spec.js
@@ -0,0 +1,86 @@
+var should = require('should'),
+ needle = require('./../'),
+ Q = require('q'),
+ chardet = require('jschardet');
+
+describe('character encoding', function() {
+
+ var url;
+ this.timeout(5000);
+
+ describe('test A', function() {
+
+ before(function() {
+ url = 'http://www.nina.jp/server/slackware/webapp/tomcat_charset.html';
+ })
+
+ describe('with decode = false', function() {
+
+ it('does not decode', function(done) {
+
+ needle.get(url, { decode: false }, function(err, resp) {
+ resp.body.should.be.a.String;
+ chardet.detect(resp.body).encoding.should.eql('windows-1252');
+ resp.body.indexOf('EUCを使う').should.eql(-1);
+ done();
+ })
+
+ })
+
+ })
+
+ describe('with decode = true', function() {
+
+ it('decodes', function(done) {
+
+ needle.get(url, { decode: true }, function(err, resp) {
+ resp.body.should.be.a.String;
+ chardet.detect(resp.body).encoding.should.eql('ascii');
+ resp.body.indexOf('EUCを使う').should.not.eql(-1);
+ done();
+ })
+
+ })
+
+ })
+
+ })
+
+ describe('test B', function() {
+
+ it('encodes to UTF-8', function(done) {
+
+ // Our Needle wrapper that requests a chinese website.
+ var task = Q.nbind(needle.get, needle, 'http://www.chinesetop100.com/');
+
+ // Different instantiations of this task
+ var tasks = [Q.fcall(task, {decode: true}),
+ Q.fcall(task, {decode: false})];
+
+ var results = tasks.map(function(task) {
+ return task.then(function(obj) {
+ return obj[0].body;
+ });
+ });
+
+ // Execute all requests concurrently
+ Q.all(results).done(function(bodies) {
+
+ var charsets = [
+ chardet.detect(bodies[0]).encoding,
+ chardet.detect(bodies[1]).encoding,
+ ]
+
+ // We wanted to decode our first stream.
+ charsets[0].should.equal('ascii');
+ bodies[0].indexOf('全球中文网站前二十强').should.not.equal(-1);
+
+ // But not our second stream.
+ charsets[1].should.equal('windows-1252');
+ bodies[1].indexOf('全球中文网站前二十强').should.equal(-1);
+
+ done();
+ });
+ })
+ })
+})