使用Node.js从URL读取内容

Luk*_*uke 26 node.js

我正在尝试从带有Node.js的URL读取内容,但我似乎得到的只是一堆字节.我显然做错了什么,但我不确定是什么.这是我目前的代码:

var http = require('http');

var client = http.createClient(80, "google.com");
request = client.request();
request.on('response', function( res ) {
    res.on('data', function( data ) {
        console.log( data );
    } );
} );
request.end();
Run Code Online (Sandbox Code Playgroud)

任何见解将不胜感激.

小智 38

尝试使用客户端的on error事件来查找问题.

var http = require('http');

var options = {
    host: 'google.com',
    path: '/'
}
var request = http.request(options, function (res) {
    var data = '';
    res.on('data', function (chunk) {
        data += chunk;
    });
    res.on('end', function () {
        console.log(data);

    });
});
request.on('error', function (e) {
    console.log(e.message);
});
request.end();
Run Code Online (Sandbox Code Playgroud)


sid*_*mor 10

HTTP和HTTPS:

const getScript = (url) => {
    return new Promise((resolve, reject) => {
        const http      = require('http'),
              https     = require('https');

        let client = http;

        if (url.toString().indexOf("https") === 0) {
            client = https;
        }

        client.get(url, (resp) => {
            let data = '';

            // A chunk of data has been recieved.
            resp.on('data', (chunk) => {
                data += chunk;
            });

            // The whole response has been received. Print out the result.
            resp.on('end', () => {
                resolve(data);
            });

        }).on("error", (err) => {
            reject(err);
        });
    });
};

(async (url) => {
    console.log(await getScript(url));
})('https://sidanmor.com/');
Run Code Online (Sandbox Code Playgroud)


tti*_*sdf 9

@sidanmor 代码的稍微修改版本。要点是,并非每个网页都是纯 ASCII,用户应该能够手动处理解码(甚至编码为 Base64)

function httpGet(url) {
  return new Promise((resolve, reject) => {
    const http = require('http'),
      https = require('https');

    let client = http;

    if (url.toString().indexOf("https") === 0) {
      client = https;
    }

    client.get(url, (resp) => {
      let chunks = [];

      // A chunk of data has been recieved.
      resp.on('data', (chunk) => {
        chunks.push(chunk);
      });

      // The whole response has been received. Print out the result.
      resp.on('end', () => {
        resolve(Buffer.concat(chunks));
      });

    }).on("error", (err) => {
      reject(err);
    });
  });
}

(async(url) => {
  var buf = await httpGet(url);
  console.log(buf.toString('utf-8'));
})('https://httpbin.org/headers');
Run Code Online (Sandbox Code Playgroud)


Mar*_*ahn 8

数据对象是字节缓冲区.只需调用.toString()以获取人类可读的代码:

console.log( data.toString() );
Run Code Online (Sandbox Code Playgroud)

reference:Node.js缓冲区