python到node.js的混淆

python to node.js confusion

本文关键字:js node python      更新时间:2024-07-17

所以我有这个python代码,我正试图将其转换为node.js,但我不确定如何转换。

import urllib.request, re
def getDef(word):
    link = "http://www.merriam-webster.com/dictionary/%s" % word
    data = urllib.request.urlopen(link).read().decode()
    try:
        return re.search("<p>: (.*?)</p><p>", data).group(1)
    except:
        return "No match"
 class newDefinition:
     def __init__(self, word):
         self.definition = getDef(word);
 >>> definition = newDefintion("color")
 >>> print(definition.definition)
a quality such as red, blue, green, yellow, etc., that you see when you look at something

然而,尽管在node.js中,我似乎可以像在python中一样返回它,因为它是回调的做事方式,或者至少我似乎不能返回它,这就是为什么我问我该如何实现node.js的等效性,或者它们没有等效性?这是我到目前为止所拥有的,也许你可以发现我做错了什么,以及如何修复

var urllib = require("urllib"); // installed with npm
var getDef = function(word){
    var link = "http://www.merriam-webster.com/dictionary/" + word;
    var urlData = urllib.request(link, {}, function(err, data, res){
        var re = new RegExp("<p>: (.*?)</p><p>");
        var results = data.toString();
        var match = re.exec(results)[1];
        return match; // Expected it to give urlData the definition
    });
    return urlData;
}
var Definition = function(word){
    this.definition = getDef(word);
}
definition = new Definition("color");
console.log(definition.definition); // this won't give the definition but the information of the urllib itself rather.

所以一般来说,我想知道如何使用异步代码,这样我就可以返回我需要的东西,但我也不习惯这个概念,所以在python中有类似的东西吗?此外,如果你能给我介绍一些关于异步代码的好文档,那也会很棒。

由于return实际上只是退出函数而不是返回值,因此需要使用回调。它看起来是这样的:

var urllib = require("urllib");
var getDef = function(word, callback){
  var link = 'http://www.merriam-webster.com/dictionary/' + word;
  urllib.request(link, {}, function(err, data, res) {
    var re = new RegExp('<p>: (.*?)</p><p>');
    var results = data.toString();
    var match = re.exec(results)[1];
    callback(match);
  });
};

然后,您将在调用函数时传递回调:

getDef('color', function(definition) {
  console.log(definition);
});

编辑:设置对象的属性也有同样的想法。相反,它可能看起来像这样:

var Definition = function(word) {
  var self = this;
  getDef(world, function(definition, callback) {
    self.definition = definition;
    callback.call(self);
  });
};

这样称呼:

var definition = new Definition('color', function() {
  console.log(definition.definition);
});

这是我值得两分钱的建议。

永远不要使用正则表达式来解析HTML(请参阅此处了解更多详细信息),而是使用类似XPath的库来解析文档。您可以使用像cheerio或phantomjs这样的库。

这是一个干净的解决方案。

var request = require('request'),
    when    = require('when'),
    cheerio = require('cheerio');
var URL = 'http://www.merriam-webster.com/dictionary/';
/**
 * @param word: Word to search the dictionary
 * @returns 
 *   Promise object which resolves to array of
 *   definitions of the word
 */
var getDef = function(word){
    var defer = when.defer();
    request(URL + word, function(err, res, body){
        if (err || res.statusCode !== 200){
            defer.reject();
        }
        var defs = [];
        var $ = cheerio.load(body);
        $('.wordclick .headword:first-child p').each(function(i,ele){
            var definition = $(ele).text();
            defs.push(definition);
        });
        defer.resolve(defs);
    });
    return defer.promise;
}
getDef('happy').then(function(words){
    console.log(words);
});

注意:这里我使用的是when(Promise+库),而不是Node的标准CPS样式。