2013-10-22 109 views
0

我试图创建一个NodeJS应用程序来提取SQL记录并将它们插入到MongoDB中。我感兴趣的表格有些大(100万+记录)。对于小数据集(< 200,000),我的应用工作得很好,但是对整个桌面运行开始消耗RAM并使服务器爬行。NodeJS操作顺序

看起来Node正在运行我的“for”循环,为每个SQL sub select分支进程,然后运行MongoDB更新。

我从来没有看到“Mongo Connected!”直到最后一个“获得对活动的响应#”写入屏幕。

#!/var/node/bin/node 
var odbc = require("odbc"); 
var db = new odbc.Database(); 

var MongoClient = require('mongodb').MongoClient; 
var format = require('util').format; 

db.open("DSN=<DSN>;SERVER=<SERVER>;DATABASE=<DB>;UID=<UID>;PWD=<PWD>", function (err) { 
    if(err) throw err; 
    console.log("SQL Connected!"); 

     var sqlstr = "SELECT TOP 1000 * FROM tbl_A NOLOCK"; 
     console.log("Executing '" + sqlstr + "' against SQL Server"); 

     db.query(sqlstr, function (sql1err, rows, moreResults) { 
     if (sql1err) throw sql1err; 

     for (var i = 0; i < rows.length; i++) { 
      InsertActivity(db, rows[i], i, rows.length, function() {}); 
     } 
     }); 
}); 

function InsertActivity(sql, activity, cur, total, callback) { 
    console.log("Getting Responses for Activity #" + activity.ActivityID); 
    var rsql = "SELECT * FROM tbl_Responses NOLOCK WHERE ActivityID = " + activity.ActivityID; 
    sql.query(rsql, function (sqlerr, rows, moreResults) { 
     if (sqlerr) console.log(sqlerr); 
     activity.resonses = rows; 

     MongoClient.connect('mongodb://localhost:27017/m', function (merr, mdb) { 
     console.log("Mongo Connected!"); 
     mdb.collection("activity").insert(activity, function() { 
      console.log("Inserted Activity #" + activity.ActivityID + " inserted into Mongo"); 
      mdb.close(function() { console.log("Mongo Disconnected!"); }); 
      callback(); 
     }); 
     }); 

     if (cur == total - 1) sql.close(function() { console.log("SQL Disconnected!"); }); 
    }); 

    console.log(rsql); 
} 

回答

0

你需要的是不幸的是一个无证的函数(我会解决这个问题)。函数是db.queryResult,它返回结果对象,允许您单独获取行。这将避免将整个结果集缓冲到内存中。

https://github.com/wankdanker/node-odbc/blob/master/test/test-query-select-fetch.js

var db = require('odbc')(); 

db.open(connectionString, function (err) { 
    db.queryResult('select * from tbl_A NOLOCK', function (err, result) { 
     fetchMore(); 

     function fetchMore() { 
      result.fetch(function (err, data) { 
       if (!data) { 
        //we're all done, clean up 
       } 

       doStuffWithData(data, function (err) { 
        fetchMore(); 
       }); 
      }); 
     } 
    }); 
}); 

function doStuffWithData(data, cb) { 
    //do stuff 
    cb(null); 
}