我有一个像这样的大型 JSON 文件:
[
{
"id": 2000,
"city": "New York",
"lat": "",
"lon": "",
},
...
]
我想为每个对象查找对应的纬度和经度。我正在使用 JSONStream 模块,通过管道(pipe)以流的方式处理数据:
// Source file, read as UTF-8 text.
var readStream = fs.createReadStream(
  'data/dummy/institucion_1_2000.json',
  { encoding: 'utf8' }
);
// Destination file for the processed output.
var writeStream = fs.createWriteStream('data/stream.json');
// Search for lat and lon
// Synchronous map stage: for objects whose lat is "", it starts a geocode
// lookup for data.city and returns the object right away.
// NOTE(review): the `return data` below executes before the geocode promise
// settles, so lat/lon are presumably still "" when the object moves downstream.
// NOTE(review): nothing is returned when data.lat is not "", so the callback
// yields undefined for those objects — confirm how es.mapSync treats that.
var search = es.mapSync(function(data){
if(data.lat == ""){
// Search for the lat and lon
geocoder.geocode({address: data.city, country: "US"})
.then(function(res) {
console.log("Searched for " + res[0].formattedAddress);
// Copy the coordinates of the first result onto the streamed object.
data.lat = res[0].latitude;
data.lon = res[0].longitude;
})
.catch(function(err) {
console.log("There was an error with element with id = " + data.id);
console.log("Here is the error: " + err);
// Terminate the process when the error text matches the rate-limit message.
if(err == 'Error: Status is OVER_QUERY_LIMIT. You have exceeded your rate-limit for this API.') {
process.exit();
}
});
return data;
}
})
// Pipeline: read -> JSONStream.parse -> search -> JSONStream.stringify -> write
readStream
  .pipe(JSONStream.parse('*'))
  .pipe(search)
  // This stage doesn't wait until the search has finished
  .pipe(JSONStream.stringify())
  .pipe(writeStream);
地理编码部分有效。
我的问题是:JSONStream.stringify 在 search 函数完成之前就读取并通过管道传出了数据,所以我得到的 JSON 文件与原文件相同,没有我需要的修改。如果我只是用下面这段代码:
// Synchronous stand-in for the geocode lookup: no asynchronous work is started here.
// NOTE(review): this assigns to a bare `lat`, not `data.lat` — presumably data.lat was intended; confirm.
if(data.lat == ""){
lat = 1;
}
来代替耗时更长的地理编码,它就能正常工作。我猜问题出在修改流式数据需要一定的时间。那么,有没有办法等数据修改完成之后再通过管道传输?
编辑:我把同步和异步搞混了。感谢 djones。
/**
 * Asynchronous map stage that fills in missing coordinates.
 *
 * Objects whose lat is "" are geocoded from data.city, and lat/lon are copied
 * from the first result. Every object is handed to `callback` exactly once:
 * immediately when no lookup is needed, otherwise after the lookup has settled
 * (successfully or not). es.map requires the callback to be invoked for each
 * item; an item whose callback is never called never leaves this stage.
 *
 * @param {Object} data - One parsed element of the input array (reads id, city, lat; writes lat, lon).
 * @param {Function} callback - Node-style `(err, data)` callback supplied by es.map.
 */
var search = es.map(function (data, callback) {
  // Nothing to look up: pass the object through unchanged.
  if (data.lat != "") {
    callback(null, data);
    return;
  }

  geocoder.geocode({address: data.city, country: "USA"}) // Choose between Comuna_Empresa and Comuna_Institucion
    .then(function (res) {
      console.log("Searched for " + res[0].formattedAddress);
      data.lat = res[0].latitude;
      data.lon = res[0].longitude;
    })
    .catch(function (err) {
      // Best effort: log the failure and keep the object with its empty
      // coordinates. Also reached when `res` is empty and res[0] is undefined.
      console.log("There was an error with element with id = " + data.id);
      console.log("Here is the error: " + err);
    })
    .then(function () {
      // Runs after either branch above, so the callback fires exactly once.
      callback(null, data);
    });
});