generated from alexk111/store-of-something
-
-
Notifications
You must be signed in to change notification settings - Fork 2
/
data-collector-cpi.js
106 lines (92 loc) · 3.13 KB
/
data-collector-cpi.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
const http = require("http");
const path = require("path");
const csv = require("csv-parser");
const fse = require("fs-extra");
// Root of the project sources, given relative to the working directory.
const pathSrc = "./src";
// Directory under the sources that holds collected data sets.
const pathCollected = `${pathSrc}/data/_collected`;
// Directory that receives the per-country CPI JSON files.
const pathCollectedCPI = `${pathCollected}/cpi`;
/**
 * Pause for a number of milliseconds.
 *
 * @param {number} duration - Time to wait, in milliseconds (passed to setTimeout).
 * @returns {Promise<void>} Promise that fulfils with undefined once the timer fires.
 */
async function delay(duration) {
  await new Promise((wake) => {
    setTimeout(wake, duration);
  });
}
/**
 * Read a countries CSV file into a lookup object keyed by country code.
 *
 * Each row's `country_code` column becomes a key whose value holds that row's
 * `country_name` and `currency_code`. A later row with the same code replaces
 * the earlier one.
 *
 * @param {string} filePath - Path of the CSV file to read.
 * @returns {Promise<Object<string, {country_name: string, currency_code: string}>>}
 *   Resolves with the lookup once the whole file has been parsed.
 *   Rejects if the file cannot be read or the parser reports an error.
 */
async function loadCountriesFromCSV(filePath) {
  const countriesByCode = {};
  return new Promise((resolve, reject) => {
    fse
      .createReadStream(filePath)
      // pipe() does not forward errors from the source stream, so a missing or
      // unreadable file has to be caught on the read stream itself.
      .on("error", reject)
      .pipe(csv({}))
      .on("data", ({ country_code, country_name, currency_code }) => {
        countriesByCode[country_code] = {
          country_name,
          currency_code,
        };
      })
      .on("end", () => {
        resolve(countriesByCode);
      })
      .on("error", reject);
  });
}
/**
 * Request the monthly `PCPI_IX` series for a group of countries from the IMF
 * data service (2013 through the current UTC year) and write one JSON file per
 * returned series into `pathCollectedCPI`.
 *
 * Each output file is named `<REF_AREA>.json` and contains an array of
 * `[timePeriod, observedValue]` pairs taken from the series' observations.
 * Series without an `Obs` member are skipped.
 *
 * @param {string[]} countryCodes - Country codes to request in a single call.
 * @returns {Promise<void>} Resolves once every returned series has been written.
 *   Rejects with an Error on network failure, a non-2xx HTTP status,
 *   an unparsable response body, or a file-write failure.
 */
async function loadCPIFromRemoteAPI(countryCodes) {
  const url = `http://dataservices.imf.org/REST/SDMX_JSON.svc/CompactData/CPI/M.${countryCodes.join("+")}.PCPI_IX?startPeriod=2013&endPeriod=${(new Date()).getUTCFullYear()}`;
  // NOTE(review): the service may return a lone series/observation as a bare
  // object instead of a one-element array — confirm against the API; wrapping
  // is harmless either way and avoids "not iterable" / silently empty output.
  const toArray = (value) => (Array.isArray(value) ? value : [value]);
  return new Promise((resolve, reject) => {
    http
      .get(url, {
        headers: {
          "User-Agent": "Data Agent"
        }
      }, (res) => {
        if (res.statusCode < 200 || res.statusCode >= 300) {
          // Drain the response so the socket is released, then fail clearly
          // instead of trying to JSON-parse an error page.
          res.resume();
          reject(new Error(`CPI request failed with HTTP status ${res.statusCode}`));
          return;
        }
        // Decode as UTF-8 at the stream level so multi-byte characters split
        // across chunks are not corrupted by string concatenation.
        res.setEncoding("utf8");
        let body = "";
        res.on("data", (chunk) => {
          body += chunk;
        });
        res.on("error", reject);
        res.on("end", async () => {
          try {
            const gotData = JSON.parse(body);
            const series = gotData && gotData.CompactData && gotData.CompactData.DataSet && gotData.CompactData.DataSet.Series;
            if (series) {
              for (const seriesItem of toArray(series)) {
                if (!seriesItem.Obs) {
                  continue;
                }
                const countryCode = seriesItem["@REF_AREA"];
                const pathOutFile = path.join(pathCollectedCPI, `${countryCode}.json`);
                const outData = toArray(seriesItem.Obs).map((dataItem) => [
                  dataItem["@TIME_PERIOD"],
                  dataItem["@OBS_VALUE"],
                ]);
                // outputFile creates the target directory when it is missing.
                await fse.outputFile(pathOutFile, JSON.stringify(outData, null, 2));
              }
            }
            resolve();
          } catch (error) {
            // Reject with the Error itself so the stack trace is preserved.
            reject(error);
          }
        });
      })
      .on("error", reject);
  });
}
/**
 * Split an array into consecutive groups of at most `size` elements.
 *
 * The input array is not modified; every group is a fresh slice. The final
 * group holds the remainder and may be shorter than `size`.
 *
 * @param {Array} arr - Array to split.
 * @param {number} size - Maximum group length; must be a positive integer.
 * @returns {Array<Array>} The groups in original order (empty for an empty input).
 * @throws {RangeError} If `size` is not a positive integer (a size of zero or
 *   less would otherwise never advance the loop).
 */
function chunkArrayInGroups(arr, size) {
  if (!Number.isInteger(size) || size <= 0) {
    throw new RangeError(`size must be a positive integer, got ${size}`);
  }
  const groups = [];
  for (let start = 0; start < arr.length; start += size) {
    groups.push(arr.slice(start, start + size));
  }
  return groups;
}
/**
 * Collect CPI data for every country listed in the countries CSV.
 *
 * Country codes are requested in groups of 70, one group at a time, with a
 * progress line logged before each request and a pause after each one.
 *
 * @returns {Promise<void>} Resolves after the last group has been processed.
 */
async function build() {
  console.info("Collecting CPI data...");
  const countries = await loadCountriesFromCSV(`${pathSrc}/data/countries.csv`);
  const allCodes = Object.keys(countries);
  const batches = chunkArrayInGroups(allCodes, 70);
  const total = batches.length;
  for (const [index, batch] of batches.entries()) {
    console.info(`${index + 1}/${total}`);
    await loadCPIFromRemoteAPI(batch);
    // API limits = 10 requests in 5 second window from one user (IP)
    await delay(500);
  }
}
// Run the collector. Report any failure and exit with a non-zero status
// instead of leaving the returned promise's rejection unhandled.
build().catch((error) => {
  console.error(error);
  process.exitCode = 1;
});