Fix/pipeline/ohlcv ratelimit (#1403)
Use time-based throttling and increase batch size of CC query
This commit is contained in:
@@ -52,9 +52,9 @@
|
||||
"@types/p-limit": "^2.0.0",
|
||||
"async-parallel": "^1.2.3",
|
||||
"axios": "^0.18.0",
|
||||
"bottleneck": "^2.13.2",
|
||||
"dockerode": "^2.5.7",
|
||||
"ethereum-types": "^1.0.6",
|
||||
"p-limit": "^2.0.0",
|
||||
"pg": "^7.5.0",
|
||||
"prettier": "^1.15.3",
|
||||
"ramda": "^0.25.0",
|
||||
|
@@ -1,6 +1,6 @@
|
||||
// tslint:disable:no-duplicate-imports
|
||||
import { fetchAsync } from '@0x/utils';
|
||||
import promiseLimit = require('p-limit');
|
||||
import Bottleneck from 'bottleneck';
|
||||
import { stringify } from 'querystring';
|
||||
import * as R from 'ramda';
|
||||
|
||||
@@ -33,43 +33,41 @@ export interface CryptoCompareOHLCVParams {
|
||||
toTs?: number;
|
||||
}
|
||||
|
||||
const ONE_WEEK = 7 * 24 * 60 * 60 * 1000; // tslint:disable-line:custom-no-magic-numbers
|
||||
const ONE_HOUR = 60 * 60 * 1000; // tslint:disable-line:custom-no-magic-numbers
|
||||
const ONE_SECOND = 1000;
|
||||
const ONE_HOUR_AGO = new Date().getTime() - ONE_HOUR;
|
||||
const HTTP_OK_STATUS = 200;
|
||||
const CRYPTO_COMPARE_VALID_EMPTY_RESPONSE_TYPE = 96;
|
||||
const MAX_PAGE_SIZE = 2000;
|
||||
|
||||
export class CryptoCompareOHLCVSource {
|
||||
public readonly interval = ONE_WEEK; // the hourly API returns data for one week at a time
|
||||
public readonly default_exchange = 'CCCAGG';
|
||||
public readonly intervalBetweenRecords = ONE_HOUR;
|
||||
public readonly defaultExchange = 'CCCAGG';
|
||||
public readonly interval = this.intervalBetweenRecords * MAX_PAGE_SIZE; // the hourly API returns data for one interval at a time
|
||||
private readonly _url: string = 'https://min-api.cryptocompare.com/data/histohour?';
|
||||
|
||||
// rate-limit for all API calls through this class instance
|
||||
private readonly _promiseLimit: (fetchFn: () => Promise<Response>) => Promise<Response>;
|
||||
constructor(maxConcurrentRequests: number = 50) {
|
||||
this._promiseLimit = promiseLimit(maxConcurrentRequests);
|
||||
private readonly _limiter: Bottleneck;
|
||||
constructor(maxReqsPerSecond: number) {
|
||||
this._limiter = new Bottleneck({
|
||||
minTime: ONE_SECOND / maxReqsPerSecond,
|
||||
reservoir: 30,
|
||||
reservoirRefreshAmount: 30,
|
||||
reservoirRefreshInterval: ONE_SECOND,
|
||||
});
|
||||
}
|
||||
|
||||
// gets OHLCV records starting from pair.latest
|
||||
public async getHourlyOHLCVAsync(pair: TradingPair): Promise<CryptoCompareOHLCVRecord[]> {
|
||||
const params = {
|
||||
e: this.default_exchange,
|
||||
e: this.defaultExchange,
|
||||
fsym: pair.fromSymbol,
|
||||
tsym: pair.toSymbol,
|
||||
limit: MAX_PAGE_SIZE,
|
||||
toTs: Math.floor((pair.latestSavedTime + this.interval) / ONE_SECOND), // CryptoCompare uses timestamp in seconds. not ms
|
||||
};
|
||||
const url = this._url + stringify(params);
|
||||
|
||||
// go through the instance-wide rate-limit
|
||||
const fetchPromise: Promise<Response> = this._promiseLimit(() => {
|
||||
// tslint:disable-next-line:no-console
|
||||
console.log(`Scraping Crypto Compare at ${url}`);
|
||||
return fetchAsync(url);
|
||||
});
|
||||
|
||||
const response = await Promise.resolve(fetchPromise);
|
||||
const response = await this._limiter.schedule(() => fetchAsync(url));
|
||||
if (response.status !== HTTP_OK_STATUS) {
|
||||
throw new Error(`HTTP error while scraping Crypto Compare: [${response}]`);
|
||||
}
|
||||
|
@@ -11,7 +11,7 @@ import { fetchOHLCVTradingPairsAsync, TradingPair } from '../utils/get_ohlcv_tra
|
||||
const SOURCE_NAME = 'CryptoCompare';
|
||||
const TWO_HOURS_AGO = new Date().getTime() - 2 * 60 * 60 * 1000; // tslint:disable-line:custom-no-magic-numbers
|
||||
|
||||
const MAX_CONCURRENT_REQUESTS = parseInt(process.env.CRYPTOCOMPARE_MAX_CONCURRENT_REQUESTS || '14', 10); // tslint:disable-line:custom-no-magic-numbers
|
||||
const MAX_REQS_PER_SECOND = parseInt(process.env.CRYPTOCOMPARE_MAX_REQS_PER_SECOND || '15', 10); // tslint:disable-line:custom-no-magic-numbers
|
||||
const EARLIEST_BACKFILL_DATE = process.env.OHLCV_EARLIEST_BACKFILL_DATE || '2014-06-01';
|
||||
const EARLIEST_BACKFILL_TIME = new Date(EARLIEST_BACKFILL_DATE).getTime();
|
||||
|
||||
@@ -20,7 +20,7 @@ let connection: Connection;
|
||||
(async () => {
|
||||
connection = await createConnection(ormConfig as ConnectionOptions);
|
||||
const repository = connection.getRepository(OHLCVExternal);
|
||||
const source = new CryptoCompareOHLCVSource(MAX_CONCURRENT_REQUESTS);
|
||||
const source = new CryptoCompareOHLCVSource(MAX_REQS_PER_SECOND);
|
||||
|
||||
const jobTime = new Date().getTime();
|
||||
const tradingPairs = await fetchOHLCVTradingPairsAsync(connection, SOURCE_NAME, EARLIEST_BACKFILL_TIME);
|
||||
@@ -63,7 +63,7 @@ async function fetchAndSaveAsync(
|
||||
console.log(`Retrieved ${records.length} records for ${JSON.stringify(pair)}`);
|
||||
if (records.length > 0) {
|
||||
const metadata: OHLCVMetadata = {
|
||||
exchange: source.default_exchange,
|
||||
exchange: source.defaultExchange,
|
||||
fromSymbol: pair.fromSymbol,
|
||||
toSymbol: pair.toSymbol,
|
||||
source: SOURCE_NAME,
|
||||
|
@@ -13,7 +13,7 @@ const expect = chai.expect;
|
||||
describe('ohlcv_external data source (Crypto Compare)', () => {
|
||||
describe('generateBackfillIntervals', () => {
|
||||
it('generates pairs with intervals to query', () => {
|
||||
const source = new CryptoCompareOHLCVSource();
|
||||
const source = new CryptoCompareOHLCVSource(20);
|
||||
const pair: TradingPair = {
|
||||
fromSymbol: 'ETH',
|
||||
toSymbol: 'ZRX',
|
||||
@@ -31,7 +31,7 @@ describe('ohlcv_external data source (Crypto Compare)', () => {
|
||||
});
|
||||
|
||||
it('returns single pair if no backfill is needed', () => {
|
||||
const source = new CryptoCompareOHLCVSource();
|
||||
const source = new CryptoCompareOHLCVSource(20);
|
||||
const pair: TradingPair = {
|
||||
fromSymbol: 'ETH',
|
||||
toSymbol: 'ZRX',
|
||||
|
Reference in New Issue
Block a user