// CartoDB-SQL-API/app/controllers/copy_controller.js

'use strict';

// Express middlewares shared by both COPY endpoints.
const userMiddleware = require('../middlewares/user');
const errorMiddleware = require('../middlewares/error');
const authorizationMiddleware = require('../middlewares/authorization');
const connectionParamsMiddleware = require('../middlewares/connection-params');
const timeoutLimitsMiddleware = require('../middlewares/timeout-limits');
const { initializeProfilerMiddleware } = require('../middlewares/profiler');
const rateLimitsMiddleware = require('../middlewares/rate-limit');
const { RATE_LIMIT_ENDPOINTS_GROUPS } = rateLimitsMiddleware;

// Services used by the COPY handlers.
const errorHandlerFactory = require('../services/error_handler_factory');
const StreamCopy = require('../services/stream_copy');
const StreamCopyMetrics = require('../services/stream_copy_metrics');
const Logger = require('../services/logger');

const { Client } = require('pg');
const zlib = require('zlib');

/**
 * Controller exposing the `copyfrom` / `copyto` endpoints.
 *
 * Stores its collaborators on the instance and creates a logger from
 * `global.settings.dataIngestionLogPath` under the name 'data-ingestion'.
 *
 * @param {Object} metadataBackend - handed to the user, authorization and timeout middlewares.
 * @param {Object} userDatabaseService - handed to the connection-params middleware.
 * @param {Object} userLimitsService - handed to the rate-limit middleware.
 * @param {Object} statsClient - stored on the instance; not used by the code visible in this file.
 */
function CopyController(metadataBackend, userDatabaseService, userLimitsService, statsClient) {
    this.metadataBackend = metadataBackend;
    this.userDatabaseService = userDatabaseService;
    this.userLimitsService = userLimitsService;
    this.statsClient = statsClient;

    this.logger = new Logger(global.settings.dataIngestionLogPath, 'data-ingestion');
}
/**
 * Registers the COPY endpoints on the given Express app:
 *   POST `${base_url}/sql/copyfrom`
 *   GET  `${base_url}/sql/copyto`
 *
 * @param {Object} app - Express application (only `post` and `get` are used).
 */
CopyController.prototype.route = function (app) {
    const { base_url } = global.settings;

    // Both endpoints run the same middleware pipeline; only the profiler label,
    // the rate-limit group and the final COPY handler differ.
    const copyMiddlewares = (profilerLabel, endpointGroup, copyHandlerFactory) => {
        return [
            initializeProfilerMiddleware(profilerLabel),
            userMiddleware(this.metadataBackend),
            rateLimitsMiddleware(this.userLimitsService, endpointGroup),
            authorizationMiddleware(this.metadataBackend),
            connectionParamsMiddleware(this.userDatabaseService),
            timeoutLimitsMiddleware(this.metadataBackend),
            validateCopyQuery(),
            copyHandlerFactory(this.logger),
            errorHandler(),
            errorMiddleware()
        ];
    };

    app.post(
        `${base_url}/sql/copyfrom`,
        copyMiddlewares('copyfrom', RATE_LIMIT_ENDPOINTS_GROUPS.COPY_FROM, handleCopyFrom)
    );
    app.get(
        `${base_url}/sql/copyto`,
        copyMiddlewares('copyto', RATE_LIMIT_ENDPOINTS_GROUPS.COPY_TO, handleCopyTo)
    );
};
/**
 * Builds the middleware serving `copyto`: the stream handed over by
 * `StreamCopy#to` is piped into the HTTP response as a file attachment.
 *
 * @param {Object} logger - passed through to `StreamCopyMetrics`.
 * @returns {Function} Express middleware `(req, res, next)`.
 */
function handleCopyTo (logger) {
    return function handleCopyToMiddleware (req, res, next) {
        const sql = req.query.q;
        const { userDbParams, user } = res.locals;
        const filename = req.query.filename || 'carto-sql-copyto.dmp';

        const streamCopy = new StreamCopy(sql, userDbParams);
        const metrics = new StreamCopyMetrics(logger, 'copyto', sql, user);

        res.header("Content-Disposition", `attachment; filename=${encodeURIComponent(filename)}`);
        res.header("Content-Type", "application/octet-stream");

        streamCopy.on('copy-to-end', rows => {
            metrics.end(rows);
        });

        streamCopy.to(
            function (err, pgstream, client, done) {
                if (err) {
                    return next(err);
                }

                let responseEnded = false;
                let failed = false;

                const markResponseEnded = () => {
                    responseEnded = true;
                };

                // 'error' may be followed by 'close'; run the teardown only once so the
                // client is not released twice and next() is not called twice.
                const failOnce = teardown => {
                    if (failed) {
                        return;
                    }
                    failed = true;
                    teardown();
                };

                res
                    .on('error', err => failOnce(() => {
                        metrics.end(null, err);
                        pgstream.unpipe(res);
                        done();
                        next(err);
                    }))
                    .on('close', () => {
                        if (responseEnded) {
                            return;
                        }

                        failOnce(() => {
                            streamCopy.setConnectionClosedByClient(true);

                            // Cancel the running COPY TO query
                            // See https://www.postgresql.org/docs/9.5/static/protocol-flow.html#PROTOCOL-COPY
                            const runningClient = client;
                            const cancelingClient = new Client(runningClient.connectionParameters);
                            cancelingClient.cancel(runningClient, pgstream);

                            const err = new Error('Connection closed by client');
                            metrics.end(null, err);
                            pgstream.unpipe(res);
                            // see https://node-postgres.com/api/pool#releasecallback
                            done(err);
                            next(err);
                        });
                    })
                    // A writable response signals completion with 'finish'; 'end' is kept
                    // for response-like objects that emit it.
                    .on('finish', markResponseEnded)
                    .on('end', markResponseEnded);

                pgstream
                    .on('data', data => metrics.addSize(data.length))
                    .pipe(res);
            }
        );
    };
}
/**
 * Builds the middleware serving `copyfrom`: the request body (gunzipped when
 * `content-encoding` is exactly 'gzip') is piped into the stream handed over by
 * `StreamCopy#from`. On 'copy-from-end' it responds with `{ time, total_rows }`.
 *
 * @param {Object} logger - passed through to `StreamCopyMetrics`.
 * @returns {Function} Express middleware `(req, res, next)`.
 */
function handleCopyFrom (logger) {
    return function handleCopyFromMiddleware (req, res, next) {
        const sql = req.query.q;
        const { userDbParams, user } = res.locals;
        const isGzip = req.get('content-encoding') === 'gzip';

        const streamCopy = new StreamCopy(sql, userDbParams);
        const metrics = new StreamCopyMetrics(logger, 'copyfrom', sql, user, isGzip);

        streamCopy.on('copy-from-end', rows => {
            metrics.end(rows);

            const { time } = metrics;
            if (!time || !rows) {
                return next(new Error("No rows copied"));
            }

            res.send({
                time,
                total_rows: rows
            });
        });

        streamCopy.from(
            function (err, pgstream, client, done) {
                if (err) {
                    return next(err);
                }

                const gunzip = isGzip ? zlib.createGunzip() : null;
                // The stream that is actually piped into pgstream; this is the one
                // that has to be unpiped on failure.
                const source = gunzip || req;

                let requestEnded = false;
                let failed = false;

                // Several failure events can fire for one request (e.g. 'error' then
                // 'close'); release the client and call next() only once.
                const failOnce = (err, stopCopy) => {
                    if (failed) {
                        return;
                    }
                    failed = true;
                    metrics.end(null, err);
                    stopCopy();
                    done();
                    next(err);
                };

                // Sends CopyFail with the given message and detaches the source.
                const abortCopy = message => () => {
                    const connection = client.connection;
                    connection.sendCopyFail(message);
                    source.unpipe(pgstream);
                };

                req
                    .on('error', err => failOnce(err, () => {
                        source.unpipe(pgstream);
                        pgstream.end();
                    }))
                    .on('close', () => {
                        if (!requestEnded) {
                            failOnce(
                                new Error('Connection closed by client'),
                                abortCopy('CARTO SQL API: Connection closed by client')
                            );
                        }
                    })
                    .on('data', data => {
                        if (isGzip) {
                            metrics.addGzipSize(data.length);
                        } else {
                            metrics.addSize(data.length);
                        }
                    })
                    .on('end', () => {
                        requestEnded = true;
                    });

                if (gunzip) {
                    gunzip
                        // Without a listener, a malformed gzip body would raise an
                        // unhandled 'error' event on the gunzip stream.
                        .on('error', err => failOnce(err, abortCopy('CARTO SQL API: Invalid gzip data')))
                        .on('data', data => metrics.addSize(data.length));

                    req.pipe(gunzip).pipe(pgstream);
                } else {
                    req.pipe(pgstream);
                }
            }
        );
    };
}
/**
 * Builds a middleware that validates the `q` query parameter before a COPY
 * handler runs.
 *
 * Calls `next(Error("SQL is missing"))` when `q` is absent or empty, and
 * `next(Error("SQL must start with COPY"))` when `q` is not a string that
 * starts (case-insensitively) with "COPY ". Otherwise calls `next()`.
 *
 * @returns {Function} Express middleware `(req, res, next)`.
 */
function validateCopyQuery () {
    return function validateCopyQueryMiddleware (req, res, next) {
        const sql = req.query.q;

        if (!sql) {
            return next(new Error("SQL is missing"));
        }

        // `q` is not guaranteed to be a string (a repeated `q=` parameter may be
        // parsed into an array); reject it instead of throwing on toUpperCase().
        if (typeof sql !== 'string' || !sql.toUpperCase().startsWith("COPY ")) {
            return next(new Error("SQL must start with COPY"));
        }

        next();
    };
}
/**
 * Builds the error middleware placed right after the COPY handlers.
 *
 * If the response headers were already sent, the error is logged, the JSON
 * response produced by `errorHandlerFactory(err).getResponse()` is written to
 * the response body, and the response is ended. Otherwise the error is
 * forwarded with `next(err)`.
 *
 * @returns {Function} Express error middleware `(err, req, res, next)`.
 */
function errorHandler () {
    return function errorHandlerMiddleware (err, req, res, next) {
        if (!res.headersSent) {
            return next(err);
        }

        // Fall back to the error itself when it carries no stack trace.
        console.error("EXCEPTION REPORT: " + (err.stack || err));

        const handler = errorHandlerFactory(err);
        res.write(JSON.stringify(handler.getResponse()));
        res.end();
    };
}
// The controller constructor is the module's only export.
module.exports = CopyController;