athena-client - a simple aws athena client for nodejs and typescript
This is version 2.x document. 1.x document is here
Install with:
npm install athena-client
Usage Example
Create Client
var clientConfig = {
bucketUri: 's3://xxxx'
}
var awsConfig = {
region: 'xxxx',
}
var athena = require("athena-client")
var client = athena.createClient(clientConfig, awsConfig)
Receive result by Callback
client.execute('SELECT 1', function(err, data) {
if (err) {
return console.error(err)
}
console.log(data)
})
Receive result by Promise
client.execute('SELECT 1').toPromise()
.then(function(data) {
console.log(data)
}).catch(function(err) {
console.error(err)
})
Receive result by Stream
var stream = client.execute('SELECT 1').toStream()
stream.on('data', (record) => {
console.log(record)
})
stream.on('query_end', (queryExecution) => {
console.log(queryExecution)
})
stream.on('end', () => {
console.log('end')
})
stream.on('error', (e) => {
console.error(e)
})
API
athena = require("athena-client")
This module exposes the createClient
method, which execute query to AWS Athena
client = athena.createClient([clientConfig], [awsConfig])
Returns a client instance attached to the account specified by the given clientConfig and awsConfig.
clientConfig
object properties
Property | Default | Description |
---|
bucketUri | Required | URI of S3 bucket for saving a query results file(.csv) and a metadata file (.csv.metadata) |
pollingInterval | 1000 | Interval of polling sql results (ms) |
queryTimeout | 0 | Timeout of query execution. 0 is no timeout |
concurrentExecMax | 5 | The number of cuncurrent execution of query max. It should be set smaller than AWS Service limit (default is 5) |
maxBufferSize | '128M' | Maximum buffer when retrieving query results |
awsConfig
object properties
Property | Default | Description |
---|
region | Required | Your Athena and S3 region |
accessKeyId | undifined | Your IAM accessKeyId. This is optional |
secretAccessKey | undifined | Your IAM secretAccessKey. This is optional |
client.execute([query], [callback])
It will return the following result.
If you want to know more about params of queryExecution
, please refer to the aws-sdk document
{
"records": [
{"_col0:": "1"}
],
"queryExecution": {
"Query": "SELECT 1",
"QueryExecutionId": "55571bb9-8e4e-4274-90b7-8cffe4539c3c",
"ResultConfiguration": {
"OutputLocation": "s3://bucket/55571bb9-8e4e-4274-90b7-8cffe4539c3c"
},
"Statistics": {
"DataScannedInBytes": 0,
"EngineExecutionTimeInMillis": 137
},
"Status": {
"CompletionDateTime": "2017-12-31T16:03:53.493Z",
"State": "SUCCEEDED",
"SubmissionDateTime": "2017-12-31T16:03:53.209Z"
}
}
}
client.execute([query]).toPromise()
It will return promise object to get result.
client.execute([query]).toStream()
It will return stream object to get result. If your query results are very large
, we recommend using this stream.
stream.on('data', (record) => {
console.log(record)
})
stream.on('query_end', (queryExecution) => {
console.log(queryExecution)
})
stream.on('end', () => {
console.log('end')
})
stream.on('error', (e) => {
console.error(e)
})