- Recipes
- AWS Redshift to Dremio
Connect AWS Redshift and Dremio in our serverless environment
Use this template to read rows from an AWS Redshift table and use them to insert data into Dremio.
Share
Read rows from AWS Redshift table
Used integrations:
JavaScript
Python
/**
 * Source step that runs a SQL statement through the Redshift Data API and
 * publishes every record of the statement result.
 */
class AwsRedshiftSourceSelect {
  /**
   * Creates the Redshift client, submits the statement and waits until the
   * statement has finished.
   */
  async init() {
    // TODO: Create your aws-redshift credential
    // More info at https://yepcode.io/docs/integrations/aws-redshift/#credential-configuration
    this.awsRedshift = yepcode.integration.awsRedshift(
      "your-aws-redshift-credential-name"
    );
    // TODO: Customize the command to be executed
    // More info at https://docs.aws.amazon.com/AWSJavaScriptSDK/v3/latest/clients/client-redshift-data/interfaces/executestatementcommandinput.html
    const { Id } = await this.awsRedshift.send(
      new ExecuteStatementCommand({
        ClusterIdentifier: "your-cluster-identifier",
        Database: "your-database-name",
        DbUser: "your-database-user",
        Sql: "SELECT * FROM your-table-name;",
      })
    );
    // The statement id is needed later to poll the status and fetch the result
    this.statementId = Id;
    await this._awaitStatementToFinish();
  }

  /**
   * Publishes one item per record of the statement result.
   *
   * @param {Function} publish - called (and awaited) once per item
   * @param {Function} done - called once after all pages have been published
   */
  async fetch(publish, done) {
    let nextToken;
    // If the result is returned paginated, iterate to publish the entire statement result
    do {
      const result = await this.awsRedshift.send(
        new GetStatementResultCommand({
          Id: this.statementId,
          NextToken: nextToken,
        })
      );
      nextToken = result.NextToken;
      // Guard against a page without a Records list
      for (const record of result.Records || []) {
        // Each record comes as a list of record cells
        // More info at https://docs.aws.amazon.com/AWSJavaScriptSDK/v3/latest/clients/client-redshift-data/interfaces/getstatementresultcommandoutput.html
        // TODO: Customize record columns mapping to the item that will be published
        const item = {
          id: record.id,
          ...record
        };
        await publish(item);
      }
    } while (nextToken);
    done();
  }

  async close() {}

  /**
   * Polls the statement status until it reaches a final state.
   *
   * Polling is sequential (one request at a time), so an error thrown by
   * `send` rejects the returned promise instead of being lost inside a timer
   * callback.
   *
   * @param {number} [pollIntervalMs=1000] - pause between two status checks
   * @returns {Promise<void>} resolves when the status is FINISHED
   * @throws {Error} when the status is FAILED or ABORTED
   */
  async _awaitStatementToFinish(pollIntervalMs = 1000) {
    const describeStatementCommand = new DescribeStatementCommand({
      Id: this.statementId,
    });
    for (;;) {
      const result = await this.awsRedshift.send(describeStatementCommand);
      if (result.Status === "FINISHED") {
        return;
      }
      if (result.Status === "FAILED" || result.Status === "ABORTED") {
        const detail = result.Error ? `: ${result.Error}` : "";
        throw new Error(
          `Statement ${this.statementId} ended with status ${result.Status}${detail}`
        );
      }
      // Not finished yet: wait before asking again
      await new Promise((resolve) => setTimeout(resolve, pollIntervalMs));
    }
  }
}
import time
class AwsRedshiftSourceSelect:
    """Source step that runs a SQL statement through the Redshift Data API
    and yields every record of the statement result."""

    def setup(self):
        """Create the client, submit the statement and wait until it finishes."""
        # TODO: Create your Redshift credential:
        # More info at https://yepcode.io/docs/integrations/aws-redshift/#credential-configuration
        self.aws_redshift_client = yepcode.integration.awsRedshift(
            "your-redshift-credential-name"
        )
        # TODO: Customize your cluster id, database name, user and sql query
        # See all supported params in: https://boto3.amazonaws.com/v1/documentation/api/latest/reference/services/redshift-data/client/execute_statement.html
        response = self.aws_redshift_client.execute_statement(
            ClusterIdentifier="cluster-name",
            Database="db-name",
            DbUser="db-user",
            Sql="SELECT * FROM your-table-name"
        )
        # The statement id is needed later to poll the status and fetch the result
        self.statement_id = response.get("Id")
        self._await_statement_to_finish()

    def generator(self):
        """Yield every record of the statement result, page by page.

        The result may be paginated; each response's ``NextToken`` is passed
        to the next request until no token is returned.
        """
        # More info at https://boto3.amazonaws.com/v1/documentation/api/latest/reference/services/redshift-data/client/get_statement_result.html
        request = {"Id": self.statement_id}
        while True:
            response = self.aws_redshift_client.get_statement_result(**request)
            yield from response.get("Records") or []
            next_token = response.get("NextToken")
            if not next_token:
                return
            # Only send NextToken when there actually is one
            request["NextToken"] = next_token

    def _await_statement_to_finish(self):
        """Poll the statement status once per second until it is final.

        Returns when the status is FINISHED.

        Raises:
            Exception: when the status is FAILED or ABORTED.
        """
        while True:
            response = self.aws_redshift_client.describe_statement(
                Id=self.statement_id
            )
            status = response["Status"]
            if status == "FINISHED":
                return
            if status in ("FAILED", "ABORTED"):
                error = response.get("Error")
                detail = f" ({error})" if error else ""
                raise Exception(f"Statement failed with status: {status}{detail}")
            time.sleep(1)

    def close(self):
        """Nothing to release."""
        pass
Do you need help solving this integration with YepCode?
Let's talk
Insert data in Dremio
Used integrations:
JavaScript
Python
/**
 * Target step that inserts each consumed item into Dremio by submitting an
 * INSERT statement through the SQL API and polling the resulting job.
 */
class HttpTargetDremioInsert {
  /**
   * Creates the HTTP client from the configured credential.
   */
  async init() {
    // TODO: Create your http credential with dremio information:
    // More info at https://yepcode.io/docs/integrations/http/#credential-configuration
    // Official docs: https://docs.dremio.com/current/reference/api/
    this.dremio = await yepcode.integration.http(
      "your-dremio-credential-name"
    );
  }

  /**
   * Submits an INSERT for the item and waits until the job reaches a final
   * state, logging the outcome.
   *
   * @param {object} item - item to insert; `item.id` and `item.name` are read
   */
  async consume(item) {
    const projectId = "<your-dremio-project-id>";
    const pollIntervalMs = 1000;
    // TODO: Map your item to row and customize INSERT statement
    // More info at https://docs.dremio.com/cloud/reference/sql/commands/insert/
    // NOTE(review): values are interpolated into the SQL text as-is; quote and
    // escape them when they can contain strings or untrusted data.
    const query = `INSERT INTO your_source_path.your_table VALUES (${item.id}, ${item.name})`;
    // Use the SQL API to submit queries. The response contains the ID for the job associated with the SQL query
    // Official docs: https://docs.dremio.com/cloud/reference/api/sql
    const { data: job } = await this.dremio.post(`${projectId}/sql`, {
      sql: query,
    });
    // Use the Job API to check the job status. Jobs final status are COMPLETED, FAILED and CANCELED
    // Official docs: https://docs.dremio.com/cloud/reference/api/job/
    const finalJobStates = ["COMPLETED", "FAILED", "CANCELED"];
    // The job URL must use the same project id as the SQL request
    const jobUrl = `${projectId}/job/${job.id}`;
    let jobInfoResponse = await this.dremio.get(jobUrl);
    while (!finalJobStates.includes(jobInfoResponse.data.jobState)) {
      // Pause between checks instead of polling in a tight loop
      await new Promise((resolve) => setTimeout(resolve, pollIntervalMs));
      jobInfoResponse = await this.dremio.get(jobUrl);
    }
    const { data: jobInfo } = jobInfoResponse;
    if (jobInfo.jobState === "COMPLETED") {
      console.log("Success!!");
    } else if (jobInfo.jobState === "FAILED") {
      console.log(`Uups! Something was wrong: ${jobInfo.errorMessage}`);
    } else {
      console.log(
        `The job's been cancelled: ${jobInfo.cancellationReason}`
      );
    }
  }

  async close() {}
}
class HttpTargetDremioInsert:
    """Target step that inserts each consumed item into Dremio by submitting
    an INSERT statement through the SQL API and polling the resulting job."""

    # Seconds to wait between two job status checks
    POLL_INTERVAL_SECONDS = 1

    def setup(self):
        """Create the HTTP client from the configured credential."""
        ## TODO: Create your http credential with dremio information
        ## More info at https://yepcode.io/docs/integrations/http/#credential-configuration
        ## Official docs: https://docs.dremio.com/cloud/reference/api/
        self.dremio = yepcode.integration.http(
            "your-dremio-credential-name"
        )

    def consume(self, item, done):
        """Insert one item and wait for the job to reach a final state.

        This is a plain method, not a generator: the outcome is printed and
        ``done`` is called once the job is final.

        Args:
            item: object to insert; ``item.id`` and ``item.name`` are read.
            done: callback invoked with no arguments when processing ends.
        """
        import time  # local import keeps this snippet self-contained

        ## TODO: Map your item to row and customize the INSERT statement
        ## NOTE(review): values are interpolated into the SQL text as-is; quote
        ## and escape them when they can contain strings or untrusted data.
        query = f'INSERT INTO your_source_path.table_name VALUES ({item.id}, {item.name})'
        ## Use the SQL API to submit queries. The response contains the ID for the job associated with the SQL query
        ## Official docs: https://docs.dremio.com/cloud/reference/api/sql
        project_id = "<your-dremio-project-id>"
        query_response = self.dremio.post(
            f"{project_id}/sql",
            json={"sql": query}
        )
        job_id = query_response.json()['id']
        ## Use the Job API to check the job status. Jobs final status are COMPLETED, FAILED and CANCELED
        ## Official docs: https://docs.dremio.com/cloud/reference/api/job/
        final_job_states = ('COMPLETED', 'FAILED', 'CANCELED')
        while True:
            job_info = self.dremio.get(f"{project_id}/job/{job_id}").json()
            job_state = job_info['jobState']
            if job_state in final_job_states:
                break
            # Pause between checks instead of polling in a tight loop
            time.sleep(self.POLL_INTERVAL_SECONDS)
        if job_state == 'COMPLETED':
            print("The query has been completed")
        elif job_state == 'FAILED':
            print(f"Uups! Something was wrong: {job_info.get('errorMessage')}")
        else:
            print(f"The job's been cancelled: {job_info.get('cancellationReason')}")
        done()

    def close(self):
        """Nothing to release."""
        pass
FAQs
YepCode is a SaaS platform that allows you to create, execute and monitor integrations and automations using source code in a serverless environment.
We like to call it the Zapier for developers, since we bring all the agility and benefits of NoCode tools (avoid server provisioning, environment configuration, deployments,...), but with all the power of being able to use a programming language like JavaScript or Python.
These recipes are a good starting point for you to build your own YepCode processes and solve your integration and automation problems.
You only have to fill the sign up form and your account will be created with our FREE plan (no credit card required).
YepCode has been created with a clear enterprise approach (multi-tenant environment, team management, high security and auditing standards, IdP integrations, on-premise options,...) so we can be the Swiss army knife for any engineering team, especially those that need to extract information from or send it to external systems, and where a certain dynamism or adaptation to change is necessary in that process.
Sure! You just need to do some configuration to allow YepCode servers to connect to that service. Check our docs page to get more information.