- Recipes
- Github repository files to Dremio
Connect Github repository files and Dremio in our serverless environment
Use this template to get files from a GitHub repository and use them to insert data into Dremio.
Share
Get files from Github repository
Used integrations:
- JavaScript
- Python
/**
 * Source step that reads a path of a GitHub repository and publishes one
 * item per file found, descending into subdirectories.
 *
 * Each published item has the shape `{ path, content }`, where `content` is
 * whatever the "raw" media type request returned for that file.
 */
class GithubSourceRepositoryFiles {
  /**
   * Creates the GitHub client and stores the repository coordinates.
   */
  async init() {
    // TODO: Create your github credential
    // More info at https://yepcode.io/docs/integrations/github/#credential-configuration
    this.github = yepcode.integration.github("your-github-credential-name");
    // TODO: Customize the repo name and owner
    this.repositoryOwner = "your-github-username";
    this.repositoryName = "your-repository-name";
  }

  /**
   * Publishes every file under the configured path, then signals completion.
   *
   * @param {Function} publish - Called once per file with `{ path, content }`.
   * @param {Function} done - Called with no arguments after the walk finishes.
   */
  async fetch(publish, done) {
    // TODO: Customize the path you want to obtain all files in it and its subdirectories (if has)
    // It can also be a file path to only obtain one file
    // If you pass undefined you will obtain the entire repository content
    await this._publishPathContent("/path-in-repo", publish);
    done();
  }

  // Self-contained type checks: the class no longer depends on external
  // `isString` / `isObject` helpers being in scope.
  // A file requested with the "raw" media type is handled as a string body.
  _isFileContent = (data) => typeof data === "string";

  // A directory listing is iterated with `for...of`, so only arrays qualify;
  // any other object falls through to the "unexpected data" branch instead of
  // throwing a "not iterable" TypeError.
  _isDirectoryInfo = (data) => Array.isArray(data);

  /**
   * Requests `path` from the repository and publishes it. When the response
   * is a directory listing, recurses into every entry sequentially.
   *
   * @param {string|undefined} path - Repository path of a file or directory.
   * @param {Function} publishCallback - Receives `{ path, content }` per file.
   * @returns {Promise<void>}
   */
  _publishPathContent = async (path, publishCallback) => {
    // More info of this request at: https://docs.github.com/en/rest/repos/contents#get-repository-content
    const response = await this.github.rest.repos.getContent({
      mediaType: {
        format: "raw",
      },
      owner: this.repositoryOwner,
      repo: this.repositoryName,
      path: path,
    });
    const { data } = response;

    if (this._isFileContent(data)) {
      // TODO: Customize the item to publish for each file in the repository
      publishCallback({
        path,
        content: data,
      });
      return;
    }

    if (this._isDirectoryInfo(data)) {
      for (const directoryEntry of data) {
        await this._publishPathContent(directoryEntry.path, publishCallback);
      }
      return;
    }

    console.error("Unexpected data type: ", response.headers["content-type"]);
  };

  /** No resources to release. */
  async close() {}
}
Coming soon
We are releasing new Python recipes every week
Do you need help solving this integration with YepCode?
Let's talk
Insert data in Dremio
Used integrations:
- JavaScript
- Python
/**
 * Target step that inserts one row into Dremio per consumed item by
 * submitting an INSERT statement and polling the resulting job until it
 * reaches a final state.
 */
class HttpTargetDremioInsert {
  // Milliseconds to wait between two job-status requests, so the polling
  // loop does not send requests back to back.
  pollIntervalMs = 1000;

  /**
   * Creates the HTTP client used for every Dremio request.
   */
  async init() {
    // TODO: Create your http credential with dremio information:
    // More info at https://yepcode.io/docs/integrations/http/#credential-configuration
    // Official docs: https://docs.dremio.com/current/reference/api/
    this.httpClient = yepcode.integration.http("your-dremio-credential-name");
  }

  /**
   * Renders a JavaScript value as a SQL literal so it can be embedded in the
   * statement text: nullish -> NULL, finite numbers/bigints verbatim,
   * booleans -> TRUE/FALSE, anything else as a single-quoted string with
   * embedded single quotes doubled.
   *
   * @param {*} value - Value to embed.
   * @returns {string} SQL literal text.
   */
  _toSqlLiteral(value) {
    if (value === null || value === undefined) {
      return "NULL";
    }
    if (typeof value === "number" && Number.isFinite(value)) {
      return String(value);
    }
    if (typeof value === "bigint") {
      return value.toString();
    }
    if (typeof value === "boolean") {
      return value ? "TRUE" : "FALSE";
    }
    return `'${String(value).replace(/'/g, "''")}'`;
  }

  /**
   * Inserts `item` as a row and logs the final outcome of the Dremio job.
   *
   * @param {{id: *, name: *}} item - Item to insert; `id` and `name` are the
   *   two column values of the sample statement.
   * @returns {Promise<void>}
   */
  async consume(item) {
    const projectId = "<your-dremio-project-id>";
    // TODO: Map your item to row and customize INSERT statement
    // More info at https://docs.dremio.com/cloud/reference/sql/commands/insert/
    const idLiteral = this._toSqlLiteral(item.id);
    const nameLiteral = this._toSqlLiteral(item.name);
    const query = `INSERT INTO your_source_path.your_table VALUES (${idLiteral}, ${nameLiteral})`;

    // Use the SQL API to submit queries. The response contains the ID for the job associated with the SQL query
    // Official docs: https://docs.dremio.com/cloud/reference/api/sql
    const { data: job } = await this.httpClient.post(`${projectId}/sql`, {
      sql: query,
    });

    // Use the Job API to check the job status. Jobs final status are COMPLETED, FAILED and CANCELED
    // Official docs: https://docs.dremio.com/cloud/reference/api/job/
    const finalJobStates = ["COMPLETED", "FAILED", "CANCELED"];
    // Built from the same local `projectId` used for the SQL request
    // (there is no `this.projectId` on this class).
    const jobUrl = `${projectId}/job/${job.id}`;
    let jobInfoResponse = await this.httpClient.get(jobUrl);
    while (!finalJobStates.includes(jobInfoResponse.data.jobState)) {
      await new Promise((resolve) => setTimeout(resolve, this.pollIntervalMs));
      jobInfoResponse = await this.httpClient.get(jobUrl);
    }

    const { data: jobInfo } = jobInfoResponse;
    if (jobInfo.jobState === "COMPLETED") {
      console.log("Success!!");
    } else if (jobInfo.jobState === "FAILED") {
      console.log(`Uups! Something was wrong: ${jobInfo.errorMessage}`);
    } else {
      console.log(`The job's been cancelled: ${jobInfo.cancellationReason}`);
    }
  }

  /** No resources to release. */
  async close() {}
}
class HttpTargetDremioInsert:
    """Target step that inserts one row into Dremio per consumed item.

    Submits an INSERT statement through the SQL API, then polls the Job API
    until the job reaches a final state and prints the outcome.
    """

    # Seconds to wait between two job-status requests, so the polling loop
    # does not send requests back to back.
    poll_interval_seconds = 1

    def setup(self):
        """Create the HTTP session used for every Dremio request."""
        ## TODO: Create your http credential with dremio information
        ## More info at https://yepcode.io/docs/integrations/http/#credential-configuration
        ## Official docs: https://docs.dremio.com/cloud/reference/api/
        self.session = yepcode.integration.http(
            "your-dremio-credential-name"
        )

    @staticmethod
    def _to_sql_literal(value):
        """Render a Python value as SQL literal text.

        None -> NULL, booleans -> TRUE/FALSE, ints/floats verbatim, anything
        else as a single-quoted string with embedded single quotes doubled.
        """
        if value is None:
            return "NULL"
        # bool is checked before int because bool is a subclass of int.
        if isinstance(value, bool):
            return "TRUE" if value else "FALSE"
        if isinstance(value, (int, float)):
            return str(value)
        return "'" + str(value).replace("'", "''") + "'"

    def consume(self, item, done):
        """Insert ``item`` as a row, report the job outcome, then call ``done``.

        This is a plain function (no ``yield``), so its body runs when it is
        called and ``done()`` is always reached once the job is final.

        Args:
            item: object exposing ``id`` and ``name`` attributes, the two
                column values of the sample statement.
            done: zero-argument callback invoked after the job has finished.
        """
        import time

        ## TODO: Customize your insert query
        id_literal = self._to_sql_literal(item.id)
        name_literal = self._to_sql_literal(item.name)
        query = f'INSERT INTO your_source_path.table_name VALUES ({id_literal}, {name_literal})'

        ## Use the SQL API to submit queries. The response contains the ID for the job associated with the SQL query
        ## Official docs: https://docs.dremio.com/cloud/reference/api/sql
        project_id = "<your-dremio-project-id>"
        query_response = self.session.post(
            f"{project_id}/sql",
            json={"sql": query}
        )
        job_id = query_response.json()['id']

        ## Use the Job API to check the job status. Jobs final status are COMPLETED, FAILED and CANCELED
        ## Official docs: https://docs.dremio.com/cloud/reference/api/job/
        FINAL_JOB_STATES = ['COMPLETED', 'FAILED', 'CANCELED']
        job_info_response = self.session.get(f"{project_id}/job/{job_id}")
        job_state = job_info_response.json()['jobState']
        while job_state not in FINAL_JOB_STATES:
            time.sleep(self.poll_interval_seconds)
            job_info_response = self.session.get(f"{project_id}/job/{job_id}")
            job_state = job_info_response.json()['jobState']

        if job_state == 'COMPLETED':
            print("The query has been completed")
        elif job_state == 'FAILED':
            print(f"Uups! Something was wrong: {job_info_response.json()['errorMessage']}")
        else:
            print(f"The job's been cancelled: {job_info_response.json()['cancellationReason']}")
        done()

    def close(self):
        """No resources to release."""
        pass
FAQs
YepCode is a SaaS platform that enables the creation, execution and monitoring of integrations and automations using source code in a serverless environment.
We like to call it the Zapier for developers, since we bring all the agility and benefits of NoCode tools (avoid server provisioning, environment configuration, deployments,...), but with all the power of being able to use a programming language like JavaScript or Python.
These recipes are an excellent starting point for creating your own YepCode processes and solving complex integration and automation problems.
You only have to complete the sign up form and your account will be created with our FREE plan (no credit card required).
YepCode has been created with a clear enterprise focus, offering a multi-tenant environment, team management capabilities, high security and auditing standards, Identity Provider (IdP) integrations, and on-premise options. It serves as the Swiss army knife for engineering teams, especially those requiring the extraction or transmission of information to external systems. It excels in scenarios demanding flexibility and adaptability to change within the process.
Sure! You only need to configure YepCode servers to establish a connection with that service. Check our docs page to get more information.