gorealis/realis.go

357 lines
12 KiB
Go
Raw Normal View History

2016-08-02 11:42:00 -07:00
/**
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
2016-08-02 11:42:00 -07:00
// Package realis provides a client for communicating with Apache Aurora through its Thrift API.
package realis
import (
"encoding/base64"
"fmt"
"git.apache.org/thrift.git/lib/go/thrift"
"github.com/pkg/errors"
"github.com/rdelval/gorealis/gen-go/apache/aurora"
"github.com/rdelval/gorealis/response"
2016-08-02 11:42:00 -07:00
"net/http"
"net/http/cookiejar"
"os"
"time"
)
type Realis interface {
AbortJobUpdate(updateKey aurora.JobUpdateKey, message string) (*aurora.Response, error)
AddInstances(instKey aurora.InstanceKey, count int32) (*aurora.Response, error)
CreateJob(auroraJob Job) (*aurora.Response, error)
DescheduleCronJob(key *aurora.JobKey) (*aurora.Response, error)
2016-11-15 22:24:07 -08:00
GetTaskStatus(query *aurora.TaskQuery)([]*aurora.ScheduledTask, error)
FetchTaskConfig(instKey aurora.InstanceKey) (*aurora.TaskConfig, error)
GetInstanceIds(key *aurora.JobKey, states map[aurora.ScheduleStatus]bool) (map[int32]bool, error)
JobUpdateDetails(updateQuery aurora.JobUpdateQuery) (*aurora.Response, error)
KillJob(key *aurora.JobKey) (*aurora.Response, error)
KillInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error)
RestartInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error)
RestartJob(key *aurora.JobKey) (*aurora.Response, error)
RollbackJobUpdate(key aurora.JobUpdateKey, message string) (*aurora.Response, error)
ScheduleCronJob(auroraJob Job) (*aurora.Response, error)
StartJobUpdate(updateJob *UpdateJob, message string) (*aurora.Response, error)
StartCronJob(key *aurora.JobKey) (*aurora.Response, error)
Close()
}
type realisClient struct {
2016-08-02 11:42:00 -07:00
client *aurora.AuroraSchedulerManagerClient
}
// Wrap object to provide future flexibility
type RealisConfig struct {
transport thrift.TTransport
protoFactory thrift.TProtocolFactory
2016-08-02 11:42:00 -07:00
}
// Create a new Client with a default transport layer
func NewClient(config RealisConfig) Realis {
return realisClient{
client: aurora.NewAuroraSchedulerManagerClientFactory(config.transport, config.protoFactory)}
2016-08-02 11:42:00 -07:00
}
// Create a default configuration of the transport layer, requires a URL to test connection with.
2016-11-14 13:27:25 -08:00
func NewDefaultConfig(url string, timeoutms int) (RealisConfig, error) {
2016-08-02 11:42:00 -07:00
jar, err := cookiejar.New(nil)
if err != nil {
return RealisConfig{}, errors.Wrap(err, "Error creating Cookie Jar")
2016-08-02 11:42:00 -07:00
}
//Custom client to timeout after 10 seconds to avoid hanging
trans, err := thrift.NewTHttpPostClientWithOptions(url+"/api",
2016-11-14 13:27:25 -08:00
thrift.THttpClientOptions{Client: &http.Client{Timeout: time.Millisecond * time.Duration(timeoutms), Jar: jar}})
2016-08-02 11:42:00 -07:00
if err != nil {
return RealisConfig{}, errors.Wrap(err, "Error creating transport")
2016-08-02 11:42:00 -07:00
}
if err := trans.Open(); err != nil {
fmt.Fprintln(os.Stderr)
return RealisConfig{}, errors.Wrapf(err, "Error opening connection to %s", url)
2016-08-02 11:42:00 -07:00
}
httpTrans := (trans).(*thrift.THttpClient)
httpTrans.SetHeader("Accept", "application/vnd.apache.thrift.binary")
httpTrans.SetHeader("Content-Type", "application/vnd.apache.thrift.binary")
httpTrans.SetHeader("User-Agent", "GoRealis v1.0.4")
2016-08-02 11:42:00 -07:00
return RealisConfig{transport: trans, protoFactory: thrift.NewTBinaryProtocolFactoryDefault()}, nil
2016-08-02 11:42:00 -07:00
}
// Helper function to add basic authorization needed to communicate with Apache Aurora.
2016-08-02 11:42:00 -07:00
func AddBasicAuth(config *RealisConfig, username string, password string) {
httpTrans := (config.transport).(*thrift.THttpClient)
httpTrans.SetHeader("Authorization", "Basic "+basicAuth(username, password))
}
// basicAuth returns the standard base64 encoding of "username:password",
// i.e. the credentials part of an HTTP Basic Authorization header.
func basicAuth(username, password string) string {
	raw := []byte(username + ":" + password)
	encoded := make([]byte, base64.StdEncoding.EncodedLen(len(raw)))
	base64.StdEncoding.Encode(encoded, raw)
	return string(encoded)
}
// Releases resources associated with the realis client.
func (r realisClient) Close() {
2016-08-02 11:42:00 -07:00
r.client.Transport.Close()
}
// Uses predefined set of states to retrieve a set of active jobs in Apache Aurora.
func (r realisClient) GetInstanceIds(key *aurora.JobKey, states map[aurora.ScheduleStatus]bool) (map[int32]bool, error) {
2016-08-02 11:42:00 -07:00
taskQ := &aurora.TaskQuery{Role: key.Role,
Environment: key.Environment,
JobName: key.Name,
Statuses: states}
2016-08-02 11:42:00 -07:00
resp, err := r.client.GetTasksWithoutConfigs(taskQ)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Error querying Aurora Scheduler for active IDs")
2016-08-02 11:42:00 -07:00
}
tasks := response.ScheduleStatusResult(resp).GetTasks()
2016-08-02 11:42:00 -07:00
jobInstanceIds := make(map[int32]bool)
2016-08-02 11:42:00 -07:00
for _, task := range tasks {
jobInstanceIds[task.GetAssignedTask().GetInstanceId()] = true
2016-08-02 11:42:00 -07:00
}
return jobInstanceIds, nil
2016-08-02 11:42:00 -07:00
}
// KillInstances asks the scheduler to kill the listed instances of the job
// identified by key. The result of the KillTasks call is passed through
// response.ResponseCodeCheck.
func (r realisClient) KillInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error) {
	// The scheduler call takes the instance IDs as a set.
	targets := make(map[int32]bool)
	for i := range instances {
		targets[instances[i]] = true
	}

	resp, err := r.client.KillTasks(key, targets)
	if err == nil {
		return response.ResponseCodeCheck(resp)
	}
	return nil, errors.Wrap(err, "Error sending Kill command to Aurora Scheduler")
}
// Sends a kill message to the scheduler for all active tasks under a job.
func (r realisClient) KillJob(key *aurora.JobKey) (*aurora.Response, error) {
2016-08-02 11:42:00 -07:00
instanceIds, err := r.GetInstanceIds(key, aurora.ACTIVE_STATES)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Could not retrieve relevant task instance IDs")
2016-08-02 11:42:00 -07:00
}
if len(instanceIds) > 0 {
resp, err := r.client.KillTasks(key, instanceIds)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Error sending Kill command to Aurora Scheduler")
2016-08-02 11:42:00 -07:00
}
return response.ResponseCodeCheck(resp)
2016-08-02 11:42:00 -07:00
} else {
return nil, errors.New("No tasks in the Active state")
2016-08-02 11:42:00 -07:00
}
}
// Sends a create job message to the scheduler with a specific job configuration.
func (r realisClient) CreateJob(auroraJob Job) (*aurora.Response, error) {
resp, err := r.client.CreateJob(auroraJob.JobConfig())
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Error sending Create command to Aurora Scheduler")
2016-08-02 11:42:00 -07:00
}
return response.ResponseCodeCheck(resp)
2016-08-02 11:42:00 -07:00
}
// ScheduleCronJob sends a schedule-cron-job message to the scheduler using the
// job configuration obtained from auroraJob.JobConfig().
func (r realisClient) ScheduleCronJob(auroraJob Job) (*aurora.Response, error) {
	jobConfig := auroraJob.JobConfig()

	resp, err := r.client.ScheduleCronJob(jobConfig)
	if err == nil {
		return response.ResponseCodeCheck(resp)
	}
	return nil, errors.Wrap(err, "Error sending Cron Job Schedule message to Aurora Scheduler")
}
// DescheduleCronJob sends a deschedule-cron-job message to the scheduler for
// the job identified by key.
func (r realisClient) DescheduleCronJob(key *aurora.JobKey) (*aurora.Response, error) {
	resp, err := r.client.DescheduleCronJob(key)
	if err == nil {
		return response.ResponseCodeCheck(resp)
	}
	return nil, errors.Wrap(err, "Error sending Cron Job De-schedule message to Aurora Scheduler")
}
// StartCronJob sends a start-cron-job message to the scheduler for the job
// identified by key.
func (r realisClient) StartCronJob(key *aurora.JobKey) (*aurora.Response, error) {
	resp, err := r.client.StartCronJob(key)
	if err == nil {
		return response.ResponseCodeCheck(resp)
	}
	return nil, errors.Wrap(err, "Error sending Start Cron Job message to Aurora Scheduler")
}
// RestartInstances asks the scheduler to restart the listed instances of the
// job identified by key. The result of the RestartShards call is passed
// through response.ResponseCodeCheck.
func (r realisClient) RestartInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error) {
	// The scheduler call takes the instance IDs as a set.
	targets := make(map[int32]bool)
	for i := range instances {
		targets[instances[i]] = true
	}

	resp, err := r.client.RestartShards(key, targets)
	if err == nil {
		return response.ResponseCodeCheck(resp)
	}
	return nil, errors.Wrap(err, "Error sending Restart command to Aurora Scheduler")
}
// Restarts all active tasks under a job configuration.
func (r realisClient) RestartJob(key *aurora.JobKey) (*aurora.Response, error) {
2016-08-02 11:42:00 -07:00
instanceIds, err := r.GetInstanceIds(key, aurora.ACTIVE_STATES)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Could not retrieve relevant task instance IDs")
2016-08-02 11:42:00 -07:00
}
if len(instanceIds) > 0 {
resp, err := r.client.RestartShards(key, instanceIds)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Error sending Restart command to Aurora Scheduler")
2016-08-02 11:42:00 -07:00
}
return response.ResponseCodeCheck(resp)
2016-08-02 11:42:00 -07:00
} else {
return nil, errors.New("No tasks in the Active state")
2016-08-02 11:42:00 -07:00
}
}
// Update all tasks under a job configuration. Currently gorealis doesn't support for canary deployments.
func (r realisClient) StartJobUpdate(updateJob *UpdateJob, message string) (*aurora.Response, error) {
2016-08-02 11:42:00 -07:00
resp, err := r.client.StartJobUpdate(updateJob.req, message)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Error sending StartJobUpdate command to Aurora Scheduler")
2016-08-02 11:42:00 -07:00
}
return response.ResponseCodeCheck(resp)
2016-08-02 11:42:00 -07:00
}
// Abort Job Update on Aurora. Requires the updateId which can be obtained on the Aurora web UI.
func (r realisClient) AbortJobUpdate(
updateKey aurora.JobUpdateKey,
message string) (*aurora.Response, error) {
2016-08-02 11:42:00 -07:00
resp, err := r.client.AbortJobUpdate(&updateKey, message)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Error sending AbortJobUpdate command to Aurora Scheduler")
2016-08-02 11:42:00 -07:00
}
return response.ResponseCodeCheck(resp)
2016-08-02 11:42:00 -07:00
}
// Scale up the number of instances under a job configuration using the configuration for specific
// instance to scale up.
func (r realisClient) AddInstances(instKey aurora.InstanceKey, count int32) (*aurora.Response, error) {
2016-08-02 11:42:00 -07:00
resp, err := r.client.AddInstances(&instKey, count)
2016-08-02 11:42:00 -07:00
if err != nil {
return nil, errors.Wrap(err, "Error sending AddInstances command to Aurora Scheduler")
2016-08-02 11:42:00 -07:00
}
return response.ResponseCodeCheck(resp)
2016-08-02 11:42:00 -07:00
}
2016-11-15 22:24:07 -08:00
// GetTaskStatus runs query against the scheduler and returns the matching
// scheduled tasks. An error is returned when the Thrift call fails or when the
// scheduler answers with a response code other than OK.
func (r realisClient) GetTaskStatus(query *aurora.TaskQuery) (tasks []*aurora.ScheduledTask, e error) {
	resp, err := r.client.GetTasksStatus(query)

	switch {
	case err != nil:
		return nil, errors.Wrap(err, "Error querying Aurora Scheduler for task status")
	case resp.GetResponseCode() != aurora.ResponseCode_OK:
		// The scheduler answered, but not with an OK response code.
		return nil, errors.New(resp.ResponseCode.String() + "--" + response.CombineMessage(resp))
	}

	result := response.ScheduleStatusResult(resp)
	return result.GetTasks(), nil
}
func (r realisClient) FetchTaskConfig(instKey aurora.InstanceKey) (*aurora.TaskConfig, error) {
ids := make(map[int32]bool)
ids[instKey.InstanceId] = true
taskQ := &aurora.TaskQuery{Role: instKey.JobKey.Role,
Environment: instKey.JobKey.Environment,
JobName: instKey.JobKey.Name,
InstanceIds: ids,
Statuses: aurora.ACTIVE_STATES}
resp, err := r.client.GetTasksStatus(taskQ)
if err != nil {
return nil, errors.Wrap(err, "Error querying Aurora Scheduler for task configuration")
}
2016-11-15 22:24:07 -08:00
//Check for response code..
if resp.GetResponseCode() != aurora.ResponseCode_OK {
return nil, errors.New(resp.ResponseCode.String() + "--" +response.CombineMessage(resp))
}
tasks := response.ScheduleStatusResult(resp).GetTasks()
if len(tasks) == 0 {
return nil, errors.Errorf("Instance %d for jobkey %s/%s/%s doesn't exist",
instKey.InstanceId,
instKey.JobKey.Environment,
instKey.JobKey.Role,
instKey.JobKey.Name)
}
// Currently, instance 0 is always picked
return tasks[0].AssignedTask.Task, nil
}
// JobUpdateDetails asks the scheduler for the details of the job updates
// matching updateQuery.
func (r realisClient) JobUpdateDetails(updateQuery aurora.JobUpdateQuery) (*aurora.Response, error) {
	resp, err := r.client.GetJobUpdateDetails(&updateQuery)
	if err == nil {
		return response.ResponseCodeCheck(resp)
	}
	return nil, errors.Wrap(err, "Unable to get job update details")
}
// RollbackJobUpdate asks the scheduler to roll back the job update identified
// by key, attaching message to the request.
func (r realisClient) RollbackJobUpdate(key aurora.JobUpdateKey, message string) (*aurora.Response, error) {
	resp, err := r.client.RollbackJobUpdate(&key, message)
	if err == nil {
		return response.ResponseCodeCheck(resp)
	}
	return nil, errors.Wrap(err, "Unable to roll back job update")
}