2016-08-02 11:42:00 -07:00
|
|
|
/**
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
2016-08-09 16:18:30 -07:00
|
|
|
|
2016-08-02 11:42:00 -07:00
|
|
|
// Package realis provides the ability to use Thrift API to communicate with Apache Aurora.
|
|
|
|
package realis
|
|
|
|
|
|
|
|
import (
|
|
|
|
"encoding/base64"
|
|
|
|
"fmt"
|
|
|
|
"git.apache.org/thrift.git/lib/go/thrift"
|
|
|
|
"github.com/pkg/errors"
|
2016-09-19 15:34:56 -04:00
|
|
|
"github.com/rdelval/gorealis/gen-go/apache/aurora"
|
2016-08-02 11:42:00 -07:00
|
|
|
"net/http"
|
|
|
|
"net/http/cookiejar"
|
|
|
|
"os"
|
|
|
|
"time"
|
|
|
|
)
|
|
|
|
|
2016-08-12 12:48:42 -07:00
|
|
|
type Realis interface {
|
2016-08-25 18:56:55 -07:00
|
|
|
AbortJobUpdate(updateKey aurora.JobUpdateKey, message string) (*aurora.Response, error)
|
2016-08-24 15:38:44 -07:00
|
|
|
AddInstances(instKey aurora.InstanceKey, count int32) (*aurora.Response, error)
|
|
|
|
CreateJob(auroraJob Job) (*aurora.Response, error)
|
|
|
|
FetchTaskConfig(instKey aurora.InstanceKey) (*aurora.TaskConfig, error)
|
2016-09-19 15:34:56 -04:00
|
|
|
GetInstanceIds(key *aurora.JobKey, states map[aurora.ScheduleStatus]bool) (map[int32]bool, error)
|
2016-08-25 18:56:55 -07:00
|
|
|
JobUpdateDetails(updateKey aurora.JobUpdateKey) (*aurora.Response, error)
|
2016-08-12 12:48:42 -07:00
|
|
|
KillJob(key *aurora.JobKey) (*aurora.Response, error)
|
2016-08-25 18:56:55 -07:00
|
|
|
KillInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error)
|
|
|
|
RestartInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error)
|
2016-08-12 12:48:42 -07:00
|
|
|
RestartJob(key *aurora.JobKey) (*aurora.Response, error)
|
|
|
|
StartJobUpdate(updateJob *UpdateJob, message string) (*aurora.Response, error)
|
|
|
|
Close()
|
|
|
|
}
|
|
|
|
|
|
|
|
type realisClient struct {
|
2016-08-02 11:42:00 -07:00
|
|
|
client *aurora.AuroraSchedulerManagerClient
|
|
|
|
}
|
|
|
|
|
|
|
|
// Wrap object to provide future flexibility
|
|
|
|
type RealisConfig struct {
|
|
|
|
transport thrift.TTransport
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Create a new Client with a default transport layer
|
2016-08-12 12:48:42 -07:00
|
|
|
func NewClient(config RealisConfig) Realis {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
httpTrans := (config.transport).(*thrift.THttpClient)
|
|
|
|
httpTrans.SetHeader("User-Agent", "GoRealis v0.1")
|
|
|
|
|
|
|
|
protocolFactory := thrift.NewTJSONProtocolFactory()
|
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
return realisClient{
|
|
|
|
client: aurora.NewAuroraSchedulerManagerClientFactory(config.transport, protocolFactory)}
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Create a default configuration of the transport layer, requires a URL to test connection with.
|
2016-08-02 11:42:00 -07:00
|
|
|
func NewDefaultConfig(url string) (RealisConfig, error) {
|
|
|
|
jar, err := cookiejar.New(nil)
|
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return RealisConfig{}, errors.Wrap(err, "Error creating Cookie Jar")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
//Custom client to timeout after 10 seconds to avoid hanging
|
|
|
|
trans, err := thrift.NewTHttpPostClientWithOptions(url+"/api",
|
|
|
|
thrift.THttpClientOptions{Client: &http.Client{Timeout: time.Second * 10, Jar: jar}})
|
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return RealisConfig{}, errors.Wrap(err, "Error creating transport")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
if err := trans.Open(); err != nil {
|
|
|
|
fmt.Fprintln(os.Stderr)
|
2016-08-16 18:40:02 -07:00
|
|
|
return RealisConfig{}, errors.Wrapf(err, "Error opening connection to %s", url)
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
return RealisConfig{transport: trans}, nil
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Helper function to add basic authorization needed to communicate with Apache Aurora.
|
2016-08-02 11:42:00 -07:00
|
|
|
func AddBasicAuth(config *RealisConfig, username string, password string) {
|
|
|
|
httpTrans := (config.transport).(*thrift.THttpClient)
|
|
|
|
httpTrans.SetHeader("Authorization", "Basic "+basicAuth(username, password))
|
|
|
|
}
|
|
|
|
|
|
|
|
// basicAuth returns the standard base64 encoding of "username:password", i.e.
// the credentials portion of an HTTP Basic Authorization header.
func basicAuth(username, password string) string {
	credentials := []byte(username + ":" + password)
	return base64.StdEncoding.EncodeToString(credentials)
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Releases resources associated with the realis client.
|
2016-08-12 12:48:42 -07:00
|
|
|
func (r realisClient) Close() {
|
2016-08-02 11:42:00 -07:00
|
|
|
r.client.Transport.Close()
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Uses predefined set of states to retrieve a set of active jobs in Apache Aurora.
|
2016-08-26 16:35:31 -07:00
|
|
|
func (r realisClient) GetInstanceIds(key *aurora.JobKey, states map[aurora.ScheduleStatus]bool) (map[int32]bool, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
taskQ := &aurora.TaskQuery{Role: key.Role,
|
|
|
|
Environment: key.Environment,
|
|
|
|
JobName: key.Name,
|
2016-08-26 16:35:31 -07:00
|
|
|
Statuses: states}
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
response, err := r.client.GetTasksWithoutConfigs(taskQ)
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error querying Aurora Scheduler for active IDs")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
tasks := response.GetResult_().GetScheduleStatusResult_().GetTasks()
|
|
|
|
|
2016-08-09 14:21:43 -07:00
|
|
|
jobInstanceIds := make(map[int32]bool)
|
2016-08-02 11:42:00 -07:00
|
|
|
for _, task := range tasks {
|
2016-08-09 14:21:43 -07:00
|
|
|
jobInstanceIds[task.GetAssignedTask().GetInstanceId()] = true
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 14:21:43 -07:00
|
|
|
return jobInstanceIds, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
// Kill specific instances of a job.
|
|
|
|
func (r realisClient) KillInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error) {
|
2016-08-09 13:44:54 -07:00
|
|
|
|
2016-08-09 14:21:43 -07:00
|
|
|
instanceIds := make(map[int32]bool)
|
2016-08-09 13:44:54 -07:00
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
for _, instId := range instances {
|
|
|
|
instanceIds[instId] = true
|
|
|
|
}
|
2016-08-09 13:44:54 -07:00
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
response, err := r.client.KillTasks(key, instanceIds)
|
2016-08-09 13:44:54 -07:00
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Kill command to Aurora Scheduler")
|
2016-08-09 13:44:54 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
return response, nil
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Sends a kill message to the scheduler for all active tasks under a job.
|
2016-08-12 12:48:42 -07:00
|
|
|
func (r realisClient) KillJob(key *aurora.JobKey) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2016-08-26 16:35:31 -07:00
|
|
|
instanceIds, err := r.GetInstanceIds(key, aurora.ACTIVE_STATES)
|
2016-08-02 11:42:00 -07:00
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Could not retrieve relevant task instance IDs")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 14:21:43 -07:00
|
|
|
if len(instanceIds) > 0 {
|
|
|
|
response, err := r.client.KillTasks(key, instanceIds)
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Kill command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2016-08-09 13:30:26 -07:00
|
|
|
|
|
|
|
return response, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
} else {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.New("No tasks in the Active state")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Sends a create job message to the scheduler with a specific job configuration.
|
2016-08-24 15:38:44 -07:00
|
|
|
func (r realisClient) CreateJob(auroraJob Job) (*aurora.Response, error) {
|
|
|
|
response, err := r.client.CreateJob(auroraJob.JobConfig())
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Create command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 13:30:26 -07:00
|
|
|
return response, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
// Restarts specific instances specified
|
|
|
|
func (r realisClient) RestartInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error) {
|
|
|
|
instanceIds := make(map[int32]bool)
|
|
|
|
|
|
|
|
for _, instId := range instances {
|
|
|
|
instanceIds[instId] = true
|
|
|
|
}
|
|
|
|
|
|
|
|
response, err := r.client.RestartShards(key, instanceIds)
|
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error sending Restart command to Aurora Scheduler")
|
|
|
|
}
|
|
|
|
|
|
|
|
return response, nil
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Restarts all active tasks under a job configuration.
|
2016-08-12 12:48:42 -07:00
|
|
|
func (r realisClient) RestartJob(key *aurora.JobKey) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2016-08-26 16:35:31 -07:00
|
|
|
instanceIds, err := r.GetInstanceIds(key, aurora.ACTIVE_STATES)
|
2016-08-02 11:42:00 -07:00
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Could not retrieve relevant task instance IDs")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 14:21:43 -07:00
|
|
|
if len(instanceIds) > 0 {
|
|
|
|
response, err := r.client.RestartShards(key, instanceIds)
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Restart command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 13:30:26 -07:00
|
|
|
return response, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
} else {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.New("No tasks in the Active state")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-16 18:40:02 -07:00
|
|
|
// Update all tasks under a job configuration. Currently gorealis doesn't support for canary deployments.
|
2016-08-12 12:48:42 -07:00
|
|
|
func (r realisClient) StartJobUpdate(updateJob *UpdateJob, message string) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
response, err := r.client.StartJobUpdate(updateJob.req, message)
|
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending StartJobUpdate command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 13:30:26 -07:00
|
|
|
return response, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Abort Job Update on Aurora. Requires the updateId which can be obtained on the Aurora web UI.
|
2016-08-12 12:48:42 -07:00
|
|
|
func (r realisClient) AbortJobUpdate(
|
2016-08-25 18:56:55 -07:00
|
|
|
updateKey aurora.JobUpdateKey,
|
2016-08-09 13:30:26 -07:00
|
|
|
message string) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
response, err := r.client.AbortJobUpdate(&updateKey, message)
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending AbortJobUpdate command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 13:30:26 -07:00
|
|
|
return response, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Scale up the number of instances under a job configuration using the configuration for specific
|
|
|
|
// instance to scale up.
|
2016-08-24 15:38:44 -07:00
|
|
|
func (r realisClient) AddInstances(instKey aurora.InstanceKey, count int32) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2016-08-24 15:38:44 -07:00
|
|
|
response, err := r.client.AddInstances(&instKey, count)
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending AddInstances command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 13:30:26 -07:00
|
|
|
return response, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2016-08-24 15:38:44 -07:00
|
|
|
|
|
|
|
func (r realisClient) FetchTaskConfig(instKey aurora.InstanceKey) (*aurora.TaskConfig, error) {
|
|
|
|
|
|
|
|
ids := make(map[int32]bool)
|
|
|
|
|
|
|
|
ids[instKey.InstanceId] = true
|
|
|
|
taskQ := &aurora.TaskQuery{Role: instKey.JobKey.Role,
|
|
|
|
Environment: instKey.JobKey.Environment,
|
|
|
|
JobName: instKey.JobKey.Name,
|
2016-08-24 17:21:59 -07:00
|
|
|
InstanceIds: ids,
|
|
|
|
Statuses: aurora.ACTIVE_STATES}
|
2016-08-24 15:38:44 -07:00
|
|
|
|
|
|
|
response, err := r.client.GetTasksStatus(taskQ)
|
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error querying Aurora Scheduler for task configuration")
|
|
|
|
}
|
|
|
|
|
|
|
|
tasks := response.GetResult_().GetScheduleStatusResult_().GetTasks()
|
|
|
|
|
2016-08-24 17:21:59 -07:00
|
|
|
if len(tasks) == 0 {
|
2016-08-24 15:38:44 -07:00
|
|
|
return nil, errors.Errorf("Instance %d for jobkey %s/%s/%s doesn't exist",
|
|
|
|
instKey.InstanceId,
|
|
|
|
instKey.JobKey.Environment,
|
|
|
|
instKey.JobKey.Role,
|
|
|
|
instKey.JobKey.Name)
|
|
|
|
}
|
|
|
|
|
|
|
|
return tasks[0].AssignedTask.Task, nil
|
|
|
|
}
|
2016-08-25 18:56:55 -07:00
|
|
|
|
|
|
|
func (r realisClient) JobUpdateDetails(updateKey aurora.JobUpdateKey) (*aurora.Response, error) {
|
|
|
|
|
|
|
|
resp, err := r.client.GetJobUpdateDetails(&updateKey)
|
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Unable to get job update details")
|
|
|
|
}
|
|
|
|
|
2016-09-19 15:34:56 -04:00
|
|
|
return resp, nil
|
2016-08-25 18:56:55 -07:00
|
|
|
}
|