2016-08-02 11:42:00 -07:00
|
|
|
/**
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
2016-08-09 16:18:30 -07:00
|
|
|
|
2016-08-02 11:42:00 -07:00
|
|
|
// Package realis provides the ability to use Thrift API to communicate with Apache Aurora.
|
|
|
|
package realis
|
|
|
|
|
|
|
|
import (
|
|
|
|
"encoding/base64"
|
2017-03-09 11:37:03 -08:00
|
|
|
"net/http"
|
|
|
|
"net/http/cookiejar"
|
|
|
|
"time"
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
"fmt"
|
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
"math/rand"
|
|
|
|
|
2016-08-02 11:42:00 -07:00
|
|
|
"git.apache.org/thrift.git/lib/go/thrift"
|
|
|
|
"github.com/pkg/errors"
|
2016-09-19 15:34:56 -04:00
|
|
|
"github.com/rdelval/gorealis/gen-go/apache/aurora"
|
2016-11-02 20:41:43 -04:00
|
|
|
"github.com/rdelval/gorealis/response"
|
2016-08-02 11:42:00 -07:00
|
|
|
)
|
|
|
|
|
2017-03-23 19:18:23 -04:00
|
|
|
// VERSION is the gorealis release string. It is appended to the "GoRealis v"
// prefix to form the User-Agent header sent on every Thrift HTTP transport.
const VERSION = "1.0.4"
|
|
|
|
|
2016-08-12 12:48:42 -07:00
|
|
|
type Realis interface {
|
2016-08-25 18:56:55 -07:00
|
|
|
AbortJobUpdate(updateKey aurora.JobUpdateKey, message string) (*aurora.Response, error)
|
2016-08-24 15:38:44 -07:00
|
|
|
AddInstances(instKey aurora.InstanceKey, count int32) (*aurora.Response, error)
|
2017-03-10 01:14:09 -08:00
|
|
|
RemoveInstances(key *aurora.JobKey, count int32) (*aurora.Response, error)
|
2016-08-24 15:38:44 -07:00
|
|
|
CreateJob(auroraJob Job) (*aurora.Response, error)
|
2016-09-30 01:24:49 -04:00
|
|
|
DescheduleCronJob(key *aurora.JobKey) (*aurora.Response, error)
|
2017-02-13 19:31:41 -05:00
|
|
|
GetTaskStatus(query *aurora.TaskQuery) ([]*aurora.ScheduledTask, error)
|
2016-08-24 15:38:44 -07:00
|
|
|
FetchTaskConfig(instKey aurora.InstanceKey) (*aurora.TaskConfig, error)
|
2016-09-19 15:34:56 -04:00
|
|
|
GetInstanceIds(key *aurora.JobKey, states map[aurora.ScheduleStatus]bool) (map[int32]bool, error)
|
2016-09-29 20:45:24 -04:00
|
|
|
JobUpdateDetails(updateQuery aurora.JobUpdateQuery) (*aurora.Response, error)
|
2016-08-12 12:48:42 -07:00
|
|
|
KillJob(key *aurora.JobKey) (*aurora.Response, error)
|
2016-08-25 18:56:55 -07:00
|
|
|
KillInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error)
|
|
|
|
RestartInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error)
|
2016-08-12 12:48:42 -07:00
|
|
|
RestartJob(key *aurora.JobKey) (*aurora.Response, error)
|
2016-09-30 00:44:38 -04:00
|
|
|
RollbackJobUpdate(key aurora.JobUpdateKey, message string) (*aurora.Response, error)
|
2016-09-30 01:24:49 -04:00
|
|
|
ScheduleCronJob(auroraJob Job) (*aurora.Response, error)
|
2016-08-12 12:48:42 -07:00
|
|
|
StartJobUpdate(updateJob *UpdateJob, message string) (*aurora.Response, error)
|
2016-09-30 01:24:49 -04:00
|
|
|
StartCronJob(key *aurora.JobKey) (*aurora.Response, error)
|
2017-03-09 11:37:03 -08:00
|
|
|
GetJobUpdateSummaries(jobUpdateQuery *aurora.JobUpdateQuery) (*aurora.Response, error)
|
2017-03-16 23:19:30 -07:00
|
|
|
ReestablishConn() error
|
2017-03-30 18:17:21 -07:00
|
|
|
RealisConfig() *RealisConfig
|
2016-08-12 12:48:42 -07:00
|
|
|
Close()
|
|
|
|
}
|
|
|
|
|
|
|
|
type realisClient struct {
|
2017-03-16 23:19:30 -07:00
|
|
|
config *RealisConfig
|
2017-03-09 11:37:03 -08:00
|
|
|
client *aurora.AuroraSchedulerManagerClient
|
|
|
|
readonlyClient *aurora.ReadOnlySchedulerClient
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
// option mutates a RealisConfig. Values of this type are produced by the
// option constructors in this file and applied in order by NewRealisClient.
type option func(*RealisConfig)
|
|
|
|
|
|
|
|
//Config sets for options in RealisConfig.
|
|
|
|
func BasicAuth(username, password string) option {
|
|
|
|
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.username = username
|
|
|
|
config.password = password
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func SchedulerUrl(url string) option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.url = url
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TimeoutMS(timeout int) option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.timeoutms = timeout
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func ZKCluster(cluster *Cluster) option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.cluster = cluster
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-31 10:48:36 -07:00
|
|
|
func ZKUrl(url string) option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.cluster = GetDefaultClusterFromZKUrl(url)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
func Retries(backoff *Backoff) option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.backoff = backoff
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func ThriftJSON() option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.jsonTransport = true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func ThriftBinary() option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.binTransport = true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func BackOff(b *Backoff) option {
|
|
|
|
return func(config *RealisConfig) {
|
|
|
|
config.backoff = b
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-04-06 23:15:44 -07:00
|
|
|
func newTJSONTransport(url string, timeout int) (thrift.TTransport, error) {
|
|
|
|
|
|
|
|
trans, err := defaultTTransport(url, timeout)
|
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
|
|
|
httpTrans := (trans).(*thrift.THttpClient)
|
|
|
|
httpTrans.SetHeader("Content-Type", "application/x-thrift")
|
|
|
|
httpTrans.SetHeader("User-Agent", "GoRealis v"+VERSION)
|
|
|
|
return trans, err
|
|
|
|
}
|
|
|
|
|
|
|
|
func newTBinTransport(url string, timeout int) (thrift.TTransport, error) {
|
|
|
|
trans, err := defaultTTransport(url, timeout)
|
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
|
|
|
httpTrans := (trans).(*thrift.THttpClient)
|
|
|
|
httpTrans.DelHeader("Content-Type") // Workaround for using thrift HttpPostClient
|
|
|
|
httpTrans.SetHeader("Accept", "application/vnd.apache.thrift.binary")
|
|
|
|
httpTrans.SetHeader("Content-Type", "application/vnd.apache.thrift.binary")
|
|
|
|
httpTrans.SetHeader("User-Agent", "GoRealis v"+VERSION)
|
|
|
|
|
|
|
|
return trans, err
|
|
|
|
}
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
func NewRealisClient(options ...option) (Realis, error) {
|
|
|
|
config := &RealisConfig{}
|
|
|
|
fmt.Println(" options length: ", options)
|
|
|
|
for _, opt := range options {
|
|
|
|
opt(config)
|
|
|
|
}
|
|
|
|
//Default timeout
|
|
|
|
if config.timeoutms == 0 {
|
|
|
|
config.timeoutms = 10000
|
|
|
|
}
|
|
|
|
//Set default Transport to JSON if needed.
|
|
|
|
if !config.jsonTransport && !config.binTransport {
|
|
|
|
config.jsonTransport = true
|
|
|
|
}
|
|
|
|
var url string
|
|
|
|
var err error
|
|
|
|
//Cluster or URL?
|
|
|
|
if config.cluster != nil {
|
|
|
|
url, err = LeaderFromZK(*config.cluster)
|
|
|
|
if err != nil {
|
|
|
|
fmt.Errorf("LeaderFromZK error: %+v\n ", err)
|
|
|
|
}
|
|
|
|
fmt.Println("schedURLFromZK: ", url)
|
|
|
|
} else if config.url != "" {
|
|
|
|
fmt.Println("Scheduler URL: ", config.url)
|
|
|
|
url = config.url
|
|
|
|
} else {
|
|
|
|
return nil, errors.New("Incomplete Options -- url or cluster required")
|
|
|
|
}
|
|
|
|
|
|
|
|
if config.jsonTransport {
|
2017-04-06 23:15:44 -07:00
|
|
|
trans, err := newTJSONTransport(url, config.timeoutms)
|
2017-03-30 18:17:21 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
2017-04-06 23:15:44 -07:00
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
config.transport = trans
|
|
|
|
config.protoFactory = thrift.NewTJSONProtocolFactory()
|
|
|
|
} else if config.binTransport {
|
2017-04-06 23:15:44 -07:00
|
|
|
trans, err := newTBinTransport(url, config.timeoutms)
|
2017-03-30 18:17:21 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
|
|
|
config.transport = trans
|
|
|
|
config.protoFactory = thrift.NewTBinaryProtocolFactoryDefault()
|
|
|
|
}
|
|
|
|
|
|
|
|
//Basic Authentication.
|
|
|
|
if config.username != "" && config.password != "" {
|
|
|
|
AddBasicAuth(config, config.username, config.password)
|
|
|
|
}
|
|
|
|
|
|
|
|
//Set defaultBackoff if required.
|
|
|
|
if config.backoff == nil {
|
|
|
|
config.backoff = &defaultBackoff
|
2017-04-06 23:15:44 -07:00
|
|
|
} else {
|
|
|
|
defaultBackoff = *config.backoff
|
|
|
|
fmt.Printf(" updating default backoff : %+v\n", *config.backoff)
|
2017-03-30 18:17:21 -07:00
|
|
|
}
|
|
|
|
|
2017-04-18 16:35:27 -07:00
|
|
|
fmt.Printf("gorealis config url: %+v\n", config.url)
|
2017-03-30 18:17:21 -07:00
|
|
|
|
|
|
|
return &realisClient{
|
|
|
|
config: config,
|
|
|
|
client: aurora.NewAuroraSchedulerManagerClientFactory(config.transport, config.protoFactory),
|
|
|
|
readonlyClient: aurora.NewReadOnlySchedulerClientFactory(config.transport, config.protoFactory)}, nil
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2017-02-13 19:31:41 -05:00
|
|
|
// Wrapper object to provide future flexibility
|
2016-08-02 11:42:00 -07:00
|
|
|
type RealisConfig struct {
|
2017-03-30 18:17:21 -07:00
|
|
|
username, password string
|
|
|
|
url string
|
|
|
|
timeoutms int
|
|
|
|
binTransport, jsonTransport bool
|
|
|
|
cluster *Cluster
|
|
|
|
backoff *Backoff
|
|
|
|
transport thrift.TTransport
|
|
|
|
protoFactory thrift.TProtocolFactory
|
2017-03-16 23:19:30 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Backoff describes a retry policy with a growing delay between attempts.
type Backoff struct {
	// Duration is the base duration.
	Duration time.Duration
	// Factor multiplies Duration on each iteration.
	Factor float64
	// Jitter is the amount of jitter applied each iteration.
	Jitter float64
	// Steps is the number of attempts after which the caller exits with an error.
	Steps int
}
|
|
|
|
|
|
|
|
var defaultBackoff = Backoff{
|
2017-03-20 22:34:45 -07:00
|
|
|
Steps: 3,
|
|
|
|
Duration: 10 * time.Second,
|
2017-03-16 23:19:30 -07:00
|
|
|
Factor: 5.0,
|
|
|
|
Jitter: 0.1,
|
|
|
|
}
|
|
|
|
|
|
|
|
// Jitter returns a time.Duration between duration and
// duration + maxFactor*duration, chosen at random.
//
// This allows clients to avoid converging on periodic behavior. If maxFactor
// is zero or negative, a factor of 1.0 is used instead.
func Jitter(duration time.Duration, maxFactor float64) time.Duration {
	factor := maxFactor
	if factor <= 0.0 {
		factor = 1.0
	}
	extra := rand.Float64() * factor * float64(duration)
	return duration + time.Duration(extra)
}
|
|
|
|
|
|
|
|
// Create a new Client with Cluster information and other details.
|
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
func NewDefaultClientUsingCluster(cluster *Cluster, user, passwd string) (Realis, error) {
|
2017-03-16 23:19:30 -07:00
|
|
|
|
|
|
|
url, err := LeaderFromZK(*cluster)
|
|
|
|
if err != nil {
|
|
|
|
fmt.Println(err)
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
fmt.Printf(" url: %s\n", url)
|
|
|
|
|
|
|
|
//Create new configuration with default transport layer
|
2017-03-21 16:59:27 -07:00
|
|
|
config, err := newDefaultConfig(url, 10000)
|
2017-03-16 23:19:30 -07:00
|
|
|
if err != nil {
|
|
|
|
fmt.Println(err)
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
config.username = user
|
|
|
|
config.password = passwd
|
|
|
|
config.cluster = cluster
|
2017-03-20 22:34:45 -07:00
|
|
|
config.url = ""
|
|
|
|
// Configured for vagrant
|
|
|
|
AddBasicAuth(config, user, passwd)
|
2017-03-21 16:59:27 -07:00
|
|
|
r := newClient(config)
|
2017-03-20 22:34:45 -07:00
|
|
|
return r, nil
|
|
|
|
}
|
|
|
|
|
2017-03-21 16:59:27 -07:00
|
|
|
func GetDefaultClusterFromZKUrl(zkurl string) *Cluster {
|
|
|
|
return &Cluster{Name: "defaultCluster",
|
2017-03-20 22:34:45 -07:00
|
|
|
AuthMechanism: "UNAUTHENTICATED",
|
2017-03-21 16:59:27 -07:00
|
|
|
ZK: zkurl,
|
2017-03-20 22:34:45 -07:00
|
|
|
SchedZKPath: "/aurora/scheduler",
|
|
|
|
AgentRunDir: "latest",
|
|
|
|
AgentRoot: "/var/lib/mesos",
|
|
|
|
}
|
2017-03-21 16:59:27 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
//This api would create default cluster object..
|
|
|
|
func NewDefaultClientUsingZKUrl(zkUrl, user, passwd string) (Realis, error) {
|
|
|
|
|
|
|
|
fmt.Println(" zkUrl: %s", zkUrl)
|
|
|
|
cluster := GetDefaultClusterFromZKUrl(zkUrl)
|
2017-03-20 22:34:45 -07:00
|
|
|
|
|
|
|
url, err := LeaderFromZK(*cluster)
|
|
|
|
if err != nil {
|
|
|
|
fmt.Println(err)
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
fmt.Printf(" url: %s\n", url)
|
|
|
|
|
|
|
|
//Create new configuration with default transport layer
|
2017-03-21 16:59:27 -07:00
|
|
|
config, err := newDefaultConfig(url, 10000)
|
2017-03-20 22:34:45 -07:00
|
|
|
if err != nil {
|
|
|
|
fmt.Println(err)
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
config.username = user
|
|
|
|
config.password = passwd
|
|
|
|
config.cluster = cluster
|
|
|
|
config.url = ""
|
|
|
|
// Configured for vagrant
|
|
|
|
AddBasicAuth(config, user, passwd)
|
2017-03-21 16:59:27 -07:00
|
|
|
r := newClient(config)
|
2017-03-20 22:34:45 -07:00
|
|
|
return r, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func NewDefaultClientUsingUrl(url, user, passwd string) (Realis, error) {
|
|
|
|
|
|
|
|
fmt.Printf(" url: %s\n", url)
|
|
|
|
//Create new configuration with default transport layer
|
2017-03-21 16:59:27 -07:00
|
|
|
config, err := newDefaultConfig(url, 10000)
|
2017-03-20 22:34:45 -07:00
|
|
|
if err != nil {
|
|
|
|
fmt.Println(err)
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
config.username = user
|
|
|
|
config.password = passwd
|
|
|
|
config.url = url
|
|
|
|
config.cluster = nil
|
2017-03-16 23:19:30 -07:00
|
|
|
// Configured for vagrant
|
|
|
|
AddBasicAuth(config, user, passwd)
|
2017-03-21 16:59:27 -07:00
|
|
|
r := newClient(config)
|
2017-03-16 23:19:30 -07:00
|
|
|
return r, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Create a new Client with a default transport layer
|
2017-03-21 16:59:27 -07:00
|
|
|
func newClient(realisconfig *RealisConfig) Realis {
|
2017-03-10 15:50:26 -08:00
|
|
|
return &realisClient{
|
2017-03-16 23:19:30 -07:00
|
|
|
config: realisconfig,
|
|
|
|
client: aurora.NewAuroraSchedulerManagerClientFactory(realisconfig.transport, realisconfig.protoFactory),
|
|
|
|
readonlyClient: aurora.NewReadOnlySchedulerClientFactory(realisconfig.transport, realisconfig.protoFactory)}
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2017-02-13 19:31:41 -05:00
|
|
|
// Creates a default Thrift Transport object for communications in gorealis using an HTTP Post Client
|
|
|
|
func defaultTTransport(urlstr string, timeoutms int) (thrift.TTransport, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
jar, err := cookiejar.New(nil)
|
|
|
|
if err != nil {
|
2017-02-13 19:31:41 -05:00
|
|
|
return &thrift.THttpClient{}, errors.Wrap(err, "Error creating Cookie Jar")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2017-02-13 19:31:41 -05:00
|
|
|
trans, err := thrift.NewTHttpPostClientWithOptions(urlstr+"/api",
|
2016-11-14 13:27:25 -08:00
|
|
|
thrift.THttpClientOptions{Client: &http.Client{Timeout: time.Millisecond * time.Duration(timeoutms), Jar: jar}})
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
if err != nil {
|
2017-02-13 19:31:41 -05:00
|
|
|
return &thrift.THttpClient{}, errors.Wrap(err, "Error creating transport")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
if err := trans.Open(); err != nil {
|
2017-02-13 19:31:41 -05:00
|
|
|
return &thrift.THttpClient{}, errors.Wrapf(err, "Error opening connection to %s", urlstr)
|
|
|
|
}
|
|
|
|
|
|
|
|
return trans, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Create a default configuration of the transport layer, requires a URL to test connection with.
|
|
|
|
// Uses HTTP Post as transport layer and Thrift JSON as the wire protocol by default.
|
2017-03-21 16:59:27 -07:00
|
|
|
func newDefaultConfig(url string, timeoutms int) (*RealisConfig, error) {
|
|
|
|
return newTJSONConfig(url, timeoutms)
|
2017-02-13 19:31:41 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
// Creates a realis config object using HTTP Post and Thrift JSON protocol to communicate with Aurora.
|
2017-03-21 16:59:27 -07:00
|
|
|
func newTJSONConfig(url string, timeoutms int) (*RealisConfig, error) {
|
2017-02-13 19:31:41 -05:00
|
|
|
trans, err := defaultTTransport(url, timeoutms)
|
|
|
|
if err != nil {
|
2017-03-16 23:19:30 -07:00
|
|
|
return &RealisConfig{}, errors.Wrap(err, "Error creating realis config")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2017-02-13 19:31:41 -05:00
|
|
|
|
|
|
|
httpTrans := (trans).(*thrift.THttpClient)
|
|
|
|
httpTrans.SetHeader("Content-Type", "application/x-thrift")
|
2017-03-23 19:18:23 -04:00
|
|
|
httpTrans.SetHeader("User-Agent", "GoRealis v"+VERSION)
|
2017-02-13 19:31:41 -05:00
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
return &RealisConfig{transport: trans, protoFactory: thrift.NewTJSONProtocolFactory()}, nil
|
2017-02-13 19:31:41 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
// Creates a realis config config using HTTP Post and Thrift Binary protocol to communicate with Aurora.
|
2017-03-21 16:59:27 -07:00
|
|
|
func newTBinaryConfig(url string, timeoutms int) (*RealisConfig, error) {
|
2017-02-13 19:31:41 -05:00
|
|
|
trans, err := defaultTTransport(url, timeoutms)
|
|
|
|
if err != nil {
|
2017-03-16 23:19:30 -07:00
|
|
|
return &RealisConfig{}, errors.Wrap(err, "Error creating realis config")
|
2017-02-13 19:31:41 -05:00
|
|
|
}
|
|
|
|
|
2017-02-10 19:23:20 -05:00
|
|
|
httpTrans := (trans).(*thrift.THttpClient)
|
2017-03-23 19:18:23 -04:00
|
|
|
httpTrans.DelHeader("Content-Type") // Workaround for using thrift HttpPostClient
|
|
|
|
|
2017-02-10 19:23:20 -05:00
|
|
|
httpTrans.SetHeader("Accept", "application/vnd.apache.thrift.binary")
|
|
|
|
httpTrans.SetHeader("Content-Type", "application/vnd.apache.thrift.binary")
|
2017-03-23 19:18:23 -04:00
|
|
|
httpTrans.SetHeader("User-Agent", "GoRealis v"+VERSION)
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
return &RealisConfig{transport: trans, protoFactory: thrift.NewTBinaryProtocolFactoryDefault()}, nil
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Helper function to add basic authorization needed to communicate with Apache Aurora.
|
2016-08-02 11:42:00 -07:00
|
|
|
func AddBasicAuth(config *RealisConfig, username string, password string) {
|
2017-03-16 23:19:30 -07:00
|
|
|
config.username = username
|
|
|
|
config.password = password
|
2016-08-02 11:42:00 -07:00
|
|
|
httpTrans := (config.transport).(*thrift.THttpClient)
|
|
|
|
httpTrans.SetHeader("Authorization", "Basic "+basicAuth(username, password))
|
|
|
|
}
|
|
|
|
|
|
|
|
// basicAuth returns the standard base64 encoding of "username:password".
func basicAuth(username, password string) string {
	credentials := []byte(username + ":" + password)
	return base64.StdEncoding.EncodeToString(credentials)
}
|
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
func (r *realisClient) ReestablishConn() error {
|
|
|
|
//close existing connection..
|
|
|
|
fmt.Println("ReestablishConn begin ....")
|
|
|
|
r.Close()
|
2017-03-20 22:34:45 -07:00
|
|
|
//First check cluster object for re-establish; if not available then try with scheduler url.
|
2017-03-30 18:17:21 -07:00
|
|
|
//var config *RealisConfig
|
|
|
|
var err error
|
|
|
|
var url string
|
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
if r.config.cluster != nil && r.config.username != "" && r.config.password != "" {
|
2017-03-20 22:34:45 -07:00
|
|
|
//Re-establish using cluster object.
|
2017-03-30 18:17:21 -07:00
|
|
|
url, err = LeaderFromZK(*r.config.cluster)
|
2017-03-16 23:19:30 -07:00
|
|
|
if err != nil {
|
2017-03-20 22:34:45 -07:00
|
|
|
fmt.Errorf("LeaderFromZK error: %+v\n ", err)
|
2017-03-16 23:19:30 -07:00
|
|
|
}
|
|
|
|
fmt.Println("ReestablishConn url: ", url)
|
2017-03-30 18:17:21 -07:00
|
|
|
if r.config.jsonTransport {
|
2017-04-06 23:15:44 -07:00
|
|
|
trans, err := newTJSONTransport(url, r.config.timeoutms)
|
2017-03-30 18:17:21 -07:00
|
|
|
if err != nil {
|
|
|
|
return errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
|
|
|
r.config.transport = trans
|
|
|
|
r.config.protoFactory = thrift.NewTJSONProtocolFactory()
|
|
|
|
} else if r.config.binTransport {
|
2017-04-06 23:15:44 -07:00
|
|
|
trans, err := newTBinTransport(url, r.config.timeoutms)
|
2017-03-30 18:17:21 -07:00
|
|
|
if err != nil {
|
|
|
|
return errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
|
|
|
r.config.transport = trans
|
|
|
|
r.config.protoFactory = thrift.NewTBinaryProtocolFactoryDefault()
|
|
|
|
}
|
2017-03-16 23:19:30 -07:00
|
|
|
if err != nil {
|
2017-03-30 18:17:21 -07:00
|
|
|
fmt.Println("error creating config: ", err)
|
2017-03-16 23:19:30 -07:00
|
|
|
}
|
|
|
|
// Configured for basic-auth
|
2017-03-30 18:17:21 -07:00
|
|
|
AddBasicAuth(r.config, r.config.username, r.config.password)
|
|
|
|
r.client = aurora.NewAuroraSchedulerManagerClientFactory(r.config.transport, r.config.protoFactory)
|
|
|
|
r.readonlyClient = aurora.NewReadOnlySchedulerClientFactory(r.config.transport, r.config.protoFactory)
|
2017-03-20 22:34:45 -07:00
|
|
|
} else if r.config.url != "" && r.config.username != "" && r.config.password != "" {
|
|
|
|
//Re-establish using scheduler url.
|
2017-03-30 18:17:21 -07:00
|
|
|
fmt.Println("ReestablishConn url: ", r.config.url)
|
|
|
|
if r.config.jsonTransport {
|
2017-04-06 23:15:44 -07:00
|
|
|
trans, err := newTJSONTransport(url, r.config.timeoutms)
|
2017-03-30 18:17:21 -07:00
|
|
|
if err != nil {
|
|
|
|
return errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
|
|
|
r.config.transport = trans
|
|
|
|
r.config.protoFactory = thrift.NewTJSONProtocolFactory()
|
|
|
|
} else if r.config.binTransport {
|
2017-04-06 23:15:44 -07:00
|
|
|
trans, err := newTBinTransport(url, r.config.timeoutms)
|
2017-03-30 18:17:21 -07:00
|
|
|
if err != nil {
|
|
|
|
return errors.Wrap(err, "Error creating realis")
|
|
|
|
}
|
|
|
|
r.config.transport = trans
|
|
|
|
r.config.protoFactory = thrift.NewTBinaryProtocolFactoryDefault()
|
2017-03-20 22:34:45 -07:00
|
|
|
}
|
2017-03-30 18:17:21 -07:00
|
|
|
AddBasicAuth(r.config, r.config.username, r.config.password)
|
|
|
|
r.client = aurora.NewAuroraSchedulerManagerClientFactory(r.config.transport, r.config.protoFactory)
|
|
|
|
r.readonlyClient = aurora.NewReadOnlySchedulerClientFactory(r.config.transport, r.config.protoFactory)
|
2017-03-16 23:19:30 -07:00
|
|
|
} else {
|
|
|
|
fmt.Println(" Missing Data for ReestablishConn ")
|
|
|
|
fmt.Println(" r.config.cluster: ", r.config.cluster)
|
|
|
|
fmt.Println(" r.config.username: ", r.config.username)
|
|
|
|
fmt.Println(" r.config.passwd: ", r.config.password)
|
2017-03-20 22:34:45 -07:00
|
|
|
fmt.Println(" r.config.url: ", r.config.url)
|
2017-03-16 23:19:30 -07:00
|
|
|
return errors.New(" Missing Data for ReestablishConn ")
|
|
|
|
}
|
2017-04-18 16:35:27 -07:00
|
|
|
fmt.Printf(" config url before return: %+v\n", r.config.url)
|
2017-03-16 23:19:30 -07:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Releases resources associated with the realis client.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) Close() {
|
2016-08-02 11:42:00 -07:00
|
|
|
r.client.Transport.Close()
|
2017-03-09 11:37:03 -08:00
|
|
|
r.readonlyClient.Transport.Close()
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Uses predefined set of states to retrieve a set of active jobs in Apache Aurora.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) GetInstanceIds(key *aurora.JobKey, states map[aurora.ScheduleStatus]bool) (map[int32]bool, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
taskQ := &aurora.TaskQuery{Role: key.Role,
|
|
|
|
Environment: key.Environment,
|
|
|
|
JobName: key.Name,
|
2016-08-26 16:35:31 -07:00
|
|
|
Statuses: states}
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.client.GetTasksWithoutConfigs(taskQ); err == nil {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
|
|
|
}
|
2016-08-02 11:42:00 -07:00
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error querying Aurora Scheduler for active IDs")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2017-05-30 12:03:17 -07:00
|
|
|
resp, err = response.ResponseCodeCheck(resp)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2016-09-30 01:24:49 -04:00
|
|
|
tasks := response.ScheduleStatusResult(resp).GetTasks()
|
2016-08-09 14:21:43 -07:00
|
|
|
jobInstanceIds := make(map[int32]bool)
|
2016-08-02 11:42:00 -07:00
|
|
|
for _, task := range tasks {
|
2016-08-09 14:21:43 -07:00
|
|
|
jobInstanceIds[task.GetAssignedTask().GetInstanceId()] = true
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2016-08-09 14:21:43 -07:00
|
|
|
return jobInstanceIds, nil
|
2017-05-30 12:03:17 -07:00
|
|
|
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) GetJobUpdateSummaries(jobUpdateQuery *aurora.JobUpdateQuery) (*aurora.Response, error) {
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.readonlyClient.GetJobUpdateSummaries(jobUpdateQuery); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error getting job update summaries from Aurora Scheduler")
|
2017-03-09 11:37:03 -08:00
|
|
|
}
|
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
// Kill specific instances of a job.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) KillInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error) {
|
2016-08-09 13:44:54 -07:00
|
|
|
|
2016-08-09 14:21:43 -07:00
|
|
|
instanceIds := make(map[int32]bool)
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2017-03-30 18:17:21 -07:00
|
|
|
|
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
2016-08-09 13:44:54 -07:00
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
for _, instId := range instances {
|
|
|
|
instanceIds[instId] = true
|
|
|
|
}
|
2016-08-09 13:44:54 -07:00
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
if resp, err = r.client.KillTasks(key, instanceIds); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
2017-03-16 23:19:30 -07:00
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-09 13:44:54 -07:00
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Kill command to Aurora Scheduler")
|
2016-08-09 13:44:54 -07:00
|
|
|
}
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
func (r *realisClient) RealisConfig() *RealisConfig {
|
|
|
|
return r.config
|
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Sends a kill message to the scheduler for all active tasks under a job.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) KillJob(key *aurora.JobKey) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var instanceIds map[int32]bool
|
|
|
|
var err error
|
|
|
|
var resp *aurora.Response
|
|
|
|
instanceIds, err = r.GetInstanceIds(key, aurora.ACTIVE_STATES)
|
2016-08-02 11:42:00 -07:00
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Could not retrieve relevant task instance IDs")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 14:21:43 -07:00
|
|
|
if len(instanceIds) > 0 {
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-16 23:19:30 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
|
|
|
|
if resp, err = r.client.KillTasks(key, instanceIds); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
|
|
|
}
|
2016-08-02 11:42:00 -07:00
|
|
|
if err != nil {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Kill command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
}
|
2017-03-16 23:19:30 -07:00
|
|
|
return nil, errors.New("No tasks in the Active state")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Sends a create job message to the scheduler with a specific job configuration.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) CreateJob(auroraJob Job) (*aurora.Response, error) {
|
2017-03-16 23:19:30 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-16 23:19:30 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
2017-03-30 18:17:21 -07:00
|
|
|
fmt.Println(" STEPS: ", i)
|
2017-03-16 23:19:30 -07:00
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
2017-03-30 18:17:21 -07:00
|
|
|
fmt.Println(" calling CreateJob")
|
2017-03-16 23:19:30 -07:00
|
|
|
if resp, err = r.client.CreateJob(auroraJob.JobConfig()); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
2017-03-30 18:17:21 -07:00
|
|
|
fmt.Println("CreateJob err: %+v\n", err)
|
2017-03-16 23:19:30 -07:00
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2017-03-16 23:19:30 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Create command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) ScheduleCronJob(auroraJob Job) (*aurora.Response, error) {
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2016-09-30 01:24:49 -04:00
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
2016-09-30 01:24:49 -04:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
if resp, err = r.client.ScheduleCronJob(auroraJob.JobConfig()); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-09-30 01:24:49 -04:00
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Cron Job Schedule message to Aurora Scheduler")
|
2016-09-30 01:24:49 -04:00
|
|
|
}
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) DescheduleCronJob(key *aurora.JobKey) (*aurora.Response, error) {
|
2016-09-30 01:24:49 -04:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
|
|
|
|
if resp, err = r.client.DescheduleCronJob(key); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-09-30 01:24:49 -04:00
|
|
|
}
|
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Cron Job De-schedule message to Aurora Scheduler")
|
2016-09-30 01:24:49 -04:00
|
|
|
}
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) StartCronJob(key *aurora.JobKey) (*aurora.Response, error) {
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2016-09-30 01:24:49 -04:00
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
2016-09-30 01:24:49 -04:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
if resp, err = r.client.StartCronJob(key); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-09-30 01:24:49 -04:00
|
|
|
}
|
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Start Cron Job message to Aurora Scheduler")
|
2016-09-30 01:24:49 -04:00
|
|
|
}
|
|
|
|
|
2016-08-25 18:56:55 -07:00
|
|
|
// Restarts specific instances specified
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) RestartInstances(key *aurora.JobKey, instances ...int32) (*aurora.Response, error) {
|
2016-08-25 18:56:55 -07:00
|
|
|
instanceIds := make(map[int32]bool)
|
|
|
|
|
|
|
|
for _, instId := range instances {
|
|
|
|
instanceIds[instId] = true
|
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2017-03-30 18:17:21 -07:00
|
|
|
|
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
2016-08-25 18:56:55 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
if resp, err = r.client.RestartShards(key, instanceIds); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-25 18:56:55 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
}
|
|
|
|
return nil, errors.Wrap(err, "Error sending Restart command to Aurora Scheduler")
|
2016-08-25 18:56:55 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Restarts all active tasks under a job configuration.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) RestartJob(key *aurora.JobKey) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
instanceIds, err1 := r.GetInstanceIds(key, aurora.ACTIVE_STATES)
|
|
|
|
if err1 != nil {
|
|
|
|
return nil, errors.Wrap(err1, "Could not retrieve relevant task instance IDs")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2016-08-09 14:21:43 -07:00
|
|
|
if len(instanceIds) > 0 {
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
|
|
|
|
if resp, err = r.client.RestartShards(key, instanceIds); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending Restart command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
|
|
|
|
} else {
|
2016-08-16 18:40:02 -07:00
|
|
|
return nil, errors.New("No tasks in the Active state")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-16 18:40:02 -07:00
|
|
|
// Update all tasks under a job configuration. Currently gorealis doesn't support for canary deployments.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) StartJobUpdate(updateJob *UpdateJob, message string) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-16 23:19:30 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.client.StartJobUpdate(updateJob.req, message); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2017-03-16 23:19:30 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending StartJobUpdate command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Abort Job Update on Aurora. Requires the updateId which can be obtained on the Aurora web UI.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) AbortJobUpdate(
|
2016-08-25 18:56:55 -07:00
|
|
|
updateKey aurora.JobUpdateKey,
|
2016-08-09 13:30:26 -07:00
|
|
|
message string) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.client.AbortJobUpdate(&updateKey, message); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending AbortJobUpdate command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
|
|
|
|
2016-08-09 16:18:30 -07:00
|
|
|
// Scale up the number of instances under a job configuration using the configuration for specific
|
|
|
|
// instance to scale up.
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) AddInstances(instKey aurora.InstanceKey, count int32) (*aurora.Response, error) {
|
2016-08-02 11:42:00 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.client.AddInstances(&instKey, count); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Error sending AddInstances command to Aurora Scheduler")
|
2016-08-02 11:42:00 -07:00
|
|
|
}
|
2016-08-24 15:38:44 -07:00
|
|
|
|
2017-03-21 12:52:29 -07:00
|
|
|
//Scale down the number of instances under a job configuration using the configuration of a specific instance
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) RemoveInstances(key *aurora.JobKey, count int32) (*aurora.Response, error) {
|
2017-03-10 01:14:09 -08:00
|
|
|
instanceIds, err := r.GetInstanceIds(key, aurora.ACTIVE_STATES)
|
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "RemoveInstances: Could not retrieve relevant instance IDs")
|
|
|
|
}
|
|
|
|
if len(instanceIds) < int(count) {
|
2017-03-10 15:50:26 -08:00
|
|
|
return nil, errors.New(fmt.Sprintf("RemoveInstances: No sufficient instances to Kill - "+
|
2017-03-10 01:14:09 -08:00
|
|
|
"Instances to kill %d Total Instances %d", count, len(instanceIds)))
|
|
|
|
}
|
|
|
|
instanceList := make([]int32, count)
|
|
|
|
i := 0
|
|
|
|
for k := range instanceIds {
|
|
|
|
instanceList[i] = k
|
|
|
|
i += 1
|
|
|
|
if i == int(count) {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return r.KillInstances(key, instanceList...)
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) GetTaskStatus(query *aurora.TaskQuery) (tasks []*aurora.ScheduledTask, e error) {
|
2016-11-15 22:24:07 -08:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.client.GetTasksStatus(query); err == nil {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-11-15 22:24:07 -08:00
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error querying Aurora Scheduler for task status")
|
|
|
|
}
|
|
|
|
//Check for response code..
|
|
|
|
if resp.GetResponseCode() != aurora.ResponseCode_OK {
|
|
|
|
return nil, errors.New(resp.ResponseCode.String() + "--" + response.CombineMessage(resp))
|
|
|
|
}
|
|
|
|
|
|
|
|
return response.ScheduleStatusResult(resp).GetTasks(), nil
|
|
|
|
}
|
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) FetchTaskConfig(instKey aurora.InstanceKey) (*aurora.TaskConfig, error) {
|
2016-08-24 15:38:44 -07:00
|
|
|
|
|
|
|
ids := make(map[int32]bool)
|
|
|
|
|
|
|
|
ids[instKey.InstanceId] = true
|
|
|
|
taskQ := &aurora.TaskQuery{Role: instKey.JobKey.Role,
|
|
|
|
Environment: instKey.JobKey.Environment,
|
|
|
|
JobName: instKey.JobKey.Name,
|
2016-08-24 17:21:59 -07:00
|
|
|
InstanceIds: ids,
|
|
|
|
Statuses: aurora.ACTIVE_STATES}
|
2016-08-24 15:38:44 -07:00
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-16 23:19:30 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
|
|
|
|
if resp, err = r.client.GetTasksStatus(taskQ); err == nil {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-24 15:38:44 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, errors.Wrap(err, "Error querying Aurora Scheduler for task configuration")
|
|
|
|
}
|
|
|
|
|
2016-11-15 22:24:07 -08:00
|
|
|
//Check for response code..
|
|
|
|
if resp.GetResponseCode() != aurora.ResponseCode_OK {
|
2017-02-13 19:31:41 -05:00
|
|
|
return nil, errors.New(resp.ResponseCode.String() + "--" + response.CombineMessage(resp))
|
2016-11-15 22:24:07 -08:00
|
|
|
}
|
|
|
|
|
2016-09-30 01:24:49 -04:00
|
|
|
tasks := response.ScheduleStatusResult(resp).GetTasks()
|
2016-08-24 15:38:44 -07:00
|
|
|
|
2016-08-24 17:21:59 -07:00
|
|
|
if len(tasks) == 0 {
|
2016-08-24 15:38:44 -07:00
|
|
|
return nil, errors.Errorf("Instance %d for jobkey %s/%s/%s doesn't exist",
|
|
|
|
instKey.InstanceId,
|
|
|
|
instKey.JobKey.Environment,
|
|
|
|
instKey.JobKey.Role,
|
|
|
|
instKey.JobKey.Name)
|
|
|
|
}
|
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
// Currently, instance 0 is always picked..
|
2016-08-24 15:38:44 -07:00
|
|
|
return tasks[0].AssignedTask.Task, nil
|
|
|
|
}
|
2016-08-25 18:56:55 -07:00
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) JobUpdateDetails(updateQuery aurora.JobUpdateQuery) (*aurora.Response, error) {
|
2016-08-25 18:56:55 -07:00
|
|
|
|
2017-03-20 22:34:45 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
2016-08-25 18:56:55 -07:00
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-20 22:34:45 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.client.GetJobUpdateDetails(&updateQuery); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-08-25 18:56:55 -07:00
|
|
|
}
|
2017-03-20 22:34:45 -07:00
|
|
|
return nil, errors.Wrap(err, "Unable to get job update details")
|
2016-08-25 18:56:55 -07:00
|
|
|
}
|
2016-09-30 00:44:38 -04:00
|
|
|
|
2017-03-10 15:50:26 -08:00
|
|
|
func (r *realisClient) RollbackJobUpdate(key aurora.JobUpdateKey, message string) (*aurora.Response, error) {
|
2017-03-16 23:19:30 -07:00
|
|
|
var resp *aurora.Response
|
|
|
|
var err error
|
|
|
|
|
2017-03-30 18:17:21 -07:00
|
|
|
defaultBackoff := r.config.backoff
|
2017-03-16 23:19:30 -07:00
|
|
|
duration := defaultBackoff.Duration
|
|
|
|
for i := 0; i < defaultBackoff.Steps; i++ {
|
|
|
|
if i != 0 {
|
|
|
|
adjusted := duration
|
|
|
|
if defaultBackoff.Jitter > 0.0 {
|
|
|
|
adjusted = Jitter(duration, defaultBackoff.Jitter)
|
|
|
|
}
|
|
|
|
fmt.Println(" sleeping for: ", adjusted)
|
|
|
|
time.Sleep(adjusted)
|
|
|
|
duration = time.Duration(float64(duration) * defaultBackoff.Factor)
|
|
|
|
}
|
|
|
|
if resp, err = r.client.RollbackJobUpdate(&key, message); err == nil {
|
|
|
|
return response.ResponseCodeCheck(resp)
|
|
|
|
}
|
|
|
|
err1 := r.ReestablishConn()
|
|
|
|
if err1 != nil {
|
|
|
|
fmt.Println("error in ReestablishConn: ", err1)
|
|
|
|
}
|
2016-09-30 00:44:38 -04:00
|
|
|
}
|
|
|
|
|
2017-03-16 23:19:30 -07:00
|
|
|
return nil, errors.Wrap(err, "Unable to roll back job update")
|
2016-09-30 00:44:38 -04:00
|
|
|
}
|