serving

package
v0.0.0-...-1dfa148 Latest Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Mar 12, 2024 License: Apache-2.0 Imports: 34 Imported by: 0

Documentation

Index

Constants

View Source
// Untyped string constants holding GPU-related resource names.
// Three of these strings are also declared in this package as typed
// v1.ResourceName constants (ResourceGPU, ResourceGPUMemory, ResourceGPUCore).
// NOTE(review): presumably these are Kubernetes extended-resource names used
// in pod resource requests/limits — confirm against the callers.
const (
	// GPU_RESOURCE_NAME is the "nvidia.com/gpu" resource name.
	GPU_RESOURCE_NAME        = "nvidia.com/gpu"
	// ALIYUN_GPU_RESOURCE_NAME is the "aliyun.com/gpu" resource name.
	ALIYUN_GPU_RESOURCE_NAME = "aliyun.com/gpu"
	// GPU_MEM_RESOURCE_NAME is the "aliyun.com/gpu-mem" resource name.
	GPU_MEM_RESOURCE_NAME    = "aliyun.com/gpu-mem"
	// GPU_CORE_RESOURCE_NAME is the "aliyun.com/gpu-core.percentage" resource name.
	GPU_CORE_RESOURCE_NAME   = "aliyun.com/gpu-core.percentage"
)
View Source
// GPU-related resource names typed as v1.ResourceName.
// The string values match GPU_RESOURCE_NAME, GPU_MEM_RESOURCE_NAME and
// GPU_CORE_RESOURCE_NAME declared in this package.
const (
	// ResourceGPU is the "nvidia.com/gpu" resource name.
	ResourceGPU       v1.ResourceName = "nvidia.com/gpu"
	// ResourceGPUMemory is the "aliyun.com/gpu-mem" resource name.
	ResourceGPUMemory v1.ResourceName = "aliyun.com/gpu-mem"
	// ResourceGPUCore is the "aliyun.com/gpu-core.percentage" resource name.
	ResourceGPUCore   v1.ResourceName = "aliyun.com/gpu-core.percentage"
)

Variables

This section is empty.

Functions

func AcceptJobLog

func AcceptJobLog(name, version string, jobType types.ServingJobType, args *types.LogArgs) error

func CheckJobIsOwnedByProcesser

func CheckJobIsOwnedByProcesser(labels map[string]string) bool

func DeleteServingJob

func DeleteServingJob(namespace, name, version string, jobType types.ServingJobType) error

func DisplayAllServingJobs

func DisplayAllServingJobs(jobs []ServingJob, allNamespace bool, format types.FormatStyle)

func GetAllProcesser

func GetAllProcesser() map[types.ServingJobType]Processer

func PrintLine

func PrintLine(w io.Writer, fields ...string)

func PrintServingJob

func PrintServingJob(job ServingJob, format types.FormatStyle)

func RunTrafficRouterSplit

func RunTrafficRouterSplit(namespace string, args *types.TrafficRouterSplitArgs) (err error)

func SubmitCustomServingJob

func SubmitCustomServingJob(namespace string, args *types.CustomServingArgs) (err error)

func SubmitKFServingJob

func SubmitKFServingJob(namespace string, args *types.KFServingArgs) (err error)

func SubmitKServeJob

func SubmitKServeJob(namespace string, args *types.KServeArgs) (err error)

func SubmitSeldonServingJob

func SubmitSeldonServingJob(namespace string, args *types.SeldonServingArgs) (err error)

func SubmitTensorRTServingJob

func SubmitTensorRTServingJob(namespace string, args *types.TensorRTServingArgs) (err error)

func SubmitTensorflowServingJob

func SubmitTensorflowServingJob(namespace string, args *types.TensorFlowServingArgs) (err error)

func SubmitTritonServingJob

func SubmitTritonServingJob(namespace string, args *types.TritonServingArgs) (err error)

func UpdateCustomServing

func UpdateCustomServing(args *types.UpdateCustomServingArgs) error

func UpdateKServe

func UpdateKServe(args *types.UpdateKServeArgs) error

func UpdateTensorflowServing

func UpdateTensorflowServing(args *types.UpdateTensorFlowServingArgs) error

func UpdateTritonServing

func UpdateTritonServing(args *types.UpdateTritonServingArgs) error

func ValidateJobsBeforeSubmiting

func ValidateJobsBeforeSubmiting(jobs []ServingJob, name string) error

Types

type CustomServingProcesser

type CustomServingProcesser struct {
	// contains filtered or unexported fields
}

CustomServingProcesser uses the default processer.

func (CustomServingProcesser) FilterServingJobs

func (p CustomServingProcesser) FilterServingJobs(namespace string, allNamespace bool, label string) ([]ServingJob, error)

func (CustomServingProcesser) GetServingJobs

func (p CustomServingProcesser) GetServingJobs(namespace, name, version string) ([]ServingJob, error)

func (CustomServingProcesser) IsDeploymentPod

func (p CustomServingProcesser) IsDeploymentPod(deployment *appv1.Deployment, pod *v1.Pod) bool

func (CustomServingProcesser) IsEnabled

func (p CustomServingProcesser) IsEnabled() bool

func (CustomServingProcesser) IsKnownDeployment

func (p CustomServingProcesser) IsKnownDeployment(namespace, name, version string, deployment *appv1.Deployment) bool

func (CustomServingProcesser) IsKnownService

func (p CustomServingProcesser) IsKnownService(namespace, name, version string, service *v1.Service) bool

func (CustomServingProcesser) IsSupported

func (p CustomServingProcesser) IsSupported(namespace, name, version string) bool

func (CustomServingProcesser) ListServingJobs

func (p CustomServingProcesser) ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)

func (CustomServingProcesser) Type

func (p CustomServingProcesser) Type() types.ServingJobType

type KFServingProcesser

type KFServingProcesser struct {
	// contains filtered or unexported fields
}

KFServingProcesser uses the default processer.

func (KFServingProcesser) FilterServingJobs

func (p KFServingProcesser) FilterServingJobs(namespace string, allNamespace bool, label string) ([]ServingJob, error)

func (KFServingProcesser) GetServingJobs

func (p KFServingProcesser) GetServingJobs(namespace, name, version string) ([]ServingJob, error)

func (KFServingProcesser) IsDeploymentPod

func (p KFServingProcesser) IsDeploymentPod(deployment *appv1.Deployment, pod *v1.Pod) bool

func (KFServingProcesser) IsEnabled

func (p KFServingProcesser) IsEnabled() bool

func (KFServingProcesser) IsKnownDeployment

func (p KFServingProcesser) IsKnownDeployment(namespace, name, version string, deployment *appv1.Deployment) bool

func (KFServingProcesser) IsKnownService

func (p KFServingProcesser) IsKnownService(namespace, name, version string, service *v1.Service) bool

func (KFServingProcesser) IsSupported

func (p KFServingProcesser) IsSupported(namespace, name, version string) bool

func (KFServingProcesser) ListServingJobs

func (p KFServingProcesser) ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)

func (KFServingProcesser) Type

func (p KFServingProcesser) Type() types.ServingJobType

type KServeProcesser

type KServeProcesser struct {
	// contains filtered or unexported fields
}

KServeProcesser uses the default processer.

func (*KServeProcesser) FilterServingJobs

func (p *KServeProcesser) FilterServingJobs(namespace string, allNamespace bool, label string) ([]ServingJob, error)

func (*KServeProcesser) GetServingJobs

func (p *KServeProcesser) GetServingJobs(namespace, name, version string) ([]ServingJob, error)

func (KServeProcesser) IsDeploymentPod

func (p KServeProcesser) IsDeploymentPod(deployment *appv1.Deployment, pod *v1.Pod) bool

func (KServeProcesser) IsEnabled

func (p KServeProcesser) IsEnabled() bool

func (KServeProcesser) IsKnownDeployment

func (p KServeProcesser) IsKnownDeployment(namespace, name, version string, deployment *appv1.Deployment) bool

func (KServeProcesser) IsKnownService

func (p KServeProcesser) IsKnownService(namespace, name, version string, service *v1.Service) bool

func (KServeProcesser) IsSupported

func (p KServeProcesser) IsSupported(namespace, name, version string) bool

func (*KServeProcesser) ListServingJobs

func (p *KServeProcesser) ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)

func (KServeProcesser) Type

func (p KServeProcesser) Type() types.ServingJobType

type Processer

type Processer interface {
	// Type returns the processer type.
	Type() types.ServingJobType
	// IsSupported reports whether the processer supports the serving job
	// identified by namespace, name and version.
	IsSupported(namespace, name, version string) bool
	// IsEnabled reports whether the processer is enabled.
	IsEnabled() bool
	// ListServingJobs is used to list serving jobs.
	ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)
	// GetServingJobs is used to get serving jobs by namespace, name and version.
	GetServingJobs(namespace, name, version string) ([]ServingJob, error)
	// FilterServingJobs is used to filter serving jobs.
	// NOTE(review): the implementations in this package name the third
	// parameter "label"; presumably filter is a label selector — confirm.
	FilterServingJobs(namespace string, allNamespace bool, filter string) ([]ServingJob, error)
}

Processer is used to process serving jobs

func NewCustomServingProcesser

func NewCustomServingProcesser() Processer

func NewKFServingProcesser

func NewKFServingProcesser() Processer

func NewKServeProcesser

func NewKServeProcesser() Processer

func NewSeldonServingProcesser

func NewSeldonServingProcesser() Processer

func NewTensorflowServingProcesser

func NewTensorflowServingProcesser() Processer

func NewTensorrtServingProcesser

func NewTensorrtServingProcesser() Processer

func NewTritonServingProcesser

func NewTritonServingProcesser() Processer

type SeldonServingProcesser

type SeldonServingProcesser struct {
	// contains filtered or unexported fields
}

SeldonServingProcesser uses the default processer.

func (*SeldonServingProcesser) FilterServingJobs

func (p *SeldonServingProcesser) FilterServingJobs(namespace string, allNamespace bool, label string) ([]ServingJob, error)

func (*SeldonServingProcesser) GetServingJobs

func (p *SeldonServingProcesser) GetServingJobs(namespace, name, version string) ([]ServingJob, error)

func (SeldonServingProcesser) IsDeploymentPod

func (p SeldonServingProcesser) IsDeploymentPod(deployment *appv1.Deployment, pod *v1.Pod) bool

func (SeldonServingProcesser) IsEnabled

func (p SeldonServingProcesser) IsEnabled() bool

func (SeldonServingProcesser) IsKnownDeployment

func (p SeldonServingProcesser) IsKnownDeployment(namespace, name, version string, deployment *appv1.Deployment) bool

func (SeldonServingProcesser) IsKnownService

func (p SeldonServingProcesser) IsKnownService(namespace, name, version string, service *v1.Service) bool

func (SeldonServingProcesser) IsSupported

func (p SeldonServingProcesser) IsSupported(namespace, name, version string) bool

func (*SeldonServingProcesser) ListServingJobs

func (p *SeldonServingProcesser) ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)

func (SeldonServingProcesser) Type

func (p SeldonServingProcesser) Type() types.ServingJobType

type ServingJob

type ServingJob interface {
	// Name returns the job name.
	Name() string
	// Namespace returns the namespace.
	Namespace() string
	// Uid returns the uid.
	Uid() string
	// Type returns the serving job type.
	Type() types.ServingJobType
	// Version returns the job version.
	Version() string
	// Pods returns the job pods.
	Pods() []*v1.Pod
	// Deployment returns the deployment.
	Deployment() *appv1.Deployment
	// Services returns the job services.
	Services() []*v1.Service
	// Age returns the job age.
	Age() time.Duration
	// StartTime returns the job start time.
	StartTime() *metav1.Time
	// Endpoints returns the endpoints.
	Endpoints() []types.Endpoint
	// IPAddress returns the inference address.
	IPAddress() string
	// RequestCPUs returns the CPUs owned by the serving job.
	RequestCPUs() float64
	// RequestGPUs returns the GPUs owned by the serving job.
	RequestGPUs() float64
	// RequestGPUMemory returns the GPU memory; only for gpushare.
	RequestGPUMemory() int
	// RequestGPUCore returns the GPU core; only for cgpu.
	RequestGPUCore() int
	// DesiredInstances returns the desired instance count.
	DesiredInstances() int
	// AvailableInstances returns the available instance count.
	AvailableInstances() int
	// Convert2JobInfo converts the job to a types.ServingJobInfo.
	Convert2JobInfo() types.ServingJobInfo
}

ServingJob defines a serving job

func ListServingJobs

func ListServingJobs(namespace string, allNamespace bool, servingType types.ServingJobType) ([]ServingJob, error)

func SearchServingJob

func SearchServingJob(namespace, name, version string, servingType types.ServingJobType) (ServingJob, error)

type ServingJobGroup

// ServingJobGroup bundles an id with a namespace, a serving job type and a
// job name.
// NOTE(review): how Id is derived and where this type is consumed is not
// visible on this page — confirm before relying on it.
type ServingJobGroup struct {
	Id        string
	Namespace string
	JobType   types.ServingJobType
	JobName   string
}

type TensorflowServingProcesser

type TensorflowServingProcesser struct {
	// contains filtered or unexported fields
}

TensorflowServingProcesser uses the default processer.

func (TensorflowServingProcesser) FilterServingJobs

func (p TensorflowServingProcesser) FilterServingJobs(namespace string, allNamespace bool, label string) ([]ServingJob, error)

func (TensorflowServingProcesser) GetServingJobs

func (p TensorflowServingProcesser) GetServingJobs(namespace, name, version string) ([]ServingJob, error)

func (TensorflowServingProcesser) IsDeploymentPod

func (p TensorflowServingProcesser) IsDeploymentPod(deployment *appv1.Deployment, pod *v1.Pod) bool

func (TensorflowServingProcesser) IsEnabled

func (p TensorflowServingProcesser) IsEnabled() bool

func (TensorflowServingProcesser) IsKnownDeployment

func (p TensorflowServingProcesser) IsKnownDeployment(namespace, name, version string, deployment *appv1.Deployment) bool

func (TensorflowServingProcesser) IsKnownService

func (p TensorflowServingProcesser) IsKnownService(namespace, name, version string, service *v1.Service) bool

func (TensorflowServingProcesser) IsSupported

func (p TensorflowServingProcesser) IsSupported(namespace, name, version string) bool

func (TensorflowServingProcesser) ListServingJobs

func (p TensorflowServingProcesser) ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)

func (TensorflowServingProcesser) Type

func (p TensorflowServingProcesser) Type() types.ServingJobType

type TensorrtServingProcesser

type TensorrtServingProcesser struct {
	// contains filtered or unexported fields
}

TensorrtServingProcesser uses the default processer.

func (TensorrtServingProcesser) FilterServingJobs

func (p TensorrtServingProcesser) FilterServingJobs(namespace string, allNamespace bool, label string) ([]ServingJob, error)

func (TensorrtServingProcesser) GetServingJobs

func (p TensorrtServingProcesser) GetServingJobs(namespace, name, version string) ([]ServingJob, error)

func (TensorrtServingProcesser) IsDeploymentPod

func (p TensorrtServingProcesser) IsDeploymentPod(deployment *appv1.Deployment, pod *v1.Pod) bool

func (TensorrtServingProcesser) IsEnabled

func (p TensorrtServingProcesser) IsEnabled() bool

func (TensorrtServingProcesser) IsKnownDeployment

func (p TensorrtServingProcesser) IsKnownDeployment(namespace, name, version string, deployment *appv1.Deployment) bool

func (TensorrtServingProcesser) IsKnownService

func (p TensorrtServingProcesser) IsKnownService(namespace, name, version string, service *v1.Service) bool

func (TensorrtServingProcesser) IsSupported

func (p TensorrtServingProcesser) IsSupported(namespace, name, version string) bool

func (TensorrtServingProcesser) ListServingJobs

func (p TensorrtServingProcesser) ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)

func (TensorrtServingProcesser) Type

func (p TensorrtServingProcesser) Type() types.ServingJobType

type TritonServingProcesser

type TritonServingProcesser struct {
	// contains filtered or unexported fields
}

TritonServingProcesser uses the default processer.

func (TritonServingProcesser) FilterServingJobs

func (p TritonServingProcesser) FilterServingJobs(namespace string, allNamespace bool, label string) ([]ServingJob, error)

func (TritonServingProcesser) GetServingJobs

func (p TritonServingProcesser) GetServingJobs(namespace, name, version string) ([]ServingJob, error)

func (TritonServingProcesser) IsDeploymentPod

func (p TritonServingProcesser) IsDeploymentPod(deployment *appv1.Deployment, pod *v1.Pod) bool

func (TritonServingProcesser) IsEnabled

func (p TritonServingProcesser) IsEnabled() bool

func (TritonServingProcesser) IsKnownDeployment

func (p TritonServingProcesser) IsKnownDeployment(namespace, name, version string, deployment *appv1.Deployment) bool

func (TritonServingProcesser) IsKnownService

func (p TritonServingProcesser) IsKnownService(namespace, name, version string, service *v1.Service) bool

func (TritonServingProcesser) IsSupported

func (p TritonServingProcesser) IsSupported(namespace, name, version string) bool

func (TritonServingProcesser) ListServingJobs

func (p TritonServingProcesser) ListServingJobs(namespace string, allNamespace bool) ([]ServingJob, error)

func (TritonServingProcesser) Type

func (p TritonServingProcesser) Type() types.ServingJobType

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL