server

package
v0.12.0 Latest Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Dec 29, 2023 | License: Apache-2.0 | Imports: 19 | Imported by: 0

Documentation

Overview

Copyright 2021 IBM Corporation

Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.

Index

Constants

This section is empty.

Variables

This section is empty.

Functions

This section is empty.

Types

type AdapterConfiguration

// AdapterConfiguration is the configuration record used by this package.
// A pointer to it is returned by GetAdapterConfigurationFromEnv, accepted by
// NewMLServerAdapterServer, and stored in MLServerAdapterServer.AdapterConfig.
//
// NOTE(review): only the field declarations are visible here, so the
// following is inferred from field names and must be confirmed against the
// code that reads them: fields ending in "Bytes" presumably hold sizes in
// bytes, ModelLoadingTimeoutMS presumably holds a duration in milliseconds,
// and Port / MLServerPort presumably hold network port numbers.
type AdapterConfiguration struct {
	Port                         int
	MLServerPort                 int
	MLServerContainerMemReqBytes int
	MLServerMemBufferBytes       int
	CapacityInBytes              int
	MaxLoadingConcurrency        int
	ModelLoadingTimeoutMS        int
	DefaultModelSizeInBytes      int
	ModelSizeMultiplier          float64
	RuntimeVersion               string
	LimitModelConcurrency        int // 0 means no limit (default)
	RootModelDir                 string
	UseEmbeddedPuller            bool
}

func GetAdapterConfigurationFromEnv

func GetAdapterConfigurationFromEnv(log logr.Logger) (*AdapterConfiguration, error)

type MLServerAdapterServer

// MLServerAdapterServer groups a gRPC inference-service client, a gRPC client
// connection, a puller, the adapter configuration and a logger. It embeds
// mmesh.UnimplementedModelRuntimeServer and declares the LoadModel,
// RuntimeStatus and UnloadModel methods on its pointer receiver.
// NewMLServerAdapterServer returns a pointer to this type.
//
// NOTE(review): Conn is presumably the connection that backs Client — the
// constructor body is not visible here, so confirm before relying on it.
type MLServerAdapterServer struct {
	Client        mlserver.GRPCInferenceServiceClient
	Conn          *grpc.ClientConn
	Puller        *puller.Puller
	AdapterConfig *AdapterConfiguration
	Log           logr.Logger

	// embed generated Unimplemented type for forward-compatibility for gRPC
	mmesh.UnimplementedModelRuntimeServer
}

func NewMLServerAdapterServer

func NewMLServerAdapterServer(runtimePort int, config *AdapterConfiguration, log logr.Logger) *MLServerAdapterServer

func (*MLServerAdapterServer) LoadModel

func (*MLServerAdapterServer) RuntimeStatus

func (*MLServerAdapterServer) UnloadModel

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL