v1

package
v0.122.0 Latest Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Oct 7, 2024 License: Apache-2.0 Imports: 16 Imported by: 4

Documentation

Overview

Package v1 is a reverse proxy.

It translates gRPC into RESTful JSON APIs.

Index

Constants

This section is empty.

Variables

View Source
var (
	ModelFormat_name = map[int32]string{
		0: "MODEL_FORMAT_UNSPECIFIED",
		1: "MODEL_FORMAT_GGUF",
		2: "MODEL_FORMAT_HUGGING_FACE",
		3: "MODEL_FORMAT_NVIDIA_TRITON",
	}
	ModelFormat_value = map[string]int32{
		"MODEL_FORMAT_UNSPECIFIED":   0,
		"MODEL_FORMAT_GGUF":          1,
		"MODEL_FORMAT_HUGGING_FACE":  2,
		"MODEL_FORMAT_NVIDIA_TRITON": 3,
	}
)

Enum value maps for ModelFormat.

View Source
var (
	AdapterType_name = map[int32]string{
		0: "ADAPTER_TYPE_UNSPECIFIED",
		1: "ADAPTER_TYPE_LORA",
		2: "ADAPTER_TYPE_QLORA",
	}
	AdapterType_value = map[string]int32{
		"ADAPTER_TYPE_UNSPECIFIED": 0,
		"ADAPTER_TYPE_LORA":        1,
		"ADAPTER_TYPE_QLORA":       2,
	}
)

Enum value maps for AdapterType.

View Source
var (
	QuantizationType_name = map[int32]string{
		0: "QUANTIZATION_TYPE_UNSPECIFIED",
		1: "QUANTIZATION_TYPE_GGUF",
		2: "QUANTIZATION_TYPE_AWQ",
	}
	QuantizationType_value = map[string]int32{
		"QUANTIZATION_TYPE_UNSPECIFIED": 0,
		"QUANTIZATION_TYPE_GGUF":        1,
		"QUANTIZATION_TYPE_AWQ":         2,
	}
)

Enum value maps for QuantizationType.

View Source
var File_api_v1_model_manager_service_proto protoreflect.FileDescriptor
View Source
var ModelsService_ServiceDesc = grpc.ServiceDesc{
	ServiceName: "llmariner.models.server.v1.ModelsService",
	HandlerType: (*ModelsServiceServer)(nil),
	Methods: []grpc.MethodDesc{
		{
			MethodName: "ListModels",
			Handler:    _ModelsService_ListModels_Handler,
		},
		{
			MethodName: "GetModel",
			Handler:    _ModelsService_GetModel_Handler,
		},
		{
			MethodName: "DeleteModel",
			Handler:    _ModelsService_DeleteModel_Handler,
		},
		{
			MethodName: "ListBaseModels",
			Handler:    _ModelsService_ListBaseModels_Handler,
		},
	},
	Streams:  []grpc.StreamDesc{},
	Metadata: "api/v1/model_manager_service.proto",
}

ModelsService_ServiceDesc is the grpc.ServiceDesc for ModelsService service. It's only intended for direct use with grpc.RegisterService, and not to be introspected or modified (even as a copy).

View Source
var ModelsWorkerService_ServiceDesc = grpc.ServiceDesc{
	ServiceName: "llmariner.models.server.v1.ModelsWorkerService",
	HandlerType: (*ModelsWorkerServiceServer)(nil),
	Methods: []grpc.MethodDesc{
		{
			MethodName: "CreateStorageConfig",
			Handler:    _ModelsWorkerService_CreateStorageConfig_Handler,
		},
		{
			MethodName: "GetStorageConfig",
			Handler:    _ModelsWorkerService_GetStorageConfig_Handler,
		},
		{
			MethodName: "GetModel",
			Handler:    _ModelsWorkerService_GetModel_Handler,
		},
		{
			MethodName: "RegisterModel",
			Handler:    _ModelsWorkerService_RegisterModel_Handler,
		},
		{
			MethodName: "PublishModel",
			Handler:    _ModelsWorkerService_PublishModel_Handler,
		},
		{
			MethodName: "GetModelPath",
			Handler:    _ModelsWorkerService_GetModelPath_Handler,
		},
		{
			MethodName: "GetModelAttributes",
			Handler:    _ModelsWorkerService_GetModelAttributes_Handler,
		},
		{
			MethodName: "CreateBaseModel",
			Handler:    _ModelsWorkerService_CreateBaseModel_Handler,
		},
		{
			MethodName: "GetBaseModelPath",
			Handler:    _ModelsWorkerService_GetBaseModelPath_Handler,
		},
	},
	Streams:  []grpc.StreamDesc{},
	Metadata: "api/v1/model_manager_service.proto",
}

ModelsWorkerService_ServiceDesc is the grpc.ServiceDesc for ModelsWorkerService service. It's only intended for direct use with grpc.RegisterService, and not to be introspected or modified (even as a copy).

Functions

func RegisterModelsServiceHandler

func RegisterModelsServiceHandler(ctx context.Context, mux *runtime.ServeMux, conn *grpc.ClientConn) error

RegisterModelsServiceHandler registers the http handlers for service ModelsService to "mux". The handlers forward requests to the grpc endpoint over "conn".

func RegisterModelsServiceHandlerClient

func RegisterModelsServiceHandlerClient(ctx context.Context, mux *runtime.ServeMux, client ModelsServiceClient) error

RegisterModelsServiceHandlerClient registers the http handlers for service ModelsService to "mux". The handlers forward requests to the grpc endpoint over the given implementation of "ModelsServiceClient". Note: the gRPC framework executes interceptors within the gRPC handler. If the passed in "ModelsServiceClient" doesn't go through the normal gRPC flow (creating a gRPC client etc.) then it will be up to the passed in "ModelsServiceClient" to call the correct interceptors.

func RegisterModelsServiceHandlerFromEndpoint

func RegisterModelsServiceHandlerFromEndpoint(ctx context.Context, mux *runtime.ServeMux, endpoint string, opts []grpc.DialOption) (err error)

RegisterModelsServiceHandlerFromEndpoint is the same as RegisterModelsServiceHandler but automatically dials to "endpoint" and closes the connection when "ctx" gets done.

func RegisterModelsServiceHandlerServer

func RegisterModelsServiceHandlerServer(ctx context.Context, mux *runtime.ServeMux, server ModelsServiceServer) error

RegisterModelsServiceHandlerServer registers the http handlers for service ModelsService to "mux". Unary RPCs call ModelsServiceServer directly; streaming RPCs are currently unsupported pending https://github.com/grpc/grpc-go/issues/906. Note that using this registration option will cause many gRPC library features to stop working. Consider using RegisterModelsServiceHandlerFromEndpoint instead.

func RegisterModelsServiceServer

func RegisterModelsServiceServer(s grpc.ServiceRegistrar, srv ModelsServiceServer)

func RegisterModelsWorkerServiceServer

func RegisterModelsWorkerServiceServer(s grpc.ServiceRegistrar, srv ModelsWorkerServiceServer)

Types

type AdapterType

type AdapterType int32
const (
	AdapterType_ADAPTER_TYPE_UNSPECIFIED AdapterType = 0
	AdapterType_ADAPTER_TYPE_LORA        AdapterType = 1
	AdapterType_ADAPTER_TYPE_QLORA       AdapterType = 2
)

func (AdapterType) Descriptor

func (AdapterType) Enum

func (x AdapterType) Enum() *AdapterType

func (AdapterType) EnumDescriptor deprecated

func (AdapterType) EnumDescriptor() ([]byte, []int)

Deprecated: Use AdapterType.Descriptor instead.

func (AdapterType) Number

func (x AdapterType) Number() protoreflect.EnumNumber

func (AdapterType) String

func (x AdapterType) String() string

func (AdapterType) Type

type BaseModel

type BaseModel struct {
	Id      string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	Created int64  `protobuf:"varint,2,opt,name=created,proto3" json:"created,omitempty"`
	Object  string `protobuf:"bytes,3,opt,name=object,proto3" json:"object,omitempty"`
	// contains filtered or unexported fields
}

func (*BaseModel) Descriptor deprecated

func (*BaseModel) Descriptor() ([]byte, []int)

Deprecated: Use BaseModel.ProtoReflect.Descriptor instead.

func (*BaseModel) GetCreated

func (x *BaseModel) GetCreated() int64

func (*BaseModel) GetId

func (x *BaseModel) GetId() string

func (*BaseModel) GetObject

func (x *BaseModel) GetObject() string

func (*BaseModel) ProtoMessage

func (*BaseModel) ProtoMessage()

func (*BaseModel) ProtoReflect

func (x *BaseModel) ProtoReflect() protoreflect.Message

func (*BaseModel) Reset

func (x *BaseModel) Reset()

func (*BaseModel) String

func (x *BaseModel) String() string

type CreateBaseModelRequest

// CreateBaseModelRequest is the request message accepted by the
// CreateBaseModel RPC of ModelsWorkerService.
type CreateBaseModelRequest struct {
	Id   string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	Path string `protobuf:"bytes,2,opt,name=path,proto3" json:"path,omitempty"`
	// formats is the list of formats supported by the base model. If not set, the format is
	// considered to be GGUF for backward compatibility.
	Formats []ModelFormat `protobuf:"varint,4,rep,packed,name=formats,proto3,enum=llmariner.models.server.v1.ModelFormat" json:"formats,omitempty"`
	// gguf_model_path is the path of the GGUF model. Set if the model supports the GGUF format.
	GgufModelPath string `protobuf:"bytes,3,opt,name=gguf_model_path,json=ggufModelPath,proto3" json:"gguf_model_path,omitempty"`
	// contains filtered or unexported fields
}

func (*CreateBaseModelRequest) Descriptor deprecated

func (*CreateBaseModelRequest) Descriptor() ([]byte, []int)

Deprecated: Use CreateBaseModelRequest.ProtoReflect.Descriptor instead.

func (*CreateBaseModelRequest) GetFormats

func (x *CreateBaseModelRequest) GetFormats() []ModelFormat

func (*CreateBaseModelRequest) GetGgufModelPath

func (x *CreateBaseModelRequest) GetGgufModelPath() string

func (*CreateBaseModelRequest) GetId

func (x *CreateBaseModelRequest) GetId() string

func (*CreateBaseModelRequest) GetPath

func (x *CreateBaseModelRequest) GetPath() string

func (*CreateBaseModelRequest) ProtoMessage

func (*CreateBaseModelRequest) ProtoMessage()

func (*CreateBaseModelRequest) ProtoReflect

func (x *CreateBaseModelRequest) ProtoReflect() protoreflect.Message

func (*CreateBaseModelRequest) Reset

func (x *CreateBaseModelRequest) Reset()

func (*CreateBaseModelRequest) String

func (x *CreateBaseModelRequest) String() string

type CreateStorageConfigRequest

type CreateStorageConfigRequest struct {
	PathPrefix string `protobuf:"bytes,1,opt,name=path_prefix,json=pathPrefix,proto3" json:"path_prefix,omitempty"`
	// contains filtered or unexported fields
}

func (*CreateStorageConfigRequest) Descriptor deprecated

func (*CreateStorageConfigRequest) Descriptor() ([]byte, []int)

Deprecated: Use CreateStorageConfigRequest.ProtoReflect.Descriptor instead.

func (*CreateStorageConfigRequest) GetPathPrefix

func (x *CreateStorageConfigRequest) GetPathPrefix() string

func (*CreateStorageConfigRequest) ProtoMessage

func (*CreateStorageConfigRequest) ProtoMessage()

func (*CreateStorageConfigRequest) ProtoReflect

func (*CreateStorageConfigRequest) Reset

func (x *CreateStorageConfigRequest) Reset()

func (*CreateStorageConfigRequest) String

func (x *CreateStorageConfigRequest) String() string

type DeleteModelRequest

type DeleteModelRequest struct {
	Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	// contains filtered or unexported fields
}

func (*DeleteModelRequest) Descriptor deprecated

func (*DeleteModelRequest) Descriptor() ([]byte, []int)

Deprecated: Use DeleteModelRequest.ProtoReflect.Descriptor instead.

func (*DeleteModelRequest) GetId

func (x *DeleteModelRequest) GetId() string

func (*DeleteModelRequest) ProtoMessage

func (*DeleteModelRequest) ProtoMessage()

func (*DeleteModelRequest) ProtoReflect

func (x *DeleteModelRequest) ProtoReflect() protoreflect.Message

func (*DeleteModelRequest) Reset

func (x *DeleteModelRequest) Reset()

func (*DeleteModelRequest) String

func (x *DeleteModelRequest) String() string

type DeleteModelResponse

type DeleteModelResponse struct {
	Id      string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	Object  string `protobuf:"bytes,2,opt,name=object,proto3" json:"object,omitempty"`
	Deleted bool   `protobuf:"varint,3,opt,name=deleted,proto3" json:"deleted,omitempty"`
	// contains filtered or unexported fields
}

func (*DeleteModelResponse) Descriptor deprecated

func (*DeleteModelResponse) Descriptor() ([]byte, []int)

Deprecated: Use DeleteModelResponse.ProtoReflect.Descriptor instead.

func (*DeleteModelResponse) GetDeleted

func (x *DeleteModelResponse) GetDeleted() bool

func (*DeleteModelResponse) GetId

func (x *DeleteModelResponse) GetId() string

func (*DeleteModelResponse) GetObject

func (x *DeleteModelResponse) GetObject() string

func (*DeleteModelResponse) ProtoMessage

func (*DeleteModelResponse) ProtoMessage()

func (*DeleteModelResponse) ProtoReflect

func (x *DeleteModelResponse) ProtoReflect() protoreflect.Message

func (*DeleteModelResponse) Reset

func (x *DeleteModelResponse) Reset()

func (*DeleteModelResponse) String

func (x *DeleteModelResponse) String() string

type GetBaseModelPathRequest

type GetBaseModelPathRequest struct {
	Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	// contains filtered or unexported fields
}

func (*GetBaseModelPathRequest) Descriptor deprecated

func (*GetBaseModelPathRequest) Descriptor() ([]byte, []int)

Deprecated: Use GetBaseModelPathRequest.ProtoReflect.Descriptor instead.

func (*GetBaseModelPathRequest) GetId

func (x *GetBaseModelPathRequest) GetId() string

func (*GetBaseModelPathRequest) ProtoMessage

func (*GetBaseModelPathRequest) ProtoMessage()

func (*GetBaseModelPathRequest) ProtoReflect

func (x *GetBaseModelPathRequest) ProtoReflect() protoreflect.Message

func (*GetBaseModelPathRequest) Reset

func (x *GetBaseModelPathRequest) Reset()

func (*GetBaseModelPathRequest) String

func (x *GetBaseModelPathRequest) String() string

type GetBaseModelPathResponse

// GetBaseModelPathResponse is the response message returned by the
// GetBaseModelPath RPC of ModelsWorkerService.
type GetBaseModelPathResponse struct {
	Formats []ModelFormat `protobuf:"varint,3,rep,packed,name=formats,proto3,enum=llmariner.models.server.v1.ModelFormat" json:"formats,omitempty"`
	Path    string        `protobuf:"bytes,1,opt,name=path,proto3" json:"path,omitempty"`
	// gguf_model_path is the path of the GGUF model. Set if the model supports the GGUF format.
	GgufModelPath string `protobuf:"bytes,2,opt,name=gguf_model_path,json=ggufModelPath,proto3" json:"gguf_model_path,omitempty"`
	// contains filtered or unexported fields
}

func (*GetBaseModelPathResponse) Descriptor deprecated

func (*GetBaseModelPathResponse) Descriptor() ([]byte, []int)

Deprecated: Use GetBaseModelPathResponse.ProtoReflect.Descriptor instead.

func (*GetBaseModelPathResponse) GetFormats

func (x *GetBaseModelPathResponse) GetFormats() []ModelFormat

func (*GetBaseModelPathResponse) GetGgufModelPath

func (x *GetBaseModelPathResponse) GetGgufModelPath() string

func (*GetBaseModelPathResponse) GetPath

func (x *GetBaseModelPathResponse) GetPath() string

func (*GetBaseModelPathResponse) ProtoMessage

func (*GetBaseModelPathResponse) ProtoMessage()

func (*GetBaseModelPathResponse) ProtoReflect

func (x *GetBaseModelPathResponse) ProtoReflect() protoreflect.Message

func (*GetBaseModelPathResponse) Reset

func (x *GetBaseModelPathResponse) Reset()

func (*GetBaseModelPathResponse) String

func (x *GetBaseModelPathResponse) String() string

type GetModelAttributesRequest

type GetModelAttributesRequest struct {
	Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	// contains filtered or unexported fields
}

func (*GetModelAttributesRequest) Descriptor deprecated

func (*GetModelAttributesRequest) Descriptor() ([]byte, []int)

Deprecated: Use GetModelAttributesRequest.ProtoReflect.Descriptor instead.

func (*GetModelAttributesRequest) GetId

func (x *GetModelAttributesRequest) GetId() string

func (*GetModelAttributesRequest) ProtoMessage

func (*GetModelAttributesRequest) ProtoMessage()

func (*GetModelAttributesRequest) ProtoReflect

func (*GetModelAttributesRequest) Reset

func (x *GetModelAttributesRequest) Reset()

func (*GetModelAttributesRequest) String

func (x *GetModelAttributesRequest) String() string

type GetModelPathRequest

type GetModelPathRequest struct {
	Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	// contains filtered or unexported fields
}

GetModelPathRequest is deprecated, use GetModelAttributesRequest instead.

func (*GetModelPathRequest) Descriptor deprecated

func (*GetModelPathRequest) Descriptor() ([]byte, []int)

Deprecated: Use GetModelPathRequest.ProtoReflect.Descriptor instead.

func (*GetModelPathRequest) GetId

func (x *GetModelPathRequest) GetId() string

func (*GetModelPathRequest) ProtoMessage

func (*GetModelPathRequest) ProtoMessage()

func (*GetModelPathRequest) ProtoReflect

func (x *GetModelPathRequest) ProtoReflect() protoreflect.Message

func (*GetModelPathRequest) Reset

func (x *GetModelPathRequest) Reset()

func (*GetModelPathRequest) String

func (x *GetModelPathRequest) String() string

type GetModelPathResponse

type GetModelPathResponse struct {
	Path string `protobuf:"bytes,1,opt,name=path,proto3" json:"path,omitempty"`
	// contains filtered or unexported fields
}

GetModelPathResponse is deprecated, use GetModelAttributesResponse instead.

func (*GetModelPathResponse) Descriptor deprecated

func (*GetModelPathResponse) Descriptor() ([]byte, []int)

Deprecated: Use GetModelPathResponse.ProtoReflect.Descriptor instead.

func (*GetModelPathResponse) GetPath

func (x *GetModelPathResponse) GetPath() string

func (*GetModelPathResponse) ProtoMessage

func (*GetModelPathResponse) ProtoMessage()

func (*GetModelPathResponse) ProtoReflect

func (x *GetModelPathResponse) ProtoReflect() protoreflect.Message

func (*GetModelPathResponse) Reset

func (x *GetModelPathResponse) Reset()

func (*GetModelPathResponse) String

func (x *GetModelPathResponse) String() string

type GetModelRequest

type GetModelRequest struct {
	Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	// contains filtered or unexported fields
}

func (*GetModelRequest) Descriptor deprecated

func (*GetModelRequest) Descriptor() ([]byte, []int)

Deprecated: Use GetModelRequest.ProtoReflect.Descriptor instead.

func (*GetModelRequest) GetId

func (x *GetModelRequest) GetId() string

func (*GetModelRequest) ProtoMessage

func (*GetModelRequest) ProtoMessage()

func (*GetModelRequest) ProtoReflect

func (x *GetModelRequest) ProtoReflect() protoreflect.Message

func (*GetModelRequest) Reset

func (x *GetModelRequest) Reset()

func (*GetModelRequest) String

func (x *GetModelRequest) String() string

type GetStorageConfigRequest

type GetStorageConfigRequest struct {
	// contains filtered or unexported fields
}

func (*GetStorageConfigRequest) Descriptor deprecated

func (*GetStorageConfigRequest) Descriptor() ([]byte, []int)

Deprecated: Use GetStorageConfigRequest.ProtoReflect.Descriptor instead.

func (*GetStorageConfigRequest) ProtoMessage

func (*GetStorageConfigRequest) ProtoMessage()

func (*GetStorageConfigRequest) ProtoReflect

func (x *GetStorageConfigRequest) ProtoReflect() protoreflect.Message

func (*GetStorageConfigRequest) Reset

func (x *GetStorageConfigRequest) Reset()

func (*GetStorageConfigRequest) String

func (x *GetStorageConfigRequest) String() string

type ListBaseModelsRequest

type ListBaseModelsRequest struct {
	// contains filtered or unexported fields
}

func (*ListBaseModelsRequest) Descriptor deprecated

func (*ListBaseModelsRequest) Descriptor() ([]byte, []int)

Deprecated: Use ListBaseModelsRequest.ProtoReflect.Descriptor instead.

func (*ListBaseModelsRequest) ProtoMessage

func (*ListBaseModelsRequest) ProtoMessage()

func (*ListBaseModelsRequest) ProtoReflect

func (x *ListBaseModelsRequest) ProtoReflect() protoreflect.Message

func (*ListBaseModelsRequest) Reset

func (x *ListBaseModelsRequest) Reset()

func (*ListBaseModelsRequest) String

func (x *ListBaseModelsRequest) String() string

type ListBaseModelsResponse

type ListBaseModelsResponse struct {
	Object string       `protobuf:"bytes,1,opt,name=object,proto3" json:"object,omitempty"`
	Data   []*BaseModel `protobuf:"bytes,2,rep,name=data,proto3" json:"data,omitempty"`
	// contains filtered or unexported fields
}

func (*ListBaseModelsResponse) Descriptor deprecated

func (*ListBaseModelsResponse) Descriptor() ([]byte, []int)

Deprecated: Use ListBaseModelsResponse.ProtoReflect.Descriptor instead.

func (*ListBaseModelsResponse) GetData

func (x *ListBaseModelsResponse) GetData() []*BaseModel

func (*ListBaseModelsResponse) GetObject

func (x *ListBaseModelsResponse) GetObject() string

func (*ListBaseModelsResponse) ProtoMessage

func (*ListBaseModelsResponse) ProtoMessage()

func (*ListBaseModelsResponse) ProtoReflect

func (x *ListBaseModelsResponse) ProtoReflect() protoreflect.Message

func (*ListBaseModelsResponse) Reset

func (x *ListBaseModelsResponse) Reset()

func (*ListBaseModelsResponse) String

func (x *ListBaseModelsResponse) String() string

type ListModelsRequest

type ListModelsRequest struct {
	// contains filtered or unexported fields
}

func (*ListModelsRequest) Descriptor deprecated

func (*ListModelsRequest) Descriptor() ([]byte, []int)

Deprecated: Use ListModelsRequest.ProtoReflect.Descriptor instead.

func (*ListModelsRequest) ProtoMessage

func (*ListModelsRequest) ProtoMessage()

func (*ListModelsRequest) ProtoReflect

func (x *ListModelsRequest) ProtoReflect() protoreflect.Message

func (*ListModelsRequest) Reset

func (x *ListModelsRequest) Reset()

func (*ListModelsRequest) String

func (x *ListModelsRequest) String() string

type ListModelsResponse

type ListModelsResponse struct {
	Object string   `protobuf:"bytes,1,opt,name=object,proto3" json:"object,omitempty"`
	Data   []*Model `protobuf:"bytes,2,rep,name=data,proto3" json:"data,omitempty"`
	// contains filtered or unexported fields
}

func (*ListModelsResponse) Descriptor deprecated

func (*ListModelsResponse) Descriptor() ([]byte, []int)

Deprecated: Use ListModelsResponse.ProtoReflect.Descriptor instead.

func (*ListModelsResponse) GetData

func (x *ListModelsResponse) GetData() []*Model

func (*ListModelsResponse) GetObject

func (x *ListModelsResponse) GetObject() string

func (*ListModelsResponse) ProtoMessage

func (*ListModelsResponse) ProtoMessage()

func (*ListModelsResponse) ProtoReflect

func (x *ListModelsResponse) ProtoReflect() protoreflect.Message

func (*ListModelsResponse) Reset

func (x *ListModelsResponse) Reset()

func (*ListModelsResponse) String

func (x *ListModelsResponse) String() string

type Model

type Model struct {
	Id      string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	Created int64  `protobuf:"varint,2,opt,name=created,proto3" json:"created,omitempty"`
	Object  string `protobuf:"bytes,3,opt,name=object,proto3" json:"object,omitempty"`
	OwnedBy string `protobuf:"bytes,4,opt,name=owned_by,json=ownedBy,proto3" json:"owned_by,omitempty"`
	// contains filtered or unexported fields
}

func (*Model) Descriptor deprecated

func (*Model) Descriptor() ([]byte, []int)

Deprecated: Use Model.ProtoReflect.Descriptor instead.

func (*Model) GetCreated

func (x *Model) GetCreated() int64

func (*Model) GetId

func (x *Model) GetId() string

func (*Model) GetObject

func (x *Model) GetObject() string

func (*Model) GetOwnedBy

func (x *Model) GetOwnedBy() string

func (*Model) ProtoMessage

func (*Model) ProtoMessage()

func (*Model) ProtoReflect

func (x *Model) ProtoReflect() protoreflect.Message

func (*Model) Reset

func (x *Model) Reset()

func (*Model) String

func (x *Model) String() string

type ModelAttributes

type ModelAttributes struct {
	Path         string           `protobuf:"bytes,1,opt,name=path,proto3" json:"path,omitempty"`
	BaseModel    string           `protobuf:"bytes,2,opt,name=base_model,json=baseModel,proto3" json:"base_model,omitempty"`
	Adapter      AdapterType      `protobuf:"varint,3,opt,name=adapter,proto3,enum=llmariner.models.server.v1.AdapterType" json:"adapter,omitempty"`
	Quantization QuantizationType `` /* 127-byte string literal not displayed */
	// contains filtered or unexported fields
}

func (*ModelAttributes) Descriptor deprecated

func (*ModelAttributes) Descriptor() ([]byte, []int)

Deprecated: Use ModelAttributes.ProtoReflect.Descriptor instead.

func (*ModelAttributes) GetAdapter

func (x *ModelAttributes) GetAdapter() AdapterType

func (*ModelAttributes) GetBaseModel

func (x *ModelAttributes) GetBaseModel() string

func (*ModelAttributes) GetPath

func (x *ModelAttributes) GetPath() string

func (*ModelAttributes) GetQuantization

func (x *ModelAttributes) GetQuantization() QuantizationType

func (*ModelAttributes) ProtoMessage

func (*ModelAttributes) ProtoMessage()

func (*ModelAttributes) ProtoReflect

func (x *ModelAttributes) ProtoReflect() protoreflect.Message

func (*ModelAttributes) Reset

func (x *ModelAttributes) Reset()

func (*ModelAttributes) String

func (x *ModelAttributes) String() string

type ModelFormat

type ModelFormat int32
const (
	ModelFormat_MODEL_FORMAT_UNSPECIFIED  ModelFormat = 0
	ModelFormat_MODEL_FORMAT_GGUF         ModelFormat = 1
	ModelFormat_MODEL_FORMAT_HUGGING_FACE ModelFormat = 2
	// Model format for Nvidia Triton Inference Server. These model files include the tokenizer
	// configuration of the original model, compiled model files for the TensorRT-LLM backend, and
	// configuration files for Triton Inference Server.
	ModelFormat_MODEL_FORMAT_NVIDIA_TRITON ModelFormat = 3
)

func (ModelFormat) Descriptor

func (ModelFormat) Enum

func (x ModelFormat) Enum() *ModelFormat

func (ModelFormat) EnumDescriptor deprecated

func (ModelFormat) EnumDescriptor() ([]byte, []int)

Deprecated: Use ModelFormat.Descriptor instead.

func (ModelFormat) Number

func (x ModelFormat) Number() protoreflect.EnumNumber

func (ModelFormat) String

func (x ModelFormat) String() string

func (ModelFormat) Type

type ModelFormats

type ModelFormats struct {
	Formats []ModelFormat `protobuf:"varint,1,rep,packed,name=formats,proto3,enum=llmariner.models.server.v1.ModelFormat" json:"formats,omitempty"`
	// contains filtered or unexported fields
}

ModelFormats is a list of model formats. Used to store marshalled data into a store.

func (*ModelFormats) Descriptor deprecated

func (*ModelFormats) Descriptor() ([]byte, []int)

Deprecated: Use ModelFormats.ProtoReflect.Descriptor instead.

func (*ModelFormats) GetFormats

func (x *ModelFormats) GetFormats() []ModelFormat

func (*ModelFormats) ProtoMessage

func (*ModelFormats) ProtoMessage()

func (*ModelFormats) ProtoReflect

func (x *ModelFormats) ProtoReflect() protoreflect.Message

func (*ModelFormats) Reset

func (x *ModelFormats) Reset()

func (*ModelFormats) String

func (x *ModelFormats) String() string

type ModelsServiceClient

type ModelsServiceClient interface {
	ListModels(ctx context.Context, in *ListModelsRequest, opts ...grpc.CallOption) (*ListModelsResponse, error)
	GetModel(ctx context.Context, in *GetModelRequest, opts ...grpc.CallOption) (*Model, error)
	DeleteModel(ctx context.Context, in *DeleteModelRequest, opts ...grpc.CallOption) (*DeleteModelResponse, error)
	// The following API endpoints are not part of the OpenAPI API specification.
	ListBaseModels(ctx context.Context, in *ListBaseModelsRequest, opts ...grpc.CallOption) (*ListBaseModelsResponse, error)
}

ModelsServiceClient is the client API for ModelsService service.

For semantics around ctx use and closing/ending streaming RPCs, please refer to https://pkg.go.dev/google.golang.org/grpc/?tab=doc#ClientConn.NewStream.

type ModelsServiceServer

type ModelsServiceServer interface {
	ListModels(context.Context, *ListModelsRequest) (*ListModelsResponse, error)
	GetModel(context.Context, *GetModelRequest) (*Model, error)
	DeleteModel(context.Context, *DeleteModelRequest) (*DeleteModelResponse, error)
	// The following API endpoints are not part of the OpenAPI API specification.
	ListBaseModels(context.Context, *ListBaseModelsRequest) (*ListBaseModelsResponse, error)
	// contains filtered or unexported methods
}

ModelsServiceServer is the server API for ModelsService service. All implementations must embed UnimplementedModelsServiceServer for forward compatibility.

type ModelsWorkerServiceClient

type ModelsWorkerServiceClient interface {
	// CreateStorageConfig creates a new storage config. Used by model-manager-loader.
	CreateStorageConfig(ctx context.Context, in *CreateStorageConfigRequest, opts ...grpc.CallOption) (*StorageConfig, error)
	// GetStorageConfig gets a storage config. Used by model-manager-loader.
	GetStorageConfig(ctx context.Context, in *GetStorageConfigRequest, opts ...grpc.CallOption) (*StorageConfig, error)
	// GetModel gets a model. Used by inference-manager-engine.
	GetModel(ctx context.Context, in *GetModelRequest, opts ...grpc.CallOption) (*Model, error)
	// RegisterModel registers a new fine-tuned model. Used by job-manager-dispatcher and model-manager-loader.
	// The model is not published until PublishModel is called.
	RegisterModel(ctx context.Context, in *RegisterModelRequest, opts ...grpc.CallOption) (*RegisterModelResponse, error)
	// PublishModel publishes the fine-tuned model. Used by job-manager-dispatcher and model-manager-loader.
	PublishModel(ctx context.Context, in *PublishModelRequest, opts ...grpc.CallOption) (*PublishModelResponse, error)
	// GetModelPath returns the path of the model. Used by inference-manager-engine and model-manager-loader.
	GetModelPath(ctx context.Context, in *GetModelPathRequest, opts ...grpc.CallOption) (*GetModelPathResponse, error)
	// GetModelAttributes returns the attributes of the model. Used by inference-manager-engine.
	GetModelAttributes(ctx context.Context, in *GetModelAttributesRequest, opts ...grpc.CallOption) (*ModelAttributes, error)
	// CreateBaseModel creates a new base model. Used by model-manager-loader.
	CreateBaseModel(ctx context.Context, in *CreateBaseModelRequest, opts ...grpc.CallOption) (*BaseModel, error)
	// GetBaseModelPath returns the path of the base model. Used by job-manager-dispatcher,
	// inference-manager-engine, and model-manager-loader.
	GetBaseModelPath(ctx context.Context, in *GetBaseModelPathRequest, opts ...grpc.CallOption) (*GetBaseModelPathResponse, error)
}

ModelsWorkerServiceClient is the client API for ModelsWorkerService service.

For semantics around ctx use and closing/ending streaming RPCs, please refer to https://pkg.go.dev/google.golang.org/grpc/?tab=doc#ClientConn.NewStream.

type ModelsWorkerServiceServer

type ModelsWorkerServiceServer interface {
	// CreateStorageConfig creates a new storage config. Used by model-manager-loader.
	CreateStorageConfig(context.Context, *CreateStorageConfigRequest) (*StorageConfig, error)
	// GetStorageConfig gets a storage config. Used by model-manager-loader.
	GetStorageConfig(context.Context, *GetStorageConfigRequest) (*StorageConfig, error)
	// GetModel gets a model. Used by inference-manager-engine.
	GetModel(context.Context, *GetModelRequest) (*Model, error)
	// RegisterModel registers a new fine-tuned model. Used by job-manager-dispatcher and model-manager-loader.
	// The model is not published until PublishModel is called.
	RegisterModel(context.Context, *RegisterModelRequest) (*RegisterModelResponse, error)
	// PublishModel publishes the fine-tuned model. Used by job-manager-dispatcher and model-manager-loader.
	PublishModel(context.Context, *PublishModelRequest) (*PublishModelResponse, error)
	// GetModelPath returns the path of the model. Used by inference-manager-engine and model-manager-loader.
	GetModelPath(context.Context, *GetModelPathRequest) (*GetModelPathResponse, error)
	// GetModelAttributes returns the attributes of the model. Used by inference-manager-engine.
	GetModelAttributes(context.Context, *GetModelAttributesRequest) (*ModelAttributes, error)
	// CreateBaseModel creates a new base model. Used by model-manager-loader.
	CreateBaseModel(context.Context, *CreateBaseModelRequest) (*BaseModel, error)
	// GetBaseModelPath returns the path of the base model. Used by job-manager-dispatcher,
	// inference-manager-engine, and model-manager-loader.
	GetBaseModelPath(context.Context, *GetBaseModelPathRequest) (*GetBaseModelPathResponse, error)
	// contains filtered or unexported methods
}

ModelsWorkerServiceServer is the server API for ModelsWorkerService service. All implementations must embed UnimplementedModelsWorkerServiceServer for forward compatibility.

type PublishModelRequest

type PublishModelRequest struct {
	Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	// contains filtered or unexported fields
}

func (*PublishModelRequest) Descriptor deprecated

func (*PublishModelRequest) Descriptor() ([]byte, []int)

Deprecated: Use PublishModelRequest.ProtoReflect.Descriptor instead.

func (*PublishModelRequest) GetId

func (x *PublishModelRequest) GetId() string

func (*PublishModelRequest) ProtoMessage

func (*PublishModelRequest) ProtoMessage()

func (*PublishModelRequest) ProtoReflect

func (x *PublishModelRequest) ProtoReflect() protoreflect.Message

func (*PublishModelRequest) Reset

func (x *PublishModelRequest) Reset()

func (*PublishModelRequest) String

func (x *PublishModelRequest) String() string

type PublishModelResponse

// PublishModelResponse is the response message returned by
// ModelsWorkerServiceServer.PublishModel. It has no exported fields.
type PublishModelResponse struct {
	// contains filtered or unexported fields
}

func (*PublishModelResponse) Descriptor deprecated

func (*PublishModelResponse) Descriptor() ([]byte, []int)

Deprecated: Use PublishModelResponse.ProtoReflect.Descriptor instead.

func (*PublishModelResponse) ProtoMessage

func (*PublishModelResponse) ProtoMessage()

func (*PublishModelResponse) ProtoReflect

func (x *PublishModelResponse) ProtoReflect() protoreflect.Message

func (*PublishModelResponse) Reset

func (x *PublishModelResponse) Reset()

func (*PublishModelResponse) String

func (x *PublishModelResponse) String() string

type QuantizationType

// QuantizationType is the int32-backed enum used for the Quantization field
// of RegisterModelRequest.
type QuantizationType int32
// Enum values for QuantizationType. The numbers and names match the entries
// of the QuantizationType_name and QuantizationType_value maps.
const (
	// QuantizationType_QUANTIZATION_TYPE_UNSPECIFIED is the zero value of the enum.
	QuantizationType_QUANTIZATION_TYPE_UNSPECIFIED QuantizationType = 0
	// QuantizationType_QUANTIZATION_TYPE_GGUF maps to "QUANTIZATION_TYPE_GGUF".
	QuantizationType_QUANTIZATION_TYPE_GGUF        QuantizationType = 1
	// QuantizationType_QUANTIZATION_TYPE_AWQ maps to "QUANTIZATION_TYPE_AWQ".
	QuantizationType_QUANTIZATION_TYPE_AWQ         QuantizationType = 2
)

func (QuantizationType) Descriptor

func (QuantizationType) Enum

func (QuantizationType) EnumDescriptor deprecated

func (QuantizationType) EnumDescriptor() ([]byte, []int)

Deprecated: Use QuantizationType.Descriptor instead.

func (QuantizationType) Number

func (QuantizationType) String

func (x QuantizationType) String() string

func (QuantizationType) Type

type RegisterModelRequest

// RegisterModelRequest is the request message accepted by
// ModelsWorkerServiceServer.RegisterModel.
type RegisterModelRequest struct {

	// id is the model name. It is carried as protobuf field 7.
	Id        string `protobuf:"bytes,7,opt,name=id,proto3" json:"id,omitempty"`
	// NOTE(review): presumably the ID of the base model the registered model
	// derives from — confirm against the .proto.
	BaseModel string `protobuf:"bytes,1,opt,name=base_model,json=baseModel,proto3" json:"base_model,omitempty"`
	// suffix is deprecated; use adapter and quantization instead.
	Suffix         string           `protobuf:"bytes,2,opt,name=suffix,proto3" json:"suffix,omitempty"`
	OrganizationId string           `protobuf:"bytes,3,opt,name=organization_id,json=organizationId,proto3" json:"organization_id,omitempty"`
	ProjectId      string           `protobuf:"bytes,4,opt,name=project_id,json=projectId,proto3" json:"project_id,omitempty"`
	// adapter is one of the two fields that replace the deprecated suffix.
	Adapter        AdapterType      `protobuf:"varint,5,opt,name=adapter,proto3,enum=llmariner.models.server.v1.AdapterType" json:"adapter,omitempty"`
	// quantization is the other field that replaces the deprecated suffix.
	// Its struct tag is elided by the documentation renderer.
	Quantization   QuantizationType `` /* 127-byte string literal not displayed */
	// NOTE(review): presumably the storage path of the model — confirm
	// against the .proto. It is carried as protobuf field 8.
	Path           string           `protobuf:"bytes,8,opt,name=path,proto3" json:"path,omitempty"`
	// contains filtered or unexported fields
}

func (*RegisterModelRequest) Descriptor deprecated

func (*RegisterModelRequest) Descriptor() ([]byte, []int)

Deprecated: Use RegisterModelRequest.ProtoReflect.Descriptor instead.

func (*RegisterModelRequest) GetAdapter

func (x *RegisterModelRequest) GetAdapter() AdapterType

func (*RegisterModelRequest) GetBaseModel

func (x *RegisterModelRequest) GetBaseModel() string

func (*RegisterModelRequest) GetId added in v0.119.0

func (x *RegisterModelRequest) GetId() string

func (*RegisterModelRequest) GetOrganizationId

func (x *RegisterModelRequest) GetOrganizationId() string

func (*RegisterModelRequest) GetPath added in v0.119.0

func (x *RegisterModelRequest) GetPath() string

func (*RegisterModelRequest) GetProjectId

func (x *RegisterModelRequest) GetProjectId() string

func (*RegisterModelRequest) GetQuantization

func (x *RegisterModelRequest) GetQuantization() QuantizationType

func (*RegisterModelRequest) GetSuffix

func (x *RegisterModelRequest) GetSuffix() string

func (*RegisterModelRequest) ProtoMessage

func (*RegisterModelRequest) ProtoMessage()

func (*RegisterModelRequest) ProtoReflect

func (x *RegisterModelRequest) ProtoReflect() protoreflect.Message

func (*RegisterModelRequest) Reset

func (x *RegisterModelRequest) Reset()

func (*RegisterModelRequest) String

func (x *RegisterModelRequest) String() string

type RegisterModelResponse

// RegisterModelResponse is the response message returned by
// ModelsWorkerServiceServer.RegisterModel.
type RegisterModelResponse struct {
	// NOTE(review): presumably the ID of the newly registered model — confirm
	// against the .proto.
	Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"`
	// path is the path where the model is stored.
	Path string `protobuf:"bytes,2,opt,name=path,proto3" json:"path,omitempty"`
	// contains filtered or unexported fields
}

func (*RegisterModelResponse) Descriptor deprecated

func (*RegisterModelResponse) Descriptor() ([]byte, []int)

Deprecated: Use RegisterModelResponse.ProtoReflect.Descriptor instead.

func (*RegisterModelResponse) GetId

func (x *RegisterModelResponse) GetId() string

func (*RegisterModelResponse) GetPath

func (x *RegisterModelResponse) GetPath() string

func (*RegisterModelResponse) ProtoMessage

func (*RegisterModelResponse) ProtoMessage()

func (*RegisterModelResponse) ProtoReflect

func (x *RegisterModelResponse) ProtoReflect() protoreflect.Message

func (*RegisterModelResponse) Reset

func (x *RegisterModelResponse) Reset()

func (*RegisterModelResponse) String

func (x *RegisterModelResponse) String() string

type StorageConfig

// StorageConfig is a protobuf message with a single exported field, PathPrefix.
// NOTE(review): presumably the message handled by the CreateStorageConfig and
// GetStorageConfig RPCs of ModelsWorkerService — confirm against the .proto.
type StorageConfig struct {
	// PathPrefix is carried as protobuf field 1 ("path_prefix", JSON name "pathPrefix").
	PathPrefix string `protobuf:"bytes,1,opt,name=path_prefix,json=pathPrefix,proto3" json:"path_prefix,omitempty"`
	// contains filtered or unexported fields
}

func (*StorageConfig) Descriptor deprecated

func (*StorageConfig) Descriptor() ([]byte, []int)

Deprecated: Use StorageConfig.ProtoReflect.Descriptor instead.

func (*StorageConfig) GetPathPrefix

func (x *StorageConfig) GetPathPrefix() string

func (*StorageConfig) ProtoMessage

func (*StorageConfig) ProtoMessage()

func (*StorageConfig) ProtoReflect

func (x *StorageConfig) ProtoReflect() protoreflect.Message

func (*StorageConfig) Reset

func (x *StorageConfig) Reset()

func (*StorageConfig) String

func (x *StorageConfig) String() string

type UnimplementedModelsServiceServer

// UnimplementedModelsServiceServer must be embedded to have forward-compatible
// implementations. Its method set is DeleteModel, GetModel, ListBaseModels,
// and ListModels.
type UnimplementedModelsServiceServer struct {
}

UnimplementedModelsServiceServer must be embedded to have forward compatible implementations.

func (UnimplementedModelsServiceServer) DeleteModel

func (UnimplementedModelsServiceServer) GetModel

func (UnimplementedModelsServiceServer) ListBaseModels

func (UnimplementedModelsServiceServer) ListModels

type UnimplementedModelsWorkerServiceServer

// UnimplementedModelsWorkerServiceServer must be embedded to have
// forward-compatible implementations. Its method set is CreateBaseModel,
// CreateStorageConfig, GetBaseModelPath, GetModel, GetModelAttributes,
// GetModelPath, GetStorageConfig, PublishModel, and RegisterModel.
type UnimplementedModelsWorkerServiceServer struct {
}

UnimplementedModelsWorkerServiceServer must be embedded to have forward compatible implementations.

func (UnimplementedModelsWorkerServiceServer) CreateBaseModel

func (UnimplementedModelsWorkerServiceServer) CreateStorageConfig

func (UnimplementedModelsWorkerServiceServer) GetBaseModelPath

func (UnimplementedModelsWorkerServiceServer) GetModel

func (UnimplementedModelsWorkerServiceServer) GetModelAttributes

func (UnimplementedModelsWorkerServiceServer) GetModelPath

func (UnimplementedModelsWorkerServiceServer) GetStorageConfig

func (UnimplementedModelsWorkerServiceServer) PublishModel

func (UnimplementedModelsWorkerServiceServer) RegisterModel

type UnsafeModelsServiceServer

// UnsafeModelsServiceServer may be embedded to opt out of forward
// compatibility for this service. Its use is not recommended: methods later
// added to ModelsServiceServer will then result in compilation errors.
type UnsafeModelsServiceServer interface {
	// contains filtered or unexported methods
}

UnsafeModelsServiceServer may be embedded to opt out of forward compatibility for this service. Use of this interface is not recommended, because any method later added to ModelsServiceServer will result in compilation errors.

type UnsafeModelsWorkerServiceServer

// UnsafeModelsWorkerServiceServer may be embedded to opt out of forward
// compatibility for this service. Its use is not recommended: methods later
// added to ModelsWorkerServiceServer will then result in compilation errors.
type UnsafeModelsWorkerServiceServer interface {
	// contains filtered or unexported methods
}

UnsafeModelsWorkerServiceServer may be embedded to opt out of forward compatibility for this service. Use of this interface is not recommended, because any method later added to ModelsWorkerServiceServer will result in compilation errors.

Directories

Path Synopsis

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL