Documentation ¶
Overview ¶
Package v1 is a reverse proxy.
It translates gRPC into RESTful JSON APIs.
Index ¶
- Variables
- func RegisterModelsServiceHandler(ctx context.Context, mux *runtime.ServeMux, conn *grpc.ClientConn) error
- func RegisterModelsServiceHandlerClient(ctx context.Context, mux *runtime.ServeMux, client ModelsServiceClient) error
- func RegisterModelsServiceHandlerFromEndpoint(ctx context.Context, mux *runtime.ServeMux, endpoint string, ...) (err error)
- func RegisterModelsServiceHandlerServer(ctx context.Context, mux *runtime.ServeMux, server ModelsServiceServer) error
- func RegisterModelsServiceServer(s grpc.ServiceRegistrar, srv ModelsServiceServer)
- func RegisterModelsWorkerServiceServer(s grpc.ServiceRegistrar, srv ModelsWorkerServiceServer)
- type AdapterType
- func (AdapterType) Descriptor() protoreflect.EnumDescriptor
- func (x AdapterType) Enum() *AdapterType
- func (AdapterType) EnumDescriptor() ([]byte, []int)deprecated
- func (x AdapterType) Number() protoreflect.EnumNumber
- func (x AdapterType) String() string
- func (AdapterType) Type() protoreflect.EnumType
- type BaseModel
- func (*BaseModel) Descriptor() ([]byte, []int)deprecated
- func (x *BaseModel) GetCreated() int64
- func (x *BaseModel) GetId() string
- func (x *BaseModel) GetObject() string
- func (*BaseModel) ProtoMessage()
- func (x *BaseModel) ProtoReflect() protoreflect.Message
- func (x *BaseModel) Reset()
- func (x *BaseModel) String() string
- type CreateBaseModelRequest
- func (*CreateBaseModelRequest) Descriptor() ([]byte, []int)deprecated
- func (x *CreateBaseModelRequest) GetFormats() []ModelFormat
- func (x *CreateBaseModelRequest) GetGgufModelPath() string
- func (x *CreateBaseModelRequest) GetId() string
- func (x *CreateBaseModelRequest) GetPath() string
- func (*CreateBaseModelRequest) ProtoMessage()
- func (x *CreateBaseModelRequest) ProtoReflect() protoreflect.Message
- func (x *CreateBaseModelRequest) Reset()
- func (x *CreateBaseModelRequest) String() string
- type CreateHFModelRepoRequest
- func (*CreateHFModelRepoRequest) Descriptor() ([]byte, []int)deprecated
- func (x *CreateHFModelRepoRequest) GetName() string
- func (*CreateHFModelRepoRequest) ProtoMessage()
- func (x *CreateHFModelRepoRequest) ProtoReflect() protoreflect.Message
- func (x *CreateHFModelRepoRequest) Reset()
- func (x *CreateHFModelRepoRequest) String() string
- type CreateStorageConfigRequest
- func (*CreateStorageConfigRequest) Descriptor() ([]byte, []int)deprecated
- func (x *CreateStorageConfigRequest) GetPathPrefix() string
- func (*CreateStorageConfigRequest) ProtoMessage()
- func (x *CreateStorageConfigRequest) ProtoReflect() protoreflect.Message
- func (x *CreateStorageConfigRequest) Reset()
- func (x *CreateStorageConfigRequest) String() string
- type DeleteModelRequest
- type DeleteModelResponse
- func (*DeleteModelResponse) Descriptor() ([]byte, []int)deprecated
- func (x *DeleteModelResponse) GetDeleted() bool
- func (x *DeleteModelResponse) GetId() string
- func (x *DeleteModelResponse) GetObject() string
- func (*DeleteModelResponse) ProtoMessage()
- func (x *DeleteModelResponse) ProtoReflect() protoreflect.Message
- func (x *DeleteModelResponse) Reset()
- func (x *DeleteModelResponse) String() string
- type GetBaseModelPathRequest
- func (*GetBaseModelPathRequest) Descriptor() ([]byte, []int)deprecated
- func (x *GetBaseModelPathRequest) GetId() string
- func (*GetBaseModelPathRequest) ProtoMessage()
- func (x *GetBaseModelPathRequest) ProtoReflect() protoreflect.Message
- func (x *GetBaseModelPathRequest) Reset()
- func (x *GetBaseModelPathRequest) String() string
- type GetBaseModelPathResponse
- func (*GetBaseModelPathResponse) Descriptor() ([]byte, []int)deprecated
- func (x *GetBaseModelPathResponse) GetFormats() []ModelFormat
- func (x *GetBaseModelPathResponse) GetGgufModelPath() string
- func (x *GetBaseModelPathResponse) GetPath() string
- func (*GetBaseModelPathResponse) ProtoMessage()
- func (x *GetBaseModelPathResponse) ProtoReflect() protoreflect.Message
- func (x *GetBaseModelPathResponse) Reset()
- func (x *GetBaseModelPathResponse) String() string
- type GetHFModelRepoRequest
- func (*GetHFModelRepoRequest) Descriptor() ([]byte, []int)deprecated
- func (x *GetHFModelRepoRequest) GetName() string
- func (*GetHFModelRepoRequest) ProtoMessage()
- func (x *GetHFModelRepoRequest) ProtoReflect() protoreflect.Message
- func (x *GetHFModelRepoRequest) Reset()
- func (x *GetHFModelRepoRequest) String() string
- type GetModelAttributesRequest
- func (*GetModelAttributesRequest) Descriptor() ([]byte, []int)deprecated
- func (x *GetModelAttributesRequest) GetId() string
- func (*GetModelAttributesRequest) ProtoMessage()
- func (x *GetModelAttributesRequest) ProtoReflect() protoreflect.Message
- func (x *GetModelAttributesRequest) Reset()
- func (x *GetModelAttributesRequest) String() string
- type GetModelPathRequest
- func (*GetModelPathRequest) Descriptor() ([]byte, []int)deprecated
- func (x *GetModelPathRequest) GetId() string
- func (*GetModelPathRequest) ProtoMessage()
- func (x *GetModelPathRequest) ProtoReflect() protoreflect.Message
- func (x *GetModelPathRequest) Reset()
- func (x *GetModelPathRequest) String() string
- type GetModelPathResponse
- func (*GetModelPathResponse) Descriptor() ([]byte, []int)deprecated
- func (x *GetModelPathResponse) GetPath() string
- func (*GetModelPathResponse) ProtoMessage()
- func (x *GetModelPathResponse) ProtoReflect() protoreflect.Message
- func (x *GetModelPathResponse) Reset()
- func (x *GetModelPathResponse) String() string
- type GetModelRequest
- type GetStorageConfigRequest
- type HFModelRepo
- type ListBaseModelsRequest
- type ListBaseModelsResponse
- func (*ListBaseModelsResponse) Descriptor() ([]byte, []int)deprecated
- func (x *ListBaseModelsResponse) GetData() []*BaseModel
- func (x *ListBaseModelsResponse) GetObject() string
- func (*ListBaseModelsResponse) ProtoMessage()
- func (x *ListBaseModelsResponse) ProtoReflect() protoreflect.Message
- func (x *ListBaseModelsResponse) Reset()
- func (x *ListBaseModelsResponse) String() string
- type ListModelsRequest
- type ListModelsResponse
- func (*ListModelsResponse) Descriptor() ([]byte, []int)deprecated
- func (x *ListModelsResponse) GetData() []*Model
- func (x *ListModelsResponse) GetObject() string
- func (*ListModelsResponse) ProtoMessage()
- func (x *ListModelsResponse) ProtoReflect() protoreflect.Message
- func (x *ListModelsResponse) Reset()
- func (x *ListModelsResponse) String() string
- type Model
- func (*Model) Descriptor() ([]byte, []int)deprecated
- func (x *Model) GetCreated() int64
- func (x *Model) GetId() string
- func (x *Model) GetObject() string
- func (x *Model) GetOwnedBy() string
- func (*Model) ProtoMessage()
- func (x *Model) ProtoReflect() protoreflect.Message
- func (x *Model) Reset()
- func (x *Model) String() string
- type ModelAttributes
- func (*ModelAttributes) Descriptor() ([]byte, []int)deprecated
- func (x *ModelAttributes) GetAdapter() AdapterType
- func (x *ModelAttributes) GetBaseModel() string
- func (x *ModelAttributes) GetPath() string
- func (x *ModelAttributes) GetQuantization() QuantizationType
- func (*ModelAttributes) ProtoMessage()
- func (x *ModelAttributes) ProtoReflect() protoreflect.Message
- func (x *ModelAttributes) Reset()
- func (x *ModelAttributes) String() string
- type ModelFormat
- func (ModelFormat) Descriptor() protoreflect.EnumDescriptor
- func (x ModelFormat) Enum() *ModelFormat
- func (ModelFormat) EnumDescriptor() ([]byte, []int)deprecated
- func (x ModelFormat) Number() protoreflect.EnumNumber
- func (x ModelFormat) String() string
- func (ModelFormat) Type() protoreflect.EnumType
- type ModelFormats
- type ModelsServiceClient
- type ModelsServiceServer
- type ModelsWorkerServiceClient
- type ModelsWorkerServiceServer
- type PublishModelRequest
- func (*PublishModelRequest) Descriptor() ([]byte, []int)deprecated
- func (x *PublishModelRequest) GetId() string
- func (*PublishModelRequest) ProtoMessage()
- func (x *PublishModelRequest) ProtoReflect() protoreflect.Message
- func (x *PublishModelRequest) Reset()
- func (x *PublishModelRequest) String() string
- type PublishModelResponse
- type QuantizationType
- func (QuantizationType) Descriptor() protoreflect.EnumDescriptor
- func (x QuantizationType) Enum() *QuantizationType
- func (QuantizationType) EnumDescriptor() ([]byte, []int)deprecated
- func (x QuantizationType) Number() protoreflect.EnumNumber
- func (x QuantizationType) String() string
- func (QuantizationType) Type() protoreflect.EnumType
- type RegisterModelRequest
- func (*RegisterModelRequest) Descriptor() ([]byte, []int)deprecated
- func (x *RegisterModelRequest) GetAdapter() AdapterType
- func (x *RegisterModelRequest) GetBaseModel() string
- func (x *RegisterModelRequest) GetId() string
- func (x *RegisterModelRequest) GetOrganizationId() string
- func (x *RegisterModelRequest) GetPath() string
- func (x *RegisterModelRequest) GetProjectId() string
- func (x *RegisterModelRequest) GetQuantization() QuantizationType
- func (x *RegisterModelRequest) GetSuffix() string
- func (*RegisterModelRequest) ProtoMessage()
- func (x *RegisterModelRequest) ProtoReflect() protoreflect.Message
- func (x *RegisterModelRequest) Reset()
- func (x *RegisterModelRequest) String() string
- type RegisterModelResponse
- func (*RegisterModelResponse) Descriptor() ([]byte, []int)deprecated
- func (x *RegisterModelResponse) GetId() string
- func (x *RegisterModelResponse) GetPath() string
- func (*RegisterModelResponse) ProtoMessage()
- func (x *RegisterModelResponse) ProtoReflect() protoreflect.Message
- func (x *RegisterModelResponse) Reset()
- func (x *RegisterModelResponse) String() string
- type StorageConfig
- type UnimplementedModelsServiceServer
- func (UnimplementedModelsServiceServer) DeleteModel(context.Context, *DeleteModelRequest) (*DeleteModelResponse, error)
- func (UnimplementedModelsServiceServer) GetModel(context.Context, *GetModelRequest) (*Model, error)
- func (UnimplementedModelsServiceServer) ListBaseModels(context.Context, *ListBaseModelsRequest) (*ListBaseModelsResponse, error)
- func (UnimplementedModelsServiceServer) ListModels(context.Context, *ListModelsRequest) (*ListModelsResponse, error)
- type UnimplementedModelsWorkerServiceServer
- func (UnimplementedModelsWorkerServiceServer) CreateBaseModel(context.Context, *CreateBaseModelRequest) (*BaseModel, error)
- func (UnimplementedModelsWorkerServiceServer) CreateHFModelRepo(context.Context, *CreateHFModelRepoRequest) (*HFModelRepo, error)
- func (UnimplementedModelsWorkerServiceServer) CreateStorageConfig(context.Context, *CreateStorageConfigRequest) (*StorageConfig, error)
- func (UnimplementedModelsWorkerServiceServer) GetBaseModelPath(context.Context, *GetBaseModelPathRequest) (*GetBaseModelPathResponse, error)
- func (UnimplementedModelsWorkerServiceServer) GetHFModelRepo(context.Context, *GetHFModelRepoRequest) (*HFModelRepo, error)
- func (UnimplementedModelsWorkerServiceServer) GetModel(context.Context, *GetModelRequest) (*Model, error)
- func (UnimplementedModelsWorkerServiceServer) GetModelAttributes(context.Context, *GetModelAttributesRequest) (*ModelAttributes, error)
- func (UnimplementedModelsWorkerServiceServer) GetModelPath(context.Context, *GetModelPathRequest) (*GetModelPathResponse, error)
- func (UnimplementedModelsWorkerServiceServer) GetStorageConfig(context.Context, *GetStorageConfigRequest) (*StorageConfig, error)
- func (UnimplementedModelsWorkerServiceServer) PublishModel(context.Context, *PublishModelRequest) (*PublishModelResponse, error)
- func (UnimplementedModelsWorkerServiceServer) RegisterModel(context.Context, *RegisterModelRequest) (*RegisterModelResponse, error)
- type UnsafeModelsServiceServer
- type UnsafeModelsWorkerServiceServer
Constants ¶
This section is empty.
Variables ¶
var ( ModelFormat_name = map[int32]string{ 0: "MODEL_FORMAT_UNSPECIFIED", 1: "MODEL_FORMAT_GGUF", 2: "MODEL_FORMAT_HUGGING_FACE", 3: "MODEL_FORMAT_NVIDIA_TRITON", } ModelFormat_value = map[string]int32{ "MODEL_FORMAT_UNSPECIFIED": 0, "MODEL_FORMAT_GGUF": 1, "MODEL_FORMAT_HUGGING_FACE": 2, "MODEL_FORMAT_NVIDIA_TRITON": 3, } )
Enum value maps for ModelFormat.
var ( AdapterType_name = map[int32]string{ 0: "ADAPTER_TYPE_UNSPECIFIED", 1: "ADAPTER_TYPE_LORA", 2: "ADAPTER_TYPE_QLORA", } AdapterType_value = map[string]int32{ "ADAPTER_TYPE_UNSPECIFIED": 0, "ADAPTER_TYPE_LORA": 1, "ADAPTER_TYPE_QLORA": 2, } )
Enum value maps for AdapterType.
var ( QuantizationType_name = map[int32]string{ 0: "QUANTIZATION_TYPE_UNSPECIFIED", 1: "QUANTIZATION_TYPE_GGUF", 2: "QUANTIZATION_TYPE_AWQ", } QuantizationType_value = map[string]int32{ "QUANTIZATION_TYPE_UNSPECIFIED": 0, "QUANTIZATION_TYPE_GGUF": 1, "QUANTIZATION_TYPE_AWQ": 2, } )
Enum value maps for QuantizationType.
var File_api_v1_model_manager_service_proto protoreflect.FileDescriptor
var ModelsService_ServiceDesc = grpc.ServiceDesc{ ServiceName: "llmariner.models.server.v1.ModelsService", HandlerType: (*ModelsServiceServer)(nil), Methods: []grpc.MethodDesc{ { MethodName: "ListModels", Handler: _ModelsService_ListModels_Handler, }, { MethodName: "GetModel", Handler: _ModelsService_GetModel_Handler, }, { MethodName: "DeleteModel", Handler: _ModelsService_DeleteModel_Handler, }, { MethodName: "ListBaseModels", Handler: _ModelsService_ListBaseModels_Handler, }, }, Streams: []grpc.StreamDesc{}, Metadata: "api/v1/model_manager_service.proto", }
ModelsService_ServiceDesc is the grpc.ServiceDesc for ModelsService service. It's only intended for direct use with grpc.RegisterService, and not to be introspected or modified (even as a copy).
var ModelsWorkerService_ServiceDesc = grpc.ServiceDesc{ ServiceName: "llmariner.models.server.v1.ModelsWorkerService", HandlerType: (*ModelsWorkerServiceServer)(nil), Methods: []grpc.MethodDesc{ { MethodName: "CreateStorageConfig", Handler: _ModelsWorkerService_CreateStorageConfig_Handler, }, { MethodName: "GetStorageConfig", Handler: _ModelsWorkerService_GetStorageConfig_Handler, }, { MethodName: "GetModel", Handler: _ModelsWorkerService_GetModel_Handler, }, { MethodName: "RegisterModel", Handler: _ModelsWorkerService_RegisterModel_Handler, }, { MethodName: "PublishModel", Handler: _ModelsWorkerService_PublishModel_Handler, }, { MethodName: "GetModelPath", Handler: _ModelsWorkerService_GetModelPath_Handler, }, { MethodName: "GetModelAttributes", Handler: _ModelsWorkerService_GetModelAttributes_Handler, }, { MethodName: "CreateBaseModel", Handler: _ModelsWorkerService_CreateBaseModel_Handler, }, { MethodName: "GetBaseModelPath", Handler: _ModelsWorkerService_GetBaseModelPath_Handler, }, { MethodName: "CreateHFModelRepo", Handler: _ModelsWorkerService_CreateHFModelRepo_Handler, }, { MethodName: "GetHFModelRepo", Handler: _ModelsWorkerService_GetHFModelRepo_Handler, }, }, Streams: []grpc.StreamDesc{}, Metadata: "api/v1/model_manager_service.proto", }
ModelsWorkerService_ServiceDesc is the grpc.ServiceDesc for ModelsWorkerService service. It's only intended for direct use with grpc.RegisterService, and not to be introspected or modified (even as a copy).
Functions ¶
func RegisterModelsServiceHandler ¶
func RegisterModelsServiceHandler(ctx context.Context, mux *runtime.ServeMux, conn *grpc.ClientConn) error
RegisterModelsServiceHandler registers the http handlers for service ModelsService to "mux". The handlers forward requests to the grpc endpoint over "conn".
func RegisterModelsServiceHandlerClient ¶
func RegisterModelsServiceHandlerClient(ctx context.Context, mux *runtime.ServeMux, client ModelsServiceClient) error
RegisterModelsServiceHandlerClient registers the http handlers for service ModelsService to "mux". The handlers forward requests to the grpc endpoint over the given implementation of "ModelsServiceClient". Note: the gRPC framework executes interceptors within the gRPC handler. If the passed in "ModelsServiceClient" doesn't go through the normal gRPC flow (creating a gRPC client etc.) then it will be up to the passed in "ModelsServiceClient" to call the correct interceptors.
func RegisterModelsServiceHandlerFromEndpoint ¶
func RegisterModelsServiceHandlerFromEndpoint(ctx context.Context, mux *runtime.ServeMux, endpoint string, opts []grpc.DialOption) (err error)
RegisterModelsServiceHandlerFromEndpoint is the same as RegisterModelsServiceHandler but automatically dials "endpoint" and closes the connection when "ctx" is done.
func RegisterModelsServiceHandlerServer ¶
func RegisterModelsServiceHandlerServer(ctx context.Context, mux *runtime.ServeMux, server ModelsServiceServer) error
RegisterModelsServiceHandlerServer registers the http handlers for service ModelsService to "mux". UnaryRPC: calls ModelsServiceServer directly. StreamingRPC: currently unsupported pending https://github.com/grpc/grpc-go/issues/906. Note that using this registration option will cause many gRPC library features to stop working. Consider using RegisterModelsServiceHandlerFromEndpoint instead.
func RegisterModelsServiceServer ¶
func RegisterModelsServiceServer(s grpc.ServiceRegistrar, srv ModelsServiceServer)
func RegisterModelsWorkerServiceServer ¶
func RegisterModelsWorkerServiceServer(s grpc.ServiceRegistrar, srv ModelsWorkerServiceServer)
Types ¶
type AdapterType ¶
type AdapterType int32
const ( AdapterType_ADAPTER_TYPE_UNSPECIFIED AdapterType = 0 AdapterType_ADAPTER_TYPE_LORA AdapterType = 1 AdapterType_ADAPTER_TYPE_QLORA AdapterType = 2 )
func (AdapterType) Descriptor ¶
func (AdapterType) Descriptor() protoreflect.EnumDescriptor
func (AdapterType) Enum ¶
func (x AdapterType) Enum() *AdapterType
func (AdapterType) EnumDescriptor
deprecated
func (AdapterType) EnumDescriptor() ([]byte, []int)
Deprecated: Use AdapterType.Descriptor instead.
func (AdapterType) Number ¶
func (x AdapterType) Number() protoreflect.EnumNumber
func (AdapterType) String ¶
func (x AdapterType) String() string
func (AdapterType) Type ¶
func (AdapterType) Type() protoreflect.EnumType
type BaseModel ¶
type BaseModel struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` Created int64 `protobuf:"varint,2,opt,name=created,proto3" json:"created,omitempty"` Object string `protobuf:"bytes,3,opt,name=object,proto3" json:"object,omitempty"` // contains filtered or unexported fields }
func (*BaseModel) Descriptor
deprecated
func (*BaseModel) GetCreated ¶
func (*BaseModel) ProtoMessage ¶
func (*BaseModel) ProtoMessage()
func (*BaseModel) ProtoReflect ¶
func (x *BaseModel) ProtoReflect() protoreflect.Message
type CreateBaseModelRequest ¶
type CreateBaseModelRequest struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` Path string `protobuf:"bytes,2,opt,name=path,proto3" json:"path,omitempty"` // formats is the supported formats of the base model. If not set, the format is considered as GGUF // for backward compatibility. Formats []ModelFormat `protobuf:"varint,4,rep,packed,name=formats,proto3,enum=llmariner.models.server.v1.ModelFormat" json:"formats,omitempty"` // gguf_model_path is the path of the GGUF model. Set if the model supports the GGUF format. GgufModelPath string `protobuf:"bytes,3,opt,name=gguf_model_path,json=ggufModelPath,proto3" json:"gguf_model_path,omitempty"` // contains filtered or unexported fields }
func (*CreateBaseModelRequest) Descriptor
deprecated
func (*CreateBaseModelRequest) Descriptor() ([]byte, []int)
Deprecated: Use CreateBaseModelRequest.ProtoReflect.Descriptor instead.
func (*CreateBaseModelRequest) GetFormats ¶
func (x *CreateBaseModelRequest) GetFormats() []ModelFormat
func (*CreateBaseModelRequest) GetGgufModelPath ¶
func (x *CreateBaseModelRequest) GetGgufModelPath() string
func (*CreateBaseModelRequest) GetId ¶
func (x *CreateBaseModelRequest) GetId() string
func (*CreateBaseModelRequest) GetPath ¶
func (x *CreateBaseModelRequest) GetPath() string
func (*CreateBaseModelRequest) ProtoMessage ¶
func (*CreateBaseModelRequest) ProtoMessage()
func (*CreateBaseModelRequest) ProtoReflect ¶
func (x *CreateBaseModelRequest) ProtoReflect() protoreflect.Message
func (*CreateBaseModelRequest) Reset ¶
func (x *CreateBaseModelRequest) Reset()
func (*CreateBaseModelRequest) String ¶
func (x *CreateBaseModelRequest) String() string
type CreateHFModelRepoRequest ¶ added in v1.4.0
type CreateHFModelRepoRequest struct { Name string `protobuf:"bytes,1,opt,name=name,proto3" json:"name,omitempty"` // contains filtered or unexported fields }
func (*CreateHFModelRepoRequest) Descriptor
deprecated
added in
v1.4.0
func (*CreateHFModelRepoRequest) Descriptor() ([]byte, []int)
Deprecated: Use CreateHFModelRepoRequest.ProtoReflect.Descriptor instead.
func (*CreateHFModelRepoRequest) GetName ¶ added in v1.4.0
func (x *CreateHFModelRepoRequest) GetName() string
func (*CreateHFModelRepoRequest) ProtoMessage ¶ added in v1.4.0
func (*CreateHFModelRepoRequest) ProtoMessage()
func (*CreateHFModelRepoRequest) ProtoReflect ¶ added in v1.4.0
func (x *CreateHFModelRepoRequest) ProtoReflect() protoreflect.Message
func (*CreateHFModelRepoRequest) Reset ¶ added in v1.4.0
func (x *CreateHFModelRepoRequest) Reset()
func (*CreateHFModelRepoRequest) String ¶ added in v1.4.0
func (x *CreateHFModelRepoRequest) String() string
type CreateStorageConfigRequest ¶
type CreateStorageConfigRequest struct { PathPrefix string `protobuf:"bytes,1,opt,name=path_prefix,json=pathPrefix,proto3" json:"path_prefix,omitempty"` // contains filtered or unexported fields }
func (*CreateStorageConfigRequest) Descriptor
deprecated
func (*CreateStorageConfigRequest) Descriptor() ([]byte, []int)
Deprecated: Use CreateStorageConfigRequest.ProtoReflect.Descriptor instead.
func (*CreateStorageConfigRequest) GetPathPrefix ¶
func (x *CreateStorageConfigRequest) GetPathPrefix() string
func (*CreateStorageConfigRequest) ProtoMessage ¶
func (*CreateStorageConfigRequest) ProtoMessage()
func (*CreateStorageConfigRequest) ProtoReflect ¶
func (x *CreateStorageConfigRequest) ProtoReflect() protoreflect.Message
func (*CreateStorageConfigRequest) Reset ¶
func (x *CreateStorageConfigRequest) Reset()
func (*CreateStorageConfigRequest) String ¶
func (x *CreateStorageConfigRequest) String() string
type DeleteModelRequest ¶
type DeleteModelRequest struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` // contains filtered or unexported fields }
func (*DeleteModelRequest) Descriptor
deprecated
func (*DeleteModelRequest) Descriptor() ([]byte, []int)
Deprecated: Use DeleteModelRequest.ProtoReflect.Descriptor instead.
func (*DeleteModelRequest) GetId ¶
func (x *DeleteModelRequest) GetId() string
func (*DeleteModelRequest) ProtoMessage ¶
func (*DeleteModelRequest) ProtoMessage()
func (*DeleteModelRequest) ProtoReflect ¶
func (x *DeleteModelRequest) ProtoReflect() protoreflect.Message
func (*DeleteModelRequest) Reset ¶
func (x *DeleteModelRequest) Reset()
func (*DeleteModelRequest) String ¶
func (x *DeleteModelRequest) String() string
type DeleteModelResponse ¶
type DeleteModelResponse struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` Object string `protobuf:"bytes,2,opt,name=object,proto3" json:"object,omitempty"` Deleted bool `protobuf:"varint,3,opt,name=deleted,proto3" json:"deleted,omitempty"` // contains filtered or unexported fields }
func (*DeleteModelResponse) Descriptor
deprecated
func (*DeleteModelResponse) Descriptor() ([]byte, []int)
Deprecated: Use DeleteModelResponse.ProtoReflect.Descriptor instead.
func (*DeleteModelResponse) GetDeleted ¶
func (x *DeleteModelResponse) GetDeleted() bool
func (*DeleteModelResponse) GetId ¶
func (x *DeleteModelResponse) GetId() string
func (*DeleteModelResponse) GetObject ¶
func (x *DeleteModelResponse) GetObject() string
func (*DeleteModelResponse) ProtoMessage ¶
func (*DeleteModelResponse) ProtoMessage()
func (*DeleteModelResponse) ProtoReflect ¶
func (x *DeleteModelResponse) ProtoReflect() protoreflect.Message
func (*DeleteModelResponse) Reset ¶
func (x *DeleteModelResponse) Reset()
func (*DeleteModelResponse) String ¶
func (x *DeleteModelResponse) String() string
type GetBaseModelPathRequest ¶
type GetBaseModelPathRequest struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` // contains filtered or unexported fields }
func (*GetBaseModelPathRequest) Descriptor
deprecated
func (*GetBaseModelPathRequest) Descriptor() ([]byte, []int)
Deprecated: Use GetBaseModelPathRequest.ProtoReflect.Descriptor instead.
func (*GetBaseModelPathRequest) GetId ¶
func (x *GetBaseModelPathRequest) GetId() string
func (*GetBaseModelPathRequest) ProtoMessage ¶
func (*GetBaseModelPathRequest) ProtoMessage()
func (*GetBaseModelPathRequest) ProtoReflect ¶
func (x *GetBaseModelPathRequest) ProtoReflect() protoreflect.Message
func (*GetBaseModelPathRequest) Reset ¶
func (x *GetBaseModelPathRequest) Reset()
func (*GetBaseModelPathRequest) String ¶
func (x *GetBaseModelPathRequest) String() string
type GetBaseModelPathResponse ¶
type GetBaseModelPathResponse struct { Formats []ModelFormat `protobuf:"varint,3,rep,packed,name=formats,proto3,enum=llmariner.models.server.v1.ModelFormat" json:"formats,omitempty"` Path string `protobuf:"bytes,1,opt,name=path,proto3" json:"path,omitempty"` // gguf_model_path is the path of the GGUF model. Set if the model supports the GGUF format. GgufModelPath string `protobuf:"bytes,2,opt,name=gguf_model_path,json=ggufModelPath,proto3" json:"gguf_model_path,omitempty"` // contains filtered or unexported fields }
func (*GetBaseModelPathResponse) Descriptor
deprecated
func (*GetBaseModelPathResponse) Descriptor() ([]byte, []int)
Deprecated: Use GetBaseModelPathResponse.ProtoReflect.Descriptor instead.
func (*GetBaseModelPathResponse) GetFormats ¶
func (x *GetBaseModelPathResponse) GetFormats() []ModelFormat
func (*GetBaseModelPathResponse) GetGgufModelPath ¶
func (x *GetBaseModelPathResponse) GetGgufModelPath() string
func (*GetBaseModelPathResponse) GetPath ¶
func (x *GetBaseModelPathResponse) GetPath() string
func (*GetBaseModelPathResponse) ProtoMessage ¶
func (*GetBaseModelPathResponse) ProtoMessage()
func (*GetBaseModelPathResponse) ProtoReflect ¶
func (x *GetBaseModelPathResponse) ProtoReflect() protoreflect.Message
func (*GetBaseModelPathResponse) Reset ¶
func (x *GetBaseModelPathResponse) Reset()
func (*GetBaseModelPathResponse) String ¶
func (x *GetBaseModelPathResponse) String() string
type GetHFModelRepoRequest ¶ added in v1.4.0
type GetHFModelRepoRequest struct { Name string `protobuf:"bytes,1,opt,name=name,proto3" json:"name,omitempty"` // contains filtered or unexported fields }
func (*GetHFModelRepoRequest) Descriptor
deprecated
added in
v1.4.0
func (*GetHFModelRepoRequest) Descriptor() ([]byte, []int)
Deprecated: Use GetHFModelRepoRequest.ProtoReflect.Descriptor instead.
func (*GetHFModelRepoRequest) GetName ¶ added in v1.4.0
func (x *GetHFModelRepoRequest) GetName() string
func (*GetHFModelRepoRequest) ProtoMessage ¶ added in v1.4.0
func (*GetHFModelRepoRequest) ProtoMessage()
func (*GetHFModelRepoRequest) ProtoReflect ¶ added in v1.4.0
func (x *GetHFModelRepoRequest) ProtoReflect() protoreflect.Message
func (*GetHFModelRepoRequest) Reset ¶ added in v1.4.0
func (x *GetHFModelRepoRequest) Reset()
func (*GetHFModelRepoRequest) String ¶ added in v1.4.0
func (x *GetHFModelRepoRequest) String() string
type GetModelAttributesRequest ¶
type GetModelAttributesRequest struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` // contains filtered or unexported fields }
func (*GetModelAttributesRequest) Descriptor
deprecated
func (*GetModelAttributesRequest) Descriptor() ([]byte, []int)
Deprecated: Use GetModelAttributesRequest.ProtoReflect.Descriptor instead.
func (*GetModelAttributesRequest) GetId ¶
func (x *GetModelAttributesRequest) GetId() string
func (*GetModelAttributesRequest) ProtoMessage ¶
func (*GetModelAttributesRequest) ProtoMessage()
func (*GetModelAttributesRequest) ProtoReflect ¶
func (x *GetModelAttributesRequest) ProtoReflect() protoreflect.Message
func (*GetModelAttributesRequest) Reset ¶
func (x *GetModelAttributesRequest) Reset()
func (*GetModelAttributesRequest) String ¶
func (x *GetModelAttributesRequest) String() string
type GetModelPathRequest ¶
type GetModelPathRequest struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` // contains filtered or unexported fields }
GetModelPathRequest is deprecated, use GetModelAttributesRequest instead.
func (*GetModelPathRequest) Descriptor
deprecated
func (*GetModelPathRequest) Descriptor() ([]byte, []int)
Deprecated: Use GetModelPathRequest.ProtoReflect.Descriptor instead.
func (*GetModelPathRequest) GetId ¶
func (x *GetModelPathRequest) GetId() string
func (*GetModelPathRequest) ProtoMessage ¶
func (*GetModelPathRequest) ProtoMessage()
func (*GetModelPathRequest) ProtoReflect ¶
func (x *GetModelPathRequest) ProtoReflect() protoreflect.Message
func (*GetModelPathRequest) Reset ¶
func (x *GetModelPathRequest) Reset()
func (*GetModelPathRequest) String ¶
func (x *GetModelPathRequest) String() string
type GetModelPathResponse ¶
type GetModelPathResponse struct { Path string `protobuf:"bytes,1,opt,name=path,proto3" json:"path,omitempty"` // contains filtered or unexported fields }
GetModelPathResponse is deprecated, use ModelAttributes (the response type of GetModelAttributes) instead.
func (*GetModelPathResponse) Descriptor
deprecated
func (*GetModelPathResponse) Descriptor() ([]byte, []int)
Deprecated: Use GetModelPathResponse.ProtoReflect.Descriptor instead.
func (*GetModelPathResponse) GetPath ¶
func (x *GetModelPathResponse) GetPath() string
func (*GetModelPathResponse) ProtoMessage ¶
func (*GetModelPathResponse) ProtoMessage()
func (*GetModelPathResponse) ProtoReflect ¶
func (x *GetModelPathResponse) ProtoReflect() protoreflect.Message
func (*GetModelPathResponse) Reset ¶
func (x *GetModelPathResponse) Reset()
func (*GetModelPathResponse) String ¶
func (x *GetModelPathResponse) String() string
type GetModelRequest ¶
type GetModelRequest struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` // contains filtered or unexported fields }
func (*GetModelRequest) Descriptor
deprecated
func (*GetModelRequest) Descriptor() ([]byte, []int)
Deprecated: Use GetModelRequest.ProtoReflect.Descriptor instead.
func (*GetModelRequest) GetId ¶
func (x *GetModelRequest) GetId() string
func (*GetModelRequest) ProtoMessage ¶
func (*GetModelRequest) ProtoMessage()
func (*GetModelRequest) ProtoReflect ¶
func (x *GetModelRequest) ProtoReflect() protoreflect.Message
func (*GetModelRequest) Reset ¶
func (x *GetModelRequest) Reset()
func (*GetModelRequest) String ¶
func (x *GetModelRequest) String() string
type GetStorageConfigRequest ¶
type GetStorageConfigRequest struct {
// contains filtered or unexported fields
}
func (*GetStorageConfigRequest) Descriptor
deprecated
func (*GetStorageConfigRequest) Descriptor() ([]byte, []int)
Deprecated: Use GetStorageConfigRequest.ProtoReflect.Descriptor instead.
func (*GetStorageConfigRequest) ProtoMessage ¶
func (*GetStorageConfigRequest) ProtoMessage()
func (*GetStorageConfigRequest) ProtoReflect ¶
func (x *GetStorageConfigRequest) ProtoReflect() protoreflect.Message
func (*GetStorageConfigRequest) Reset ¶
func (x *GetStorageConfigRequest) Reset()
func (*GetStorageConfigRequest) String ¶
func (x *GetStorageConfigRequest) String() string
type HFModelRepo ¶ added in v1.4.0
type HFModelRepo struct { Name string `protobuf:"bytes,1,opt,name=name,proto3" json:"name,omitempty"` // contains filtered or unexported fields }
func (*HFModelRepo) Descriptor
deprecated
added in
v1.4.0
func (*HFModelRepo) Descriptor() ([]byte, []int)
Deprecated: Use HFModelRepo.ProtoReflect.Descriptor instead.
func (*HFModelRepo) GetName ¶ added in v1.4.0
func (x *HFModelRepo) GetName() string
func (*HFModelRepo) ProtoMessage ¶ added in v1.4.0
func (*HFModelRepo) ProtoMessage()
func (*HFModelRepo) ProtoReflect ¶ added in v1.4.0
func (x *HFModelRepo) ProtoReflect() protoreflect.Message
func (*HFModelRepo) Reset ¶ added in v1.4.0
func (x *HFModelRepo) Reset()
func (*HFModelRepo) String ¶ added in v1.4.0
func (x *HFModelRepo) String() string
type ListBaseModelsRequest ¶
type ListBaseModelsRequest struct {
// contains filtered or unexported fields
}
func (*ListBaseModelsRequest) Descriptor
deprecated
func (*ListBaseModelsRequest) Descriptor() ([]byte, []int)
Deprecated: Use ListBaseModelsRequest.ProtoReflect.Descriptor instead.
func (*ListBaseModelsRequest) ProtoMessage ¶
func (*ListBaseModelsRequest) ProtoMessage()
func (*ListBaseModelsRequest) ProtoReflect ¶
func (x *ListBaseModelsRequest) ProtoReflect() protoreflect.Message
func (*ListBaseModelsRequest) Reset ¶
func (x *ListBaseModelsRequest) Reset()
func (*ListBaseModelsRequest) String ¶
func (x *ListBaseModelsRequest) String() string
type ListBaseModelsResponse ¶
type ListBaseModelsResponse struct { Object string `protobuf:"bytes,1,opt,name=object,proto3" json:"object,omitempty"` Data []*BaseModel `protobuf:"bytes,2,rep,name=data,proto3" json:"data,omitempty"` // contains filtered or unexported fields }
func (*ListBaseModelsResponse) Descriptor
deprecated
func (*ListBaseModelsResponse) Descriptor() ([]byte, []int)
Deprecated: Use ListBaseModelsResponse.ProtoReflect.Descriptor instead.
func (*ListBaseModelsResponse) GetData ¶
func (x *ListBaseModelsResponse) GetData() []*BaseModel
func (*ListBaseModelsResponse) GetObject ¶
func (x *ListBaseModelsResponse) GetObject() string
func (*ListBaseModelsResponse) ProtoMessage ¶
func (*ListBaseModelsResponse) ProtoMessage()
func (*ListBaseModelsResponse) ProtoReflect ¶
func (x *ListBaseModelsResponse) ProtoReflect() protoreflect.Message
func (*ListBaseModelsResponse) Reset ¶
func (x *ListBaseModelsResponse) Reset()
func (*ListBaseModelsResponse) String ¶
func (x *ListBaseModelsResponse) String() string
type ListModelsRequest ¶
type ListModelsRequest struct {
// contains filtered or unexported fields
}
func (*ListModelsRequest) Descriptor
deprecated
func (*ListModelsRequest) Descriptor() ([]byte, []int)
Deprecated: Use ListModelsRequest.ProtoReflect.Descriptor instead.
func (*ListModelsRequest) ProtoMessage ¶
func (*ListModelsRequest) ProtoMessage()
func (*ListModelsRequest) ProtoReflect ¶
func (x *ListModelsRequest) ProtoReflect() protoreflect.Message
func (*ListModelsRequest) Reset ¶
func (x *ListModelsRequest) Reset()
func (*ListModelsRequest) String ¶
func (x *ListModelsRequest) String() string
type ListModelsResponse ¶
type ListModelsResponse struct { Object string `protobuf:"bytes,1,opt,name=object,proto3" json:"object,omitempty"` Data []*Model `protobuf:"bytes,2,rep,name=data,proto3" json:"data,omitempty"` // contains filtered or unexported fields }
func (*ListModelsResponse) Descriptor
deprecated
func (*ListModelsResponse) Descriptor() ([]byte, []int)
Deprecated: Use ListModelsResponse.ProtoReflect.Descriptor instead.
func (*ListModelsResponse) GetData ¶
func (x *ListModelsResponse) GetData() []*Model
func (*ListModelsResponse) GetObject ¶
func (x *ListModelsResponse) GetObject() string
func (*ListModelsResponse) ProtoMessage ¶
func (*ListModelsResponse) ProtoMessage()
func (*ListModelsResponse) ProtoReflect ¶
func (x *ListModelsResponse) ProtoReflect() protoreflect.Message
func (*ListModelsResponse) Reset ¶
func (x *ListModelsResponse) Reset()
func (*ListModelsResponse) String ¶
func (x *ListModelsResponse) String() string
type Model ¶
type Model struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` Created int64 `protobuf:"varint,2,opt,name=created,proto3" json:"created,omitempty"` Object string `protobuf:"bytes,3,opt,name=object,proto3" json:"object,omitempty"` OwnedBy string `protobuf:"bytes,4,opt,name=owned_by,json=ownedBy,proto3" json:"owned_by,omitempty"` // contains filtered or unexported fields }
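func (*Model) Descriptor
deprecated
func (*Model) Descriptor() ([]byte, []int)
Deprecated: Use Model.ProtoReflect.Descriptor instead.
func (*Model) GetCreated ¶
func (x *Model) GetCreated() int64
func (*Model) GetId ¶
func (x *Model) GetId() string
func (*Model) GetObject ¶
func (x *Model) GetObject() string
func (*Model) GetOwnedBy ¶
func (x *Model) GetOwnedBy() string
func (*Model) ProtoMessage ¶
func (*Model) ProtoMessage()
func (*Model) ProtoReflect ¶
func (x *Model) ProtoReflect() protoreflect.Message
func (*Model) Reset ¶
func (x *Model) Reset()
func (*Model) String ¶
func (x *Model) String() string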
type ModelAttributes ¶
type ModelAttributes struct { Path string `protobuf:"bytes,1,opt,name=path,proto3" json:"path,omitempty"` BaseModel string `protobuf:"bytes,2,opt,name=base_model,json=baseModel,proto3" json:"base_model,omitempty"` Adapter AdapterType `protobuf:"varint,3,opt,name=adapter,proto3,enum=llmariner.models.server.v1.AdapterType" json:"adapter,omitempty"` Quantization QuantizationType `` /* 127-byte string literal not displayed */ // contains filtered or unexported fields }
func (*ModelAttributes) Descriptor
deprecated
func (*ModelAttributes) Descriptor() ([]byte, []int)
Deprecated: Use ModelAttributes.ProtoReflect.Descriptor instead.
func (*ModelAttributes) GetAdapter ¶
func (x *ModelAttributes) GetAdapter() AdapterType
func (*ModelAttributes) GetBaseModel ¶
func (x *ModelAttributes) GetBaseModel() string
func (*ModelAttributes) GetPath ¶
func (x *ModelAttributes) GetPath() string
func (*ModelAttributes) GetQuantization ¶
func (x *ModelAttributes) GetQuantization() QuantizationType
func (*ModelAttributes) ProtoMessage ¶
func (*ModelAttributes) ProtoMessage()
func (*ModelAttributes) ProtoReflect ¶
func (x *ModelAttributes) ProtoReflect() protoreflect.Message
func (*ModelAttributes) Reset ¶
func (x *ModelAttributes) Reset()
func (*ModelAttributes) String ¶
func (x *ModelAttributes) String() string
type ModelFormat ¶
type ModelFormat int32
const ( ModelFormat_MODEL_FORMAT_UNSPECIFIED ModelFormat = 0 ModelFormat_MODEL_FORMAT_GGUF ModelFormat = 1 ModelFormat_MODEL_FORMAT_HUGGING_FACE ModelFormat = 2 // Model format for Nvidia Triton Inference Server. These model files include the tokenizer configuration // of the original model, compiled model files for the TensorRT-LLM backend, and configuration files for // Triton Inference Server. ModelFormat_MODEL_FORMAT_NVIDIA_TRITON ModelFormat = 3 )
func (ModelFormat) Descriptor ¶
func (ModelFormat) Descriptor() protoreflect.EnumDescriptor
func (ModelFormat) Enum ¶
func (x ModelFormat) Enum() *ModelFormat
func (ModelFormat) EnumDescriptor
deprecated
func (ModelFormat) EnumDescriptor() ([]byte, []int)
Deprecated: Use ModelFormat.Descriptor instead.
func (ModelFormat) Number ¶
func (x ModelFormat) Number() protoreflect.EnumNumber
func (ModelFormat) String ¶
func (x ModelFormat) String() string
func (ModelFormat) Type ¶
func (ModelFormat) Type() protoreflect.EnumType
type ModelFormats ¶
type ModelFormats struct { Formats []ModelFormat `protobuf:"varint,1,rep,packed,name=formats,proto3,enum=llmariner.models.server.v1.ModelFormat" json:"formats,omitempty"` // contains filtered or unexported fields }
ModelFormats is a list of model formats. It is used to marshal the formats so that they can be persisted in a store.
func (*ModelFormats) Descriptor
deprecated
func (*ModelFormats) Descriptor() ([]byte, []int)
Deprecated: Use ModelFormats.ProtoReflect.Descriptor instead.
func (*ModelFormats) GetFormats ¶
func (x *ModelFormats) GetFormats() []ModelFormat
func (*ModelFormats) ProtoMessage ¶
func (*ModelFormats) ProtoMessage()
func (*ModelFormats) ProtoReflect ¶
func (x *ModelFormats) ProtoReflect() protoreflect.Message
func (*ModelFormats) Reset ¶
func (x *ModelFormats) Reset()
func (*ModelFormats) String ¶
func (x *ModelFormats) String() string
type ModelsServiceClient ¶
type ModelsServiceClient interface { ListModels(ctx context.Context, in *ListModelsRequest, opts ...grpc.CallOption) (*ListModelsResponse, error) GetModel(ctx context.Context, in *GetModelRequest, opts ...grpc.CallOption) (*Model, error) DeleteModel(ctx context.Context, in *DeleteModelRequest, opts ...grpc.CallOption) (*DeleteModelResponse, error) // The following API endpoints are not part of the OpenAPI API specification. ListBaseModels(ctx context.Context, in *ListBaseModelsRequest, opts ...grpc.CallOption) (*ListBaseModelsResponse, error) }
ModelsServiceClient is the client API for ModelsService service.
For semantics around ctx use and closing/ending streaming RPCs, please refer to https://pkg.go.dev/google.golang.org/grpc/?tab=doc#ClientConn.NewStream.
func NewModelsServiceClient ¶
func NewModelsServiceClient(cc grpc.ClientConnInterface) ModelsServiceClient
type ModelsServiceServer ¶
type ModelsServiceServer interface { ListModels(context.Context, *ListModelsRequest) (*ListModelsResponse, error) GetModel(context.Context, *GetModelRequest) (*Model, error) DeleteModel(context.Context, *DeleteModelRequest) (*DeleteModelResponse, error) // The following API endpoints are not part of the OpenAPI API specification. ListBaseModels(context.Context, *ListBaseModelsRequest) (*ListBaseModelsResponse, error) // contains filtered or unexported methods }
ModelsServiceServer is the server API for ModelsService service. All implementations must embed UnimplementedModelsServiceServer for forward compatibility.
type ModelsWorkerServiceClient ¶
type ModelsWorkerServiceClient interface { // CreateStorageConfig creates a new storage config. Used by model-manager-loader. CreateStorageConfig(ctx context.Context, in *CreateStorageConfigRequest, opts ...grpc.CallOption) (*StorageConfig, error) // GetStorageConfig gets a storage config. Used by model-manager-loader. GetStorageConfig(ctx context.Context, in *GetStorageConfigRequest, opts ...grpc.CallOption) (*StorageConfig, error) // GetModel gets a model. Used by inference-manager-engine. GetModel(ctx context.Context, in *GetModelRequest, opts ...grpc.CallOption) (*Model, error) // RegisterModel registers a new fine-tuned model. Used by job-manager-dispatcher and model-manager-loader. // The model is not published until PublishModel is called. RegisterModel(ctx context.Context, in *RegisterModelRequest, opts ...grpc.CallOption) (*RegisterModelResponse, error) // PublishModel publishes the fine-tuned model. Used by job-manager-dispatcher and model-manager-loader. PublishModel(ctx context.Context, in *PublishModelRequest, opts ...grpc.CallOption) (*PublishModelResponse, error) // GetModelPath returns the path of the model. Used by inference-manager-engine and model-manager-loader. GetModelPath(ctx context.Context, in *GetModelPathRequest, opts ...grpc.CallOption) (*GetModelPathResponse, error) // GetModelAttributes returns the attributes of the model. Used by inference-manager-engine. GetModelAttributes(ctx context.Context, in *GetModelAttributesRequest, opts ...grpc.CallOption) (*ModelAttributes, error) // CreateBaseModel creates a new base model. Used by model-manager-loader. CreateBaseModel(ctx context.Context, in *CreateBaseModelRequest, opts ...grpc.CallOption) (*BaseModel, error) // GetBaseModelPath returns the path of the base model. Used by job-manager-dispatcher, // inference-manager-engine, and model-manager-loader. 
GetBaseModelPath(ctx context.Context, in *GetBaseModelPathRequest, opts ...grpc.CallOption) (*GetBaseModelPathResponse, error) // CreateHFModelRepo creates a HuggingFace model repo. CreateHFModelRepo(ctx context.Context, in *CreateHFModelRepoRequest, opts ...grpc.CallOption) (*HFModelRepo, error) // GetHFModelRepo returns the HuggingFace model repo that has been downloaded. Used by model-manager-loader. GetHFModelRepo(ctx context.Context, in *GetHFModelRepoRequest, opts ...grpc.CallOption) (*HFModelRepo, error) }
ModelsWorkerServiceClient is the client API for ModelsWorkerService service.
For semantics around ctx use and closing/ending streaming RPCs, please refer to https://pkg.go.dev/google.golang.org/grpc/?tab=doc#ClientConn.NewStream.
func NewModelsWorkerServiceClient ¶
func NewModelsWorkerServiceClient(cc grpc.ClientConnInterface) ModelsWorkerServiceClient
type ModelsWorkerServiceServer ¶
type ModelsWorkerServiceServer interface { // CreateStorageConfig creates a new storage config. Used by model-manager-loader. CreateStorageConfig(context.Context, *CreateStorageConfigRequest) (*StorageConfig, error) // GetStorageConfig gets a storage config. Used by model-manager-loader. GetStorageConfig(context.Context, *GetStorageConfigRequest) (*StorageConfig, error) // GetModel gets a model. Used by inference-manager-engine. GetModel(context.Context, *GetModelRequest) (*Model, error) // RegisterModel registers a new fine-tuned model. Used by job-manager-dispatcher and model-manager-loader. // The model is not published until PublishModel is called. RegisterModel(context.Context, *RegisterModelRequest) (*RegisterModelResponse, error) // PublishModel publishes the fine-tuned model. Used by job-manager-dispatcher and model-manager-loader. PublishModel(context.Context, *PublishModelRequest) (*PublishModelResponse, error) // GetModelPath returns the path of the model. Used by inference-manager-engine and model-manager-loader. GetModelPath(context.Context, *GetModelPathRequest) (*GetModelPathResponse, error) // GetModelAttributes returns the attributes of the model. Used by inference-manager-engine. GetModelAttributes(context.Context, *GetModelAttributesRequest) (*ModelAttributes, error) // CreateBaseModel creates a new base model. Used by model-manager-loader. CreateBaseModel(context.Context, *CreateBaseModelRequest) (*BaseModel, error) // GetBaseModelPath returns the path of the base model. Used by job-manager-dispatcher, // inference-manager-engine, and model-manager-loader. GetBaseModelPath(context.Context, *GetBaseModelPathRequest) (*GetBaseModelPathResponse, error) // CreateHFModelRepo creates a HuggingFace model repo. CreateHFModelRepo(context.Context, *CreateHFModelRepoRequest) (*HFModelRepo, error) // GetHFModelRepo returns the HuggingFace model repo that has been downloaded. Used by model-manager-loader. 
GetHFModelRepo(context.Context, *GetHFModelRepoRequest) (*HFModelRepo, error) // contains filtered or unexported methods }
ModelsWorkerServiceServer is the server API for ModelsWorkerService service. All implementations must embed UnimplementedModelsWorkerServiceServer for forward compatibility.
type PublishModelRequest ¶
type PublishModelRequest struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` // contains filtered or unexported fields }
func (*PublishModelRequest) Descriptor
deprecated
func (*PublishModelRequest) Descriptor() ([]byte, []int)
Deprecated: Use PublishModelRequest.ProtoReflect.Descriptor instead.
func (*PublishModelRequest) GetId ¶
func (x *PublishModelRequest) GetId() string
func (*PublishModelRequest) ProtoMessage ¶
func (*PublishModelRequest) ProtoMessage()
func (*PublishModelRequest) ProtoReflect ¶
func (x *PublishModelRequest) ProtoReflect() protoreflect.Message
func (*PublishModelRequest) Reset ¶
func (x *PublishModelRequest) Reset()
func (*PublishModelRequest) String ¶
func (x *PublishModelRequest) String() string
type PublishModelResponse ¶
type PublishModelResponse struct {
// contains filtered or unexported fields
}
func (*PublishModelResponse) Descriptor
deprecated
func (*PublishModelResponse) Descriptor() ([]byte, []int)
Deprecated: Use PublishModelResponse.ProtoReflect.Descriptor instead.
func (*PublishModelResponse) ProtoMessage ¶
func (*PublishModelResponse) ProtoMessage()
func (*PublishModelResponse) ProtoReflect ¶
func (x *PublishModelResponse) ProtoReflect() protoreflect.Message
func (*PublishModelResponse) Reset ¶
func (x *PublishModelResponse) Reset()
func (*PublishModelResponse) String ¶
func (x *PublishModelResponse) String() string
type QuantizationType ¶
type QuantizationType int32
const ( QuantizationType_QUANTIZATION_TYPE_UNSPECIFIED QuantizationType = 0 QuantizationType_QUANTIZATION_TYPE_GGUF QuantizationType = 1 QuantizationType_QUANTIZATION_TYPE_AWQ QuantizationType = 2 )
func (QuantizationType) Descriptor ¶
func (QuantizationType) Descriptor() protoreflect.EnumDescriptor
func (QuantizationType) Enum ¶
func (x QuantizationType) Enum() *QuantizationType
func (QuantizationType) EnumDescriptor
deprecated
func (QuantizationType) EnumDescriptor() ([]byte, []int)
Deprecated: Use QuantizationType.Descriptor instead.
func (QuantizationType) Number ¶
func (x QuantizationType) Number() protoreflect.EnumNumber
func (QuantizationType) String ¶
func (x QuantizationType) String() string
func (QuantizationType) Type ¶
func (QuantizationType) Type() protoreflect.EnumType
type RegisterModelRequest ¶
type RegisterModelRequest struct { // id is the model name. Id string `protobuf:"bytes,7,opt,name=id,proto3" json:"id,omitempty"` BaseModel string `protobuf:"bytes,1,opt,name=base_model,json=baseModel,proto3" json:"base_model,omitempty"` // suffix is deprecated, use adapter and quantization instead. Suffix string `protobuf:"bytes,2,opt,name=suffix,proto3" json:"suffix,omitempty"` OrganizationId string `protobuf:"bytes,3,opt,name=organization_id,json=organizationId,proto3" json:"organization_id,omitempty"` ProjectId string `protobuf:"bytes,4,opt,name=project_id,json=projectId,proto3" json:"project_id,omitempty"` Adapter AdapterType `protobuf:"varint,5,opt,name=adapter,proto3,enum=llmariner.models.server.v1.AdapterType" json:"adapter,omitempty"` Quantization QuantizationType `` /* 127-byte string literal not displayed */ Path string `protobuf:"bytes,8,opt,name=path,proto3" json:"path,omitempty"` // contains filtered or unexported fields }
func (*RegisterModelRequest) Descriptor
deprecated
func (*RegisterModelRequest) Descriptor() ([]byte, []int)
Deprecated: Use RegisterModelRequest.ProtoReflect.Descriptor instead.
func (*RegisterModelRequest) GetAdapter ¶
func (x *RegisterModelRequest) GetAdapter() AdapterType
func (*RegisterModelRequest) GetBaseModel ¶
func (x *RegisterModelRequest) GetBaseModel() string
func (*RegisterModelRequest) GetId ¶ added in v0.119.0
func (x *RegisterModelRequest) GetId() string
func (*RegisterModelRequest) GetOrganizationId ¶
func (x *RegisterModelRequest) GetOrganizationId() string
func (*RegisterModelRequest) GetPath ¶ added in v0.119.0
func (x *RegisterModelRequest) GetPath() string
func (*RegisterModelRequest) GetProjectId ¶
func (x *RegisterModelRequest) GetProjectId() string
func (*RegisterModelRequest) GetQuantization ¶
func (x *RegisterModelRequest) GetQuantization() QuantizationType
func (*RegisterModelRequest) GetSuffix ¶
func (x *RegisterModelRequest) GetSuffix() string
func (*RegisterModelRequest) ProtoMessage ¶
func (*RegisterModelRequest) ProtoMessage()
func (*RegisterModelRequest) ProtoReflect ¶
func (x *RegisterModelRequest) ProtoReflect() protoreflect.Message
func (*RegisterModelRequest) Reset ¶
func (x *RegisterModelRequest) Reset()
func (*RegisterModelRequest) String ¶
func (x *RegisterModelRequest) String() string
type RegisterModelResponse ¶
type RegisterModelResponse struct { Id string `protobuf:"bytes,1,opt,name=id,proto3" json:"id,omitempty"` // path is the path where the model is stored. Path string `protobuf:"bytes,2,opt,name=path,proto3" json:"path,omitempty"` // contains filtered or unexported fields }
func (*RegisterModelResponse) Descriptor
deprecated
func (*RegisterModelResponse) Descriptor() ([]byte, []int)
Deprecated: Use RegisterModelResponse.ProtoReflect.Descriptor instead.
func (*RegisterModelResponse) GetId ¶
func (x *RegisterModelResponse) GetId() string
func (*RegisterModelResponse) GetPath ¶
func (x *RegisterModelResponse) GetPath() string
func (*RegisterModelResponse) ProtoMessage ¶
func (*RegisterModelResponse) ProtoMessage()
func (*RegisterModelResponse) ProtoReflect ¶
func (x *RegisterModelResponse) ProtoReflect() protoreflect.Message
func (*RegisterModelResponse) Reset ¶
func (x *RegisterModelResponse) Reset()
func (*RegisterModelResponse) String ¶
func (x *RegisterModelResponse) String() string
type StorageConfig ¶
type StorageConfig struct { PathPrefix string `protobuf:"bytes,1,opt,name=path_prefix,json=pathPrefix,proto3" json:"path_prefix,omitempty"` // contains filtered or unexported fields }
func (*StorageConfig) Descriptor
deprecated
func (*StorageConfig) Descriptor() ([]byte, []int)
Deprecated: Use StorageConfig.ProtoReflect.Descriptor instead.
func (*StorageConfig) GetPathPrefix ¶
func (x *StorageConfig) GetPathPrefix() string
func (*StorageConfig) ProtoMessage ¶
func (*StorageConfig) ProtoMessage()
func (*StorageConfig) ProtoReflect ¶
func (x *StorageConfig) ProtoReflect() protoreflect.Message
func (*StorageConfig) Reset ¶
func (x *StorageConfig) Reset()
func (*StorageConfig) String ¶
func (x *StorageConfig) String() string
type UnimplementedModelsServiceServer ¶
type UnimplementedModelsServiceServer struct { }
UnimplementedModelsServiceServer must be embedded to have forward compatible implementations.
func (UnimplementedModelsServiceServer) DeleteModel ¶
func (UnimplementedModelsServiceServer) DeleteModel(context.Context, *DeleteModelRequest) (*DeleteModelResponse, error)
func (UnimplementedModelsServiceServer) GetModel ¶
func (UnimplementedModelsServiceServer) GetModel(context.Context, *GetModelRequest) (*Model, error)
func (UnimplementedModelsServiceServer) ListBaseModels ¶
func (UnimplementedModelsServiceServer) ListBaseModels(context.Context, *ListBaseModelsRequest) (*ListBaseModelsResponse, error)
func (UnimplementedModelsServiceServer) ListModels ¶
func (UnimplementedModelsServiceServer) ListModels(context.Context, *ListModelsRequest) (*ListModelsResponse, error)
type UnimplementedModelsWorkerServiceServer ¶
type UnimplementedModelsWorkerServiceServer struct { }
UnimplementedModelsWorkerServiceServer must be embedded to have forward compatible implementations.
func (UnimplementedModelsWorkerServiceServer) CreateBaseModel ¶
func (UnimplementedModelsWorkerServiceServer) CreateBaseModel(context.Context, *CreateBaseModelRequest) (*BaseModel, error)
func (UnimplementedModelsWorkerServiceServer) CreateHFModelRepo ¶ added in v1.4.0
func (UnimplementedModelsWorkerServiceServer) CreateHFModelRepo(context.Context, *CreateHFModelRepoRequest) (*HFModelRepo, error)
func (UnimplementedModelsWorkerServiceServer) CreateStorageConfig ¶
func (UnimplementedModelsWorkerServiceServer) CreateStorageConfig(context.Context, *CreateStorageConfigRequest) (*StorageConfig, error)
func (UnimplementedModelsWorkerServiceServer) GetBaseModelPath ¶
func (UnimplementedModelsWorkerServiceServer) GetBaseModelPath(context.Context, *GetBaseModelPathRequest) (*GetBaseModelPathResponse, error)
func (UnimplementedModelsWorkerServiceServer) GetHFModelRepo ¶ added in v1.4.0
func (UnimplementedModelsWorkerServiceServer) GetHFModelRepo(context.Context, *GetHFModelRepoRequest) (*HFModelRepo, error)
func (UnimplementedModelsWorkerServiceServer) GetModel ¶
func (UnimplementedModelsWorkerServiceServer) GetModel(context.Context, *GetModelRequest) (*Model, error)
func (UnimplementedModelsWorkerServiceServer) GetModelAttributes ¶
func (UnimplementedModelsWorkerServiceServer) GetModelAttributes(context.Context, *GetModelAttributesRequest) (*ModelAttributes, error)
func (UnimplementedModelsWorkerServiceServer) GetModelPath ¶
func (UnimplementedModelsWorkerServiceServer) GetModelPath(context.Context, *GetModelPathRequest) (*GetModelPathResponse, error)
func (UnimplementedModelsWorkerServiceServer) GetStorageConfig ¶
func (UnimplementedModelsWorkerServiceServer) GetStorageConfig(context.Context, *GetStorageConfigRequest) (*StorageConfig, error)
func (UnimplementedModelsWorkerServiceServer) PublishModel ¶
func (UnimplementedModelsWorkerServiceServer) PublishModel(context.Context, *PublishModelRequest) (*PublishModelResponse, error)
func (UnimplementedModelsWorkerServiceServer) RegisterModel ¶
func (UnimplementedModelsWorkerServiceServer) RegisterModel(context.Context, *RegisterModelRequest) (*RegisterModelResponse, error)
type UnsafeModelsServiceServer ¶
type UnsafeModelsServiceServer interface {
// contains filtered or unexported methods
}
UnsafeModelsServiceServer may be embedded to opt out of forward compatibility for this service. Use of this interface is not recommended, because any method later added to ModelsServiceServer will result in compilation errors.
type UnsafeModelsWorkerServiceServer ¶
type UnsafeModelsWorkerServiceServer interface {
// contains filtered or unexported methods
}
UnsafeModelsWorkerServiceServer may be embedded to opt out of forward compatibility for this service. Use of this interface is not recommended, because any method later added to ModelsWorkerServiceServer will result in compilation errors.