vllmclient

package
v0.11.0 Latest Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Nov 27, 2024 License: Apache-2.0 Imports: 7 Imported by: 0

Documentation

Index

Constants

This section is empty.

Variables

This section is empty.

Functions

This section is empty.

Types

type Client

// Client is the receiver type for the LoadLoraAdapter and UnloadLoraAdapter
// methods listed on this page.
type Client struct {
	// HTTPClient is the standard-library HTTP client held by this Client.
	// NOTE(review): presumably used to send the load/unload requests to the
	// model server; behavior when it is nil is not visible here — confirm.
	HTTPClient *http.Client
}

func (*Client) LoadLoraAdapter

func (c *Client) LoadLoraAdapter(ctx context.Context, addr string, req LoadAdapterRequest) error

Load a LoRA adapter into the vLLM model server. See: https://docs.vllm.ai/en/latest/models/lora.html#dynamically-serving-lora-adapters

func (*Client) UnloadLoraAdapter

func (c *Client) UnloadLoraAdapter(ctx context.Context, addr string, req UnloadAdapterRequest) error

Unload a LoRA adapter from the vLLM model server. See: https://docs.vllm.ai/en/latest/models/lora.html#dynamically-serving-lora-adapters

type LoadAdapterRequest

// LoadAdapterRequest is the request argument accepted by
// (*Client).LoadLoraAdapter.
type LoadAdapterRequest struct {
	// LoraName is encoded under the JSON key "lora_name".
	LoraName string `json:"lora_name"`
	// LoraPath is encoded under the JSON key "lora_path".
	LoraPath string `json:"lora_path"`

	// Options carries the `json:"-"` tag, so encoding/json leaves it out of
	// the encoded request.
	// NOTE(review): presumably client-side behavior switches only — confirm.
	Options LoadAdapterRequestOptions `json:"-"`
}

type LoadAdapterRequestOptions

// LoadAdapterRequestOptions is the type of LoadAdapterRequest.Options.
type LoadAdapterRequestOptions struct {
	// NOTE(review): going by the name, presumably makes loading an adapter
	// that is already loaded not count as an error — confirm against the
	// LoadLoraAdapter implementation.
	IgnoreAlreadyLoaded bool
}

type UnloadAdapterRequest

// UnloadAdapterRequest is the request argument accepted by
// (*Client).UnloadLoraAdapter.
type UnloadAdapterRequest struct {
	// LoraName is encoded under the JSON key "lora_name".
	LoraName string `json:"lora_name"`

	// Options carries the `json:"-"` tag, so encoding/json leaves it out of
	// the encoded request.
	// NOTE(review): presumably client-side behavior switches only — confirm.
	Options UnloadAdapterRequestOptions `json:"-"`
}

type UnloadAdapterRequestOptions

// UnloadAdapterRequestOptions is the type of UnloadAdapterRequest.Options.
type UnloadAdapterRequestOptions struct {
	// NOTE(review): going by the name, presumably makes unloading an adapter
	// that the server does not know not count as an error — confirm against
	// the UnloadLoraAdapter implementation.
	IgnoreNotFound bool
}

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL