Documentation
¶
Index ¶
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
Types ¶
type ErrReprocessInputs ¶
type ErrReprocessInputs struct {
Inputs []input
}
func (*ErrReprocessInputs) Error ¶
func (e *ErrReprocessInputs) Error() string
type ImageContext ¶
type ImageContext struct {
// contains filtered or unexported fields
}
func NewImageContext ¶
func NewImageContext(llamaContext *llama.Context, modelPath string) (*ImageContext, error)
func (*ImageContext) BatchSize ¶
func (c *ImageContext) BatchSize(configuredBatchSize int) int
func (*ImageContext) Free ¶
func (c *ImageContext) Free(modelPath string)
func (*ImageContext) MultimodalTokenize ¶
type InputCache ¶
type InputCache struct {
// contains filtered or unexported fields
}
func NewInputCache ¶
func (*InputCache) LoadCacheSlot ¶
func (c *InputCache) LoadCacheSlot(prompt []input, cachePrompt bool) (*InputCacheSlot, []input, error)
func (*InputCache) ShiftCacheSlot ¶
func (c *InputCache) ShiftCacheSlot(slot *InputCacheSlot, numKeep int) error
ShiftCacheSlot frees up space in the KV cache by deleting the oldest half of the history and shifting the newest half into that space, while preserving the first numKeep inputs at the beginning.
It assumes that at least one entry can be freed up by shifting (i.e. numKeep < numCtx).
func (*InputCache) ShiftDiscard ¶
func (c *InputCache) ShiftDiscard(inputLen int, numKeep int) int
type InputCacheSlot ¶
type NewSequenceParams ¶
type NewSequenceParams struct {
// contains filtered or unexported fields
}
Click to show internal directories.
Click to hide internal directories.