num parallel embed
This commit is contained in:
parent
ec4c35fe99
commit
2647a0e443
@@ -132,6 +132,8 @@ func (s *Scheduler) processPending(ctx context.Context) {
|
|||||||
if len(pending.model.ProjectorPaths) > 0 && numParallel != 1 {
|
if len(pending.model.ProjectorPaths) > 0 && numParallel != 1 {
|
||||||
numParallel = 1
|
numParallel = 1
|
||||||
slog.Warn("multimodal models don't support parallel requests yet")
|
slog.Warn("multimodal models don't support parallel requests yet")
|
||||||
|
} else if strings.Contains(pending.model.Config.ModelFamily, "bert") {
|
||||||
|
numParallel = runtime.NumCPU()
|
||||||
}
|
}
|
||||||
|
|
||||||
for {
|
for {
|
||||||
|
Loading…
x
Reference in New Issue
Block a user