Compare commits
merge into: jeans:main
jeans:main
jeans:tool-parsing
jeans:jessegross/post_predict
jeans:jessegross/vision_graph
jeans:jmorganca/qwen25vl
jeans:drifkin/thinking-api-support
jeans:jessegross/worst-multimodal
jeans:drifkin/array-head-count-simple
jeans:brucemacd/model-forward-test-ext
jeans:parth/python-function-parsing
jeans:mxyng/qwen3
jeans:mxyng/multiple-eos-tokens
jeans:jmorganca/cuda-compression-none
jeans:drifkin/num-parallel
jeans:drifkin/chat-truncation-fix
jeans:jmorganca/sync
jeans:mxyng/parallel-write-blobs
jeans:parth/python-tools-calling
jeans:drifkin/array-head-count
jeans:brucemacd/create-no-loop
jeans:parth/server-enable-content-stream-with-tools
jeans:qwen25omni
jeans:mxyng/v3
jeans:brucemacd/ropeconfig
jeans:jmorganca/silence-tokenizer
jeans:parth/sample-so-test
jeans:parth/sampling-structured-outputs
jeans:brucemacd/doc-go-engine
jeans:parth/constrained-sampling-json
jeans:jmorganca/mistral-wip
jeans:brucemacd/mistral-small-convert
jeans:parth/sample-unmarshal-json-for-params
jeans:brucemacd/runner-completion
jeans:brucemacd/jomorganca/mistral
jeans:pdevine/bfloat16
jeans:jmorganca/mistral
jeans:brucemacd/mistral
jeans:pdevine/logging
jeans:parth/sample-correctness-fix
jeans:parth/sample-fix-sorting
jeans:jmorgan/sample-fix-sorting-extras
jeans:jmorganca/temp-0-images
jeans:brucemacd/parallel-embed-models
jeans:brucemacd/shim-grammar
jeans:jmorganca/fix-gguf-error
jeans:bmizerany/nameswork
jeans:jmorganca/faster-releases
jeans:bmizerany/validatenames
jeans:brucemacd/err-no-vocab
jeans:brucemacd/rope-config
jeans:brucemacd/err-hint
jeans:brucemacd/qwen2_5
jeans:brucemacd/logprobs
jeans:brucemacd/new_runner_graph_bench
jeans:progress-flicker
jeans:brucemacd/forward-test
jeans:brucemacd/go_qwen2
jeans:pdevine/gemma2
jeans:jmorganca/add-missing-symlink-eval
jeans:mxyng/next-bert
jeans:mxyng/next-debug
jeans:parth/set-context-size-openai
jeans:brucemacd/next-bpe-bench
jeans:brucemacd/next-bpe-test
jeans:brucemacd/new_runner_e2e
jeans:brucemacd/new_runner_qwen2
jeans:pdevine/convert-cohere2
jeans:brucemacd/convert-cli
jeans:parth/log-probs
jeans:mxyng/next-mlx
jeans:mxyng/cmd-history
jeans:parth/templating
jeans:parth/tokenize-detokenize
jeans:brucemacd/check-key-register
jeans:bmizerany/grammar
jeans:jmorganca/vendor-081b29bd
jeans:mxyng/func-checks
jeans:jmorganca/fix-null-format
jeans:parth/fix-default-to-warn-json
jeans:jmorganca/qwen2vl
jeans:jmorganca/no-concat
jeans:parth/cmd-cleanup-SO
jeans:brucemacd/check-key-register-structured-err
jeans:parth/openai-stream-usage
jeans:parth/fix-referencing-so
jeans:stream-tools-stop
jeans:jmorganca/degin-1
jeans:brucemacd/install-path-clean
jeans:brucemacd/push-name-validation
jeans:brucemacd/browser-key-register
jeans:jmorganca/openai-fix-first-message
jeans:jmorganca/fix-proxy
jeans:jessegross/sample
jeans:parth/disallow-streaming-tools
jeans:dhiltgen/remove_submodule
jeans:jmorganca/ga
jeans:jmorganca/mllama
jeans:pdevine/newlines
jeans:mxyng/environ-2
jeans:pdevine/geems-2b
jeans:jmorganca/llama-bump
jeans:mxyng/modelname-7
jeans:mxyng/gin-slog
jeans:mxyng/modelname-6
jeans:jyan/convert-prog
jeans:jyan/quant5
jeans:paligemma-support
jeans:pdevine/import-docs
jeans:jmorganca/openai-context
jeans:jyan/paligemma
jeans:jyan/p2
jeans:jyan/palitest
jeans:bmizerany/embedspeedup
jeans:jmorganca/llama-vit
jeans:brucemacd/allow-ollama
jeans:royh/ep-methods
jeans:royh/whisper
jeans:mxyng/api-models
jeans:mxyng/fix-memory
jeans:jyan/q4_4/8
jeans:jyan/ollama-v
jeans:royh/stream-tools
jeans:roy-embed-parallel
jeans:bmizerany/hrm
jeans:revert-5963-revert-5924-mxyng/llama3.1-rope
jeans:royh/embed-viz
jeans:jyan/local2
jeans:jyan/auth
jeans:jyan/local
jeans:jyan/parse-temp
jeans:jmorganca/template-mistral
jeans:jyan/reord-g
jeans:royh-openai-suffixdocs
jeans:royh-imgembed
jeans:royh-embed-parallel
jeans:jyan/quant4
jeans:royh-precision
jeans:jyan/progress
jeans:pdevine/fix-template
jeans:jyan/quant3
jeans:pdevine/ggla
jeans:mxyng/update-registry-domain
jeans:jmorganca/ggml-static
jeans:mxyng/create-context
jeans:jyan/v0.146
jeans:mxyng/layers-from-files
jeans:build_dist
jeans:bmizerany/noseek
jeans:royh-ls
jeans:royh-name
jeans:timeout
jeans:mxyng/server-timestamp
jeans:bmizerany/nosillyggufslurps
jeans:royh-params
jeans:jmorganca/llama-cpp-7c26775
jeans:royh-openai-delete
jeans:royh-show-rigid
jeans:jmorganca/enable-fa
jeans:jmorganca/no-error-template
jeans:jyan/format
jeans:royh-testdelete
jeans:bmizerany/fastverify
jeans:language_support
jeans:pdevine/ps-glitches
jeans:brucemacd/tokenize
jeans:bruce/iq-quants
jeans:bmizerany/filepathwithcoloninhost
jeans:mxyng/split-bin
jeans:bmizerany/client-registry
jeans:jmorganca/if-none-match
jeans:native
jeans:jmorganca/native
jeans:jmorganca/batch-embeddings
jeans:jmorganca/initcmake
jeans:jmorganca/mm
jeans:pdevine/showggmlinfo
jeans:modenameenforcealphanum
jeans:bmizerany/modenameenforcealphanum
jeans:jmorganca/done-reason
jeans:jmorganca/llama-cpp-8960fe8
jeans:ollama.com
jeans:bmizerany/filepathnobuild
jeans:bmizerany/types/model/defaultfix
jeans:rmdisplaylong
jeans:nogogen
jeans:bmizerany/x
jeans:modelfile-readme
jeans:bmizerany/replacecolon
jeans:jmorganca/limit
jeans:jmorganca/execstack
jeans:jmorganca/replace-assets
jeans:mxyng/tune-concurrency
jeans:jmorganca/testing
jeans:whitespace-detection
jeans:jmorganca/options
jeans:upgrade-all
jeans:scratch
jeans:cuda-search
jeans:mattw/airenamer
jeans:mattw/allmodelsonhuggingface
jeans:mattw/quantcontext
jeans:mattw/whatneedstorun
jeans:brucemacd/llama-mem-calc
jeans:mattw/faq-context
jeans:mattw/communitylinks
jeans:mattw/noprune
jeans:mattw/python-functioncalling
jeans:rename
jeans:mxyng/install
jeans:pulse
jeans:remove-first
jeans:editor
jeans:mattw/selfqueryingretrieval
jeans:cgo
jeans:mattw/howtoquant
jeans:api
jeans:matt/streamingapi
jeans:format-config
jeans:mxyng/extra-args
jeans:shell
jeans:update-nous-hermes
jeans:cp-model
jeans:upload-progress
jeans:fix-unknown-model
jeans:fix-model-names
jeans:delete-fix
jeans:insecure-registry
jeans:ls
jeans:deletemodels
jeans:progressbar
jeans:readme-updates
jeans:license-layers
jeans:skip-list
jeans:list-models
jeans:modelpath
jeans:matt/examplemodelfiles
jeans:distribution
jeans:go-opts
jeans:v0.7.0-rc1
jeans:v0.7.0-rc0
jeans:v0.6.8-rc0
jeans:v0.6.8
jeans:v0.6.7
jeans:v0.6.7-rc2
jeans:v0.6.7-rc1
jeans:v0.6.7-rc0
jeans:v0.6.6
jeans:v0.6.6-rc2
jeans:v0.6.6-rc1
jeans:v0.6.6-rc0
jeans:v0.6.5-rc1
jeans:v0.6.5
jeans:v0.6.5-rc0
jeans:v0.6.4-rc0
jeans:v0.6.4
jeans:v0.6.3-rc1
jeans:v0.6.3
jeans:v0.6.3-rc0
jeans:v0.6.2-rc0
jeans:v0.6.2
jeans:v0.6.1
jeans:v0.6.1-rc0
jeans:v0.6.0-rc0
jeans:v0.6.0
jeans:v0.5.13
jeans:v0.5.13-rc6
jeans:v0.5.13-rc5
jeans:v0.5.13-rc4
jeans:v0.5.13-rc3
jeans:v0.5.13-rc2
jeans:v0.5.13-rc1
jeans:v0.5.13-rc0
jeans:v0.5.12
jeans:v0.5.12-rc1
jeans:v0.5.12-rc0
jeans:v0.5.11
jeans:v0.5.10
jeans:v0.5.9
jeans:v0.5.9-rc0
jeans:v0.5.8-rc13
jeans:v0.5.8
jeans:v0.5.8-rc12
jeans:v0.5.8-rc11
jeans:v0.5.8-rc10
jeans:v0.5.8-rc9
jeans:v0.5.8-rc8
jeans:v0.5.8-rc7
jeans:v0.5.8-rc6
jeans:v0.5.8-rc5
jeans:v0.5.8-rc4
jeans:v0.5.8-rc3
jeans:v0.5.8-rc2
jeans:v0.5.8-rc1
jeans:v0.5.8-rc0
jeans:v0.5.7
jeans:v0.5.6
jeans:v0.5.5
jeans:v0.5.5-rc0
jeans:v0.5.4
jeans:v0.5.3
jeans:v0.5.3-rc0
jeans:v0.5.2
jeans:v0.5.2-rc3
jeans:v0.5.2-rc2
jeans:v0.5.2-rc1
jeans:v0.5.2-rc0
jeans:v0.5.1
jeans:v0.5.0-rc1
jeans:v0.5.0
jeans:v0.4.8-rc0
jeans:v0.4.7
jeans:v0.4.6
jeans:v0.4.5
jeans:v0.4.4
jeans:v0.4.3
jeans:v0.4.3-rc0
jeans:v0.4.2
jeans:v0.4.2-rc1
jeans:v0.4.2-rc0
jeans:v0.4.1-rc0
jeans:v0.4.1
jeans:v0.4.0
jeans:v0.4.0-rc8
jeans:v0.4.0-rc7
jeans:v0.4.0-rc6
jeans:v0.4.0-rc5
jeans:v0.4.0-rc4
jeans:v0.4.0-rc3
jeans:v0.4.0-rc2
jeans:v0.4.0-rc1
jeans:v0.4.0-rc0
jeans:v0.4.0-ci3
jeans:v0.3.14-rc0
jeans:v0.3.14
jeans:v0.3.13
jeans:v0.3.12
jeans:v0.3.12-rc5
jeans:v0.3.12-rc4
jeans:v0.3.12-rc3
jeans:v0.3.12-rc2
jeans:v0.3.12-rc1
jeans:v0.3.11
jeans:v0.3.11-rc4
jeans:v0.3.11-rc3
jeans:v0.3.11-rc2
jeans:v0.3.11-rc1
jeans:v0.3.10
jeans:v0.3.10-rc1
jeans:v0.3.9
jeans:v0.3.8
jeans:v0.3.7
jeans:v0.3.7-rc6
jeans:v0.3.7-rc5
jeans:v0.3.7-rc4
jeans:v0.3.7-rc3
jeans:v0.3.7-rc2
jeans:v0.3.7-rc1
jeans:v0.3.6
jeans:v0.3.5
jeans:v0.3.4
jeans:v0.3.3
jeans:v0.3.2
jeans:v0.3.1
jeans:v0.3.0
jeans:v0.2.8
jeans:v0.2.8-rc2
jeans:v0.2.8-rc1
jeans:v0.2.7
jeans:v0.2.6
jeans:v0.2.5
jeans:v0.2.4
jeans:v0.2.3
jeans:v0.2.2
jeans:v0.2.2-rc2
jeans:v0.2.2-rc1
jeans:v0.2.1
jeans:v0.2.0
jeans:v0.1.49-rc14
jeans:v0.1.49-rc13
jeans:v0.1.49-rc12
jeans:v0.1.49-rc11
jeans:v0.1.49-rc10
jeans:v0.1.49-rc9
jeans:v0.1.49-rc8
jeans:v0.1.49-rc7
jeans:v0.1.49-rc6
jeans:v0.1.49-rc5
jeans:v0.1.49-rc4
jeans:v0.1.49-rc3
jeans:v0.1.49-rc2
jeans:v0.1.49-rc1
jeans:v0.1.48
jeans:v0.1.47
jeans:v0.1.46
jeans:v0.1.45-rc5
jeans:v0.1.45
jeans:v0.1.45-rc4
jeans:v0.1.45-rc3
jeans:v0.1.45-rc2
jeans:v0.1.45-rc1
jeans:v0.1.44
jeans:v0.1.43
jeans:v0.1.42
jeans:v0.1.41
jeans:v0.1.40
jeans:v0.1.40-rc1
jeans:v0.1.39
jeans:v0.1.39-rc2
jeans:v0.1.39-rc1
jeans:v0.1.38
jeans:v0.1.37
jeans:v0.1.36
jeans:v0.1.35
jeans:v0.1.35-rc1
jeans:v0.1.34
jeans:v0.1.34-rc1
jeans:v0.1.33
jeans:v0.1.33-rc7
jeans:v0.1.33-rc6
jeans:v0.1.33-rc5
jeans:v0.1.33-rc4
jeans:v0.1.33-rc3
jeans:v0.1.33-rc2
jeans:v0.1.33-rc1
jeans:v0.1.32
jeans:v0.1.32-rc2
jeans:v0.1.32-rc1
jeans:v0.1.31
jeans:v0.1.30
jeans:v0.1.29
jeans:v0.1.28
jeans:v0.1.27
jeans:v0.1.26
jeans:v0.1.25
jeans:v0.1.24
jeans:v0.1.23
jeans:v0.1.22
jeans:v0.1.21
jeans:v0.1.20
jeans:v0.1.19
jeans:v0.1.18
jeans:v0.1.17
jeans:v0.1.16
jeans:v0.1.15
jeans:v0.1.14
jeans:v0.1.13
jeans:v0.1.12
jeans:v0.1.11
jeans:v0.1.10
jeans:v0.1.9
jeans:v0.1.8
jeans:v0.1.7
jeans:v0.1.6
jeans:v0.1.5
jeans:v0.1.4
jeans:v0.1.3
jeans:v0.1.2
jeans:v0.1.1
jeans:v0.1.0
jeans:v0.0.21
jeans:v0.0.20
jeans:v0.0.19
jeans:v0.0.18
jeans:v0.0.17
jeans:v0.0.16
jeans:v0.0.15
jeans:v0.0.14
jeans:v0.0.13
jeans:v0.0.12
jeans:v0.0.11
jeans:v0.0.10
jeans:v0.0.9
jeans:v0.0.8
jeans:v0.0.7
jeans:v0.0.6
jeans:v0.0.5
jeans:v0.0.4
jeans:v0.0.3
jeans:v0.0.2
jeans:v0.0.1
...
pull from: jeans:drifkin/num-parallel
jeans:main
jeans:tool-parsing
jeans:jessegross/post_predict
jeans:jessegross/vision_graph
jeans:jmorganca/qwen25vl
jeans:drifkin/thinking-api-support
jeans:jessegross/worst-multimodal
jeans:drifkin/array-head-count-simple
jeans:brucemacd/model-forward-test-ext
jeans:parth/python-function-parsing
jeans:mxyng/qwen3
jeans:mxyng/multiple-eos-tokens
jeans:jmorganca/cuda-compression-none
jeans:drifkin/num-parallel
jeans:drifkin/chat-truncation-fix
jeans:jmorganca/sync
jeans:mxyng/parallel-write-blobs
jeans:parth/python-tools-calling
jeans:drifkin/array-head-count
jeans:brucemacd/create-no-loop
jeans:parth/server-enable-content-stream-with-tools
jeans:qwen25omni
jeans:mxyng/v3
jeans:brucemacd/ropeconfig
jeans:jmorganca/silence-tokenizer
jeans:parth/sample-so-test
jeans:parth/sampling-structured-outputs
jeans:brucemacd/doc-go-engine
jeans:parth/constrained-sampling-json
jeans:jmorganca/mistral-wip
jeans:brucemacd/mistral-small-convert
jeans:parth/sample-unmarshal-json-for-params
jeans:brucemacd/runner-completion
jeans:brucemacd/jomorganca/mistral
jeans:pdevine/bfloat16
jeans:jmorganca/mistral
jeans:brucemacd/mistral
jeans:pdevine/logging
jeans:parth/sample-correctness-fix
jeans:parth/sample-fix-sorting
jeans:jmorgan/sample-fix-sorting-extras
jeans:jmorganca/temp-0-images
jeans:brucemacd/parallel-embed-models
jeans:brucemacd/shim-grammar
jeans:jmorganca/fix-gguf-error
jeans:bmizerany/nameswork
jeans:jmorganca/faster-releases
jeans:bmizerany/validatenames
jeans:brucemacd/err-no-vocab
jeans:brucemacd/rope-config
jeans:brucemacd/err-hint
jeans:brucemacd/qwen2_5
jeans:brucemacd/logprobs
jeans:brucemacd/new_runner_graph_bench
jeans:progress-flicker
jeans:brucemacd/forward-test
jeans:brucemacd/go_qwen2
jeans:pdevine/gemma2
jeans:jmorganca/add-missing-symlink-eval
jeans:mxyng/next-bert
jeans:mxyng/next-debug
jeans:parth/set-context-size-openai
jeans:brucemacd/next-bpe-bench
jeans:brucemacd/next-bpe-test
jeans:brucemacd/new_runner_e2e
jeans:brucemacd/new_runner_qwen2
jeans:pdevine/convert-cohere2
jeans:brucemacd/convert-cli
jeans:parth/log-probs
jeans:mxyng/next-mlx
jeans:mxyng/cmd-history
jeans:parth/templating
jeans:parth/tokenize-detokenize
jeans:brucemacd/check-key-register
jeans:bmizerany/grammar
jeans:jmorganca/vendor-081b29bd
jeans:mxyng/func-checks
jeans:jmorganca/fix-null-format
jeans:parth/fix-default-to-warn-json
jeans:jmorganca/qwen2vl
jeans:jmorganca/no-concat
jeans:parth/cmd-cleanup-SO
jeans:brucemacd/check-key-register-structured-err
jeans:parth/openai-stream-usage
jeans:parth/fix-referencing-so
jeans:stream-tools-stop
jeans:jmorganca/degin-1
jeans:brucemacd/install-path-clean
jeans:brucemacd/push-name-validation
jeans:brucemacd/browser-key-register
jeans:jmorganca/openai-fix-first-message
jeans:jmorganca/fix-proxy
jeans:jessegross/sample
jeans:parth/disallow-streaming-tools
jeans:dhiltgen/remove_submodule
jeans:jmorganca/ga
jeans:jmorganca/mllama
jeans:pdevine/newlines
jeans:mxyng/environ-2
jeans:pdevine/geems-2b
jeans:jmorganca/llama-bump
jeans:mxyng/modelname-7
jeans:mxyng/gin-slog
jeans:mxyng/modelname-6
jeans:jyan/convert-prog
jeans:jyan/quant5
jeans:paligemma-support
jeans:pdevine/import-docs
jeans:jmorganca/openai-context
jeans:jyan/paligemma
jeans:jyan/p2
jeans:jyan/palitest
jeans:bmizerany/embedspeedup
jeans:jmorganca/llama-vit
jeans:brucemacd/allow-ollama
jeans:royh/ep-methods
jeans:royh/whisper
jeans:mxyng/api-models
jeans:mxyng/fix-memory
jeans:jyan/q4_4/8
jeans:jyan/ollama-v
jeans:royh/stream-tools
jeans:roy-embed-parallel
jeans:bmizerany/hrm
jeans:revert-5963-revert-5924-mxyng/llama3.1-rope
jeans:royh/embed-viz
jeans:jyan/local2
jeans:jyan/auth
jeans:jyan/local
jeans:jyan/parse-temp
jeans:jmorganca/template-mistral
jeans:jyan/reord-g
jeans:royh-openai-suffixdocs
jeans:royh-imgembed
jeans:royh-embed-parallel
jeans:jyan/quant4
jeans:royh-precision
jeans:jyan/progress
jeans:pdevine/fix-template
jeans:jyan/quant3
jeans:pdevine/ggla
jeans:mxyng/update-registry-domain
jeans:jmorganca/ggml-static
jeans:mxyng/create-context
jeans:jyan/v0.146
jeans:mxyng/layers-from-files
jeans:build_dist
jeans:bmizerany/noseek
jeans:royh-ls
jeans:royh-name
jeans:timeout
jeans:mxyng/server-timestamp
jeans:bmizerany/nosillyggufslurps
jeans:royh-params
jeans:jmorganca/llama-cpp-7c26775
jeans:royh-openai-delete
jeans:royh-show-rigid
jeans:jmorganca/enable-fa
jeans:jmorganca/no-error-template
jeans:jyan/format
jeans:royh-testdelete
jeans:bmizerany/fastverify
jeans:language_support
jeans:pdevine/ps-glitches
jeans:brucemacd/tokenize
jeans:bruce/iq-quants
jeans:bmizerany/filepathwithcoloninhost
jeans:mxyng/split-bin
jeans:bmizerany/client-registry
jeans:jmorganca/if-none-match
jeans:native
jeans:jmorganca/native
jeans:jmorganca/batch-embeddings
jeans:jmorganca/initcmake
jeans:jmorganca/mm
jeans:pdevine/showggmlinfo
jeans:modenameenforcealphanum
jeans:bmizerany/modenameenforcealphanum
jeans:jmorganca/done-reason
jeans:jmorganca/llama-cpp-8960fe8
jeans:ollama.com
jeans:bmizerany/filepathnobuild
jeans:bmizerany/types/model/defaultfix
jeans:rmdisplaylong
jeans:nogogen
jeans:bmizerany/x
jeans:modelfile-readme
jeans:bmizerany/replacecolon
jeans:jmorganca/limit
jeans:jmorganca/execstack
jeans:jmorganca/replace-assets
jeans:mxyng/tune-concurrency
jeans:jmorganca/testing
jeans:whitespace-detection
jeans:jmorganca/options
jeans:upgrade-all
jeans:scratch
jeans:cuda-search
jeans:mattw/airenamer
jeans:mattw/allmodelsonhuggingface
jeans:mattw/quantcontext
jeans:mattw/whatneedstorun
jeans:brucemacd/llama-mem-calc
jeans:mattw/faq-context
jeans:mattw/communitylinks
jeans:mattw/noprune
jeans:mattw/python-functioncalling
jeans:rename
jeans:mxyng/install
jeans:pulse
jeans:remove-first
jeans:editor
jeans:mattw/selfqueryingretrieval
jeans:cgo
jeans:mattw/howtoquant
jeans:api
jeans:matt/streamingapi
jeans:format-config
jeans:mxyng/extra-args
jeans:shell
jeans:update-nous-hermes
jeans:cp-model
jeans:upload-progress
jeans:fix-unknown-model
jeans:fix-model-names
jeans:delete-fix
jeans:insecure-registry
jeans:ls
jeans:deletemodels
jeans:progressbar
jeans:readme-updates
jeans:license-layers
jeans:skip-list
jeans:list-models
jeans:modelpath
jeans:matt/examplemodelfiles
jeans:distribution
jeans:go-opts
jeans:v0.7.0-rc1
jeans:v0.7.0-rc0
jeans:v0.6.8-rc0
jeans:v0.6.8
jeans:v0.6.7
jeans:v0.6.7-rc2
jeans:v0.6.7-rc1
jeans:v0.6.7-rc0
jeans:v0.6.6
jeans:v0.6.6-rc2
jeans:v0.6.6-rc1
jeans:v0.6.6-rc0
jeans:v0.6.5-rc1
jeans:v0.6.5
jeans:v0.6.5-rc0
jeans:v0.6.4-rc0
jeans:v0.6.4
jeans:v0.6.3-rc1
jeans:v0.6.3
jeans:v0.6.3-rc0
jeans:v0.6.2-rc0
jeans:v0.6.2
jeans:v0.6.1
jeans:v0.6.1-rc0
jeans:v0.6.0-rc0
jeans:v0.6.0
jeans:v0.5.13
jeans:v0.5.13-rc6
jeans:v0.5.13-rc5
jeans:v0.5.13-rc4
jeans:v0.5.13-rc3
jeans:v0.5.13-rc2
jeans:v0.5.13-rc1
jeans:v0.5.13-rc0
jeans:v0.5.12
jeans:v0.5.12-rc1
jeans:v0.5.12-rc0
jeans:v0.5.11
jeans:v0.5.10
jeans:v0.5.9
jeans:v0.5.9-rc0
jeans:v0.5.8-rc13
jeans:v0.5.8
jeans:v0.5.8-rc12
jeans:v0.5.8-rc11
jeans:v0.5.8-rc10
jeans:v0.5.8-rc9
jeans:v0.5.8-rc8
jeans:v0.5.8-rc7
jeans:v0.5.8-rc6
jeans:v0.5.8-rc5
jeans:v0.5.8-rc4
jeans:v0.5.8-rc3
jeans:v0.5.8-rc2
jeans:v0.5.8-rc1
jeans:v0.5.8-rc0
jeans:v0.5.7
jeans:v0.5.6
jeans:v0.5.5
jeans:v0.5.5-rc0
jeans:v0.5.4
jeans:v0.5.3
jeans:v0.5.3-rc0
jeans:v0.5.2
jeans:v0.5.2-rc3
jeans:v0.5.2-rc2
jeans:v0.5.2-rc1
jeans:v0.5.2-rc0
jeans:v0.5.1
jeans:v0.5.0-rc1
jeans:v0.5.0
jeans:v0.4.8-rc0
jeans:v0.4.7
jeans:v0.4.6
jeans:v0.4.5
jeans:v0.4.4
jeans:v0.4.3
jeans:v0.4.3-rc0
jeans:v0.4.2
jeans:v0.4.2-rc1
jeans:v0.4.2-rc0
jeans:v0.4.1-rc0
jeans:v0.4.1
jeans:v0.4.0
jeans:v0.4.0-rc8
jeans:v0.4.0-rc7
jeans:v0.4.0-rc6
jeans:v0.4.0-rc5
jeans:v0.4.0-rc4
jeans:v0.4.0-rc3
jeans:v0.4.0-rc2
jeans:v0.4.0-rc1
jeans:v0.4.0-rc0
jeans:v0.4.0-ci3
jeans:v0.3.14-rc0
jeans:v0.3.14
jeans:v0.3.13
jeans:v0.3.12
jeans:v0.3.12-rc5
jeans:v0.3.12-rc4
jeans:v0.3.12-rc3
jeans:v0.3.12-rc2
jeans:v0.3.12-rc1
jeans:v0.3.11
jeans:v0.3.11-rc4
jeans:v0.3.11-rc3
jeans:v0.3.11-rc2
jeans:v0.3.11-rc1
jeans:v0.3.10
jeans:v0.3.10-rc1
jeans:v0.3.9
jeans:v0.3.8
jeans:v0.3.7
jeans:v0.3.7-rc6
jeans:v0.3.7-rc5
jeans:v0.3.7-rc4
jeans:v0.3.7-rc3
jeans:v0.3.7-rc2
jeans:v0.3.7-rc1
jeans:v0.3.6
jeans:v0.3.5
jeans:v0.3.4
jeans:v0.3.3
jeans:v0.3.2
jeans:v0.3.1
jeans:v0.3.0
jeans:v0.2.8
jeans:v0.2.8-rc2
jeans:v0.2.8-rc1
jeans:v0.2.7
jeans:v0.2.6
jeans:v0.2.5
jeans:v0.2.4
jeans:v0.2.3
jeans:v0.2.2
jeans:v0.2.2-rc2
jeans:v0.2.2-rc1
jeans:v0.2.1
jeans:v0.2.0
jeans:v0.1.49-rc14
jeans:v0.1.49-rc13
jeans:v0.1.49-rc12
jeans:v0.1.49-rc11
jeans:v0.1.49-rc10
jeans:v0.1.49-rc9
jeans:v0.1.49-rc8
jeans:v0.1.49-rc7
jeans:v0.1.49-rc6
jeans:v0.1.49-rc5
jeans:v0.1.49-rc4
jeans:v0.1.49-rc3
jeans:v0.1.49-rc2
jeans:v0.1.49-rc1
jeans:v0.1.48
jeans:v0.1.47
jeans:v0.1.46
jeans:v0.1.45-rc5
jeans:v0.1.45
jeans:v0.1.45-rc4
jeans:v0.1.45-rc3
jeans:v0.1.45-rc2
jeans:v0.1.45-rc1
jeans:v0.1.44
jeans:v0.1.43
jeans:v0.1.42
jeans:v0.1.41
jeans:v0.1.40
jeans:v0.1.40-rc1
jeans:v0.1.39
jeans:v0.1.39-rc2
jeans:v0.1.39-rc1
jeans:v0.1.38
jeans:v0.1.37
jeans:v0.1.36
jeans:v0.1.35
jeans:v0.1.35-rc1
jeans:v0.1.34
jeans:v0.1.34-rc1
jeans:v0.1.33
jeans:v0.1.33-rc7
jeans:v0.1.33-rc6
jeans:v0.1.33-rc5
jeans:v0.1.33-rc4
jeans:v0.1.33-rc3
jeans:v0.1.33-rc2
jeans:v0.1.33-rc1
jeans:v0.1.32
jeans:v0.1.32-rc2
jeans:v0.1.32-rc1
jeans:v0.1.31
jeans:v0.1.30
jeans:v0.1.29
jeans:v0.1.28
jeans:v0.1.27
jeans:v0.1.26
jeans:v0.1.25
jeans:v0.1.24
jeans:v0.1.23
jeans:v0.1.22
jeans:v0.1.21
jeans:v0.1.20
jeans:v0.1.19
jeans:v0.1.18
jeans:v0.1.17
jeans:v0.1.16
jeans:v0.1.15
jeans:v0.1.14
jeans:v0.1.13
jeans:v0.1.12
jeans:v0.1.11
jeans:v0.1.10
jeans:v0.1.9
jeans:v0.1.8
jeans:v0.1.7
jeans:v0.1.6
jeans:v0.1.5
jeans:v0.1.4
jeans:v0.1.3
jeans:v0.1.2
jeans:v0.1.1
jeans:v0.1.0
jeans:v0.0.21
jeans:v0.0.20
jeans:v0.0.19
jeans:v0.0.18
jeans:v0.0.17
jeans:v0.0.16
jeans:v0.0.15
jeans:v0.0.14
jeans:v0.0.13
jeans:v0.0.12
jeans:v0.0.11
jeans:v0.0.10
jeans:v0.0.9
jeans:v0.0.8
jeans:v0.0.7
jeans:v0.0.6
jeans:v0.0.5
jeans:v0.0.4
jeans:v0.0.3
jeans:v0.0.2
jeans:v0.0.1
1 Commits
main
...
drifkin/num-parallel
Author | SHA1 | Message | Date | |
---|---|---|---|---|
![]() |
67335dede2
|
lower default NUM_PARALLEL to 2
This is in part to "pay" for #10452, which doubled the default context length. The combination isn't fully neutral, though: although the old 4x2k limit and the new 2x4k limit are memory equivalent, the 1x fallback is larger with 4k. |
1 changed file with 1 addition and 1 deletion
|
@ -58,7 +58,7 @@ var defaultModelsPerGPU = 3
|
|||
// Default automatic value for parallel setting
|
||||
// Model will still need to fit in VRAM. If this setting won't fit
|
||||
// we'll back off down to 1 to try to get it to fit
|
||||
var defaultParallel = 4
|
||||
var defaultParallel = 2
|
||||
|
||||
var ErrMaxQueue = errors.New("server busy, please try again. maximum pending requests exceeded")
|
||||
|
||||
|
|
Write
Preview
Loading…
x
Reference in New Issue
Block a user
Blocking a user prevents them from interacting with repositories, such as opening or commenting on pull requests or issues. Learn more about blocking a user.