Installed with: LOCALAI=http://localhost:31245 curl $LOCALAI/models/apply -H "Content-Type: application/json" -d '{ "config_url": "https://gist.github.com/tnpb-encora/ccf1b39c1fc154d1b32aa36e23a5d13f/raw/0de37af43d5165987e1564c2d43e82c26357b8a5/ggml-model-q4.yaml" }' ##################################################################################################################################################################### rest embedding Command: curl http://localhost:31245/embeddings -X POST -H "Content-Type: application/json" -d '{ "input": "Your text string goes here", "model": "ggml-q4-embeddings" }' | jq "." % Total % Received % Xferd Average Speed Time Time Time Current Dload Upload Total Spent Left Speed 100 167 100 91 100 76 6 5 0:00:15 0:00:14 0:00:01 23 { "error": { "code": 500, "message": "rpc error: code = Unknown desc = unimplemented", "type": "" } } ##################################################################################################################################################################### 6:47PM DBG Request received: {"model":"ggml-q4-embeddings","language":"","n":0,"top_p":null,"top_k":null,"temperature":null,"max_tokens":null,"echo":false,"batch":0,"ignore_eos":false,"repeat_penalty":0,"n_keep":0,"frequency_penalty":0,"presence_penalty":0,"tfz":null,"typical_p":null,"seed":null,"negative_prompt":"","rope_freq_base":0,"rope_freq_scale":0,"negative_prompt_scale":0,"use_fast_tokenizer":false,"clip_skip":0,"tokenizer":"","file":"","response_format":{},"size":"","prompt":null,"instruction":"","input":"Your text string goes here","stop":null,"messages":null,"functions":null,"function_call":null,"stream":false,"mode":0,"step":0,"grammar":"","grammar_json_functions":null,"backend":"","model_base_name":""} 6:47PM DBG Parameter Config: &{PredictionOptions:{Model: Language: N:0 TopP:0xc0002d5148 TopK:0xc0002d5150 Temperature:0xc0002d5158 Maxtokens:0xc0002d5188 
Echo:false Batch:0 IgnoreEOS:false RepeatPenalty:0 Keep:0 FrequencyPenalty:0 PresencePenalty:0 TFZ:0xc0002d5180 TypicalP:0xc0002d5178 Seed:0xc0002d51a0 NegativePrompt: RopeFreqBase:0 RopeFreqScale:0 NegativePromptScale:0 UseFastTokenizer:false ClipSkip:0 Tokenizer:} Name:ggml-q4-embeddings F16:0xc0002d5140 Threads:0xc0002d5138 Debug:0xc0002865e0 Roles:map[] Embeddings:false Backend: TemplateConfig:{Chat: ChatMessage: Completion: Edit: Functions: UseTokenizerTemplate:false} PromptStrings:[] InputStrings:[Your text string goes here] InputToken:[] functionCallString: functionCallNameString: FunctionsConfig:{DisableNoAction:false NoActionFunctionName: NoActionDescriptionName: ParallelCalls:false NoGrammar:false ResponseRegex:} FeatureFlag:map[] LLMConfig:{SystemPrompt: TensorSplit: MainGPU: RMSNormEps:0 NGQA:0 PromptCachePath: PromptCacheAll:false PromptCacheRO:false MirostatETA:0xc0002d5170 MirostatTAU:0xc0002d5168 Mirostat:0xc0002d5160 NGPULayers:0xc0002d5190 MMap:0xc0002d5198 MMlock:0xc0002d5199 LowVRAM:0xc0002d5199 Grammar: StopWords:[] Cutstrings:[] TrimSpace:[] TrimSuffix:[] ContextSize:0xc0002d5130 NUMA:false LoraAdapter: LoraBase: LoraScale:0 NoMulMatQ:false DraftModel: NDraft:0 Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: ModelType: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0} AutoGPTQ:{ModelBaseName: Device: Triton:false UseFastTokenizer:false} Diffusers:{CUDA:false PipelineType: SchedulerType: EnableParameters: CFGScale:0 IMG2IMG:false ClipSkip:0 ClipModel: ClipSubFolder: ControlNet:} Step:0 GRPC:{Attempts:0 AttemptsSleepTime:0} VallE:{AudioPath:} CUDA:false DownloadFiles:[] Description:Bert model that can be used for embeddings Usage:} 6:47PM INF [llama-cpp] Attempting to load 6:47PM INF Loading model with backend llama-cpp 6:47PM DBG Loading model in memory from file: /build/models 6:47PM DBG Loading Model with gRPC (file: /build/models) 
(backend: llama-cpp): {backendString:llama-cpp model: threads:4 assetDir:/tmp/localai/backend_data context:{emptyCtx:{}} gRPCOptions:0xc000249800 externalBackends:map[autogptq:/build/backend/python/autogptq/run.sh bark:/build/backend/python/bark/run.sh coqui:/build/backend/python/coqui/run.sh diffusers:/build/backend/python/diffusers/run.sh exllama:/build/backend/python/exllama/run.sh exllama2:/build/backend/python/exllama2/run.sh huggingface-embeddings:/build/backend/python/sentencetransformers/run.sh mamba:/build/backend/python/mamba/run.sh parler-tts:/build/backend/python/parler-tts/run.sh petals:/build/backend/python/petals/run.sh rerankers:/build/backend/python/rerankers/run.sh sentencetransformers:/build/backend/python/sentencetransformers/run.sh transformers:/build/backend/python/transformers/run.sh transformers-musicgen:/build/backend/python/transformers-musicgen/run.sh vall-e-x:/build/backend/python/vall-e-x/run.sh vllm:/build/backend/python/vllm/run.sh] grpcAttempts:20 grpcAttemptsDelay:2 singleActiveBackend:false parallelRequests:false} 6:47PM DBG Loading GRPC Process: /tmp/localai/backend_data/backend-assets/grpc/llama-cpp 6:47PM DBG GRPC Service for will be running at: '127.0.0.1:36869' 6:47PM DBG GRPC Service state dir: /tmp/go-processmanager324751868 6:47PM DBG GRPC Service Started 6:47PM DBG GRPC(-127.0.0.1:36869): stdout Server listening on 127.0.0.1:36869 6:47PM DBG GRPC Service Ready 6:47PM DBG GRPC: Loading model with options: {state:{NoUnkeyedLiterals:{} DoNotCompare:[] DoNotCopy:[] atomicMessageInfo:} sizeCache:0 unknownFields:[] Model: ContextSize:1024 Seed:318952489 NBatch:512 F16Memory:false MLock:false MMap:true VocabOnly:false LowVRAM:false Embeddings:false NUMA:false NGPULayers:99999999 MainGPU: TensorSplit: Threads:4 LibrarySearchPath: RopeFreqBase:0 RopeFreqScale:0 RMSNormEps:0 NGQA:0 ModelFile:/build/models Device: UseTriton:false ModelBaseName: UseFastTokenizer:false PipelineType: SchedulerType: CUDA:false CFGScale:0 IMG2IMG:false 
CLIPModel: CLIPSubfolder: CLIPSkip:0 ControlNet: Tokenizer: LoraBase: LoraAdapter: LoraScale:0 NoMulMatQ:false DraftModel: AudioPath: Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0 Type:} 6:47PM DBG GRPC(-127.0.0.1:36869): stderr gguf_init_from_file: invalid magic characters '' 6:47PM DBG GRPC(-127.0.0.1:36869): stderr llama_model_load: error loading model: llama_model_loader: failed to load model from /build/models 6:47PM DBG GRPC(-127.0.0.1:36869): stderr 6:47PM DBG GRPC(-127.0.0.1:36869): stderr llama_load_model_from_file: failed to load model 6:47PM DBG GRPC(-127.0.0.1:36869): stderr llama_init_from_gpt_params: error: failed to load model '/build/models' 6:47PM DBG GRPC(-127.0.0.1:36869): stdout {"timestamp":1714157252,"level":"ERROR","function":"load_model","line":464,"message":"unable to load model","model":"/build/models"} 6:47PM INF [llama-cpp] Fails: could not load model: rpc error: code = Canceled desc = 6:47PM INF [llama-ggml] Attempting to load 6:47PM INF Loading model with backend llama-ggml 6:47PM DBG Loading model in memory from file: /build/models 6:47PM DBG Loading Model with gRPC (file: /build/models) (backend: llama-ggml): {backendString:llama-ggml model: threads:4 assetDir:/tmp/localai/backend_data context:{emptyCtx:{}} gRPCOptions:0xc000249800 externalBackends:map[autogptq:/build/backend/python/autogptq/run.sh bark:/build/backend/python/bark/run.sh coqui:/build/backend/python/coqui/run.sh diffusers:/build/backend/python/diffusers/run.sh exllama:/build/backend/python/exllama/run.sh exllama2:/build/backend/python/exllama2/run.sh huggingface-embeddings:/build/backend/python/sentencetransformers/run.sh mamba:/build/backend/python/mamba/run.sh parler-tts:/build/backend/python/parler-tts/run.sh petals:/build/backend/python/petals/run.sh rerankers:/build/backend/python/rerankers/run.sh 
sentencetransformers:/build/backend/python/sentencetransformers/run.sh transformers:/build/backend/python/transformers/run.sh transformers-musicgen:/build/backend/python/transformers-musicgen/run.sh vall-e-x:/build/backend/python/vall-e-x/run.sh vllm:/build/backend/python/vllm/run.sh] grpcAttempts:20 grpcAttemptsDelay:2 singleActiveBackend:false parallelRequests:false} 6:47PM DBG Loading GRPC Process: /tmp/localai/backend_data/backend-assets/grpc/llama-ggml 6:47PM DBG GRPC Service for will be running at: '127.0.0.1:39035' 6:47PM DBG GRPC Service state dir: /tmp/go-processmanager2418100101 6:47PM DBG GRPC Service Started 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 2024/04/26 18:47:32 gRPC Server listening at 127.0.0.1:39035 6:47PM DBG GRPC Service Ready 6:47PM DBG GRPC: Loading model with options: {state:{NoUnkeyedLiterals:{} DoNotCompare:[] DoNotCopy:[] atomicMessageInfo:} sizeCache:0 unknownFields:[] Model: ContextSize:1024 Seed:318952489 NBatch:512 F16Memory:false MLock:false MMap:true VocabOnly:false LowVRAM:false Embeddings:false NUMA:false NGPULayers:99999999 MainGPU: TensorSplit: Threads:4 LibrarySearchPath: RopeFreqBase:0 RopeFreqScale:0 RMSNormEps:0 NGQA:0 ModelFile:/build/models Device: UseTriton:false ModelBaseName: UseFastTokenizer:false PipelineType: SchedulerType: CUDA:false CFGScale:0 IMG2IMG:false CLIPModel: CLIPSubfolder: CLIPSkip:0 ControlNet: Tokenizer: LoraBase: LoraAdapter: LoraScale:0 NoMulMatQ:false DraftModel: AudioPath: Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0 Type:} 6:47PM DBG GRPC(-127.0.0.1:39035): stderr create_gpt_params: loading model /build/models 6:47PM DBG GRPC(-127.0.0.1:39035): stderr SIGILL: illegal instruction 6:47PM DBG GRPC(-127.0.0.1:39035): stderr PC=0x8af8dd m=5 sigcode=2 6:47PM DBG GRPC(-127.0.0.1:39035): stderr signal arrived during cgo execution 6:47PM DBG 
GRPC(-127.0.0.1:39035): stderr instruction bytes: 0xc4 0xe2 0x71 0xa9 0x15 0x3a 0xd7 0x20 0x0 0xc5 0xfa 0x11 0x4c 0x24 0x10 0xc5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 50 gp=0xc0001e3500 m=5 mp=0xc0000bb808 [syscall]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.cgocall(0x8434a0, 0xc000433640) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/cgocall.go:157 +0x4b fp=0xc000433618 sp=0xc0004335e0 pc=0x4145eb 6:47PM DBG GRPC(-127.0.0.1:39035): stderr github.com/go-skynet/go-llama%2ecpp._Cfunc_load_model(0x22009e0, 0x400, 0x0, 0x0, 0x0, 0x0, 0x1, 0x0, 0x5f5e0ff, 0x200, ...) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr _cgo_gotypes.go:254 +0x4c fp=0xc000433640 sp=0xc000433618 pc=0x83706c 6:47PM DBG GRPC(-127.0.0.1:39035): stderr github.com/go-skynet/go-llama%2ecpp.New({0xc00010e220, 0xd}, {0xc00011e1c0, 0x8, 0x92c8a0?}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /build/sources/go-llama.cpp/llama.go:28 +0x28a fp=0xc0004337c0 sp=0xc000433640 pc=0x83780a 6:47PM DBG GRPC(-127.0.0.1:39035): stderr main.(*LLM).Load(0xc0000376a0, 0xc00014a000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /build/backend/go/llm/llama-ggml/llama.go:73 +0x92e fp=0xc000433900 sp=0xc0004337c0 pc=0x84096e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr github.com/go-skynet/LocalAI/pkg/grpc.(*server).LoadModel(0xc000037750, {0x9b4400?, 0xc0000c49e8?}, 0xc00014a000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /build/pkg/grpc/server.go:50 +0xe7 fp=0xc0004339a8 sp=0xc000433900 pc=0x83d6c7 6:47PM DBG GRPC(-127.0.0.1:39035): stderr github.com/go-skynet/LocalAI/pkg/grpc/proto._Backend_LoadModel_Handler({0x9b4400, 0xc000037750}, {0xa97320, 0xc00011c2d0}, 0xc000120080, 0x0) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /build/pkg/grpc/proto/backend_grpc.pb.go:352 +0x1a6 fp=0xc0004339f8 sp=0xc0004339a8 pc=0x831646 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 
google.golang.org/grpc.(*Server).processUnaryRPC(0xc00024c1e0, {0xa97320, 0xc00011c210}, {0xa9ad00, 0xc000426000}, 0xc00013a000, 0xc000260300, 0xdd71d0, 0x0) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:1343 +0xdd1 fp=0xc000433df0 sp=0xc0004339f8 pc=0x8185b1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc.(*Server).handleStream(0xc00024c1e0, {0xa9ad00, 0xc000426000}, 0xc00013a000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:1737 +0xc47 fp=0xc000433f78 sp=0xc000433df0 pc=0x81d567 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc.(*Server).serveStreams.func1.1() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:986 +0x86 fp=0xc000433fe0 sp=0xc000433f78 pc=0x816486 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc000433fe8 sp=0xc000433fe0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by google.golang.org/grpc.(*Server).serveStreams.func1 in goroutine 36 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:997 +0x136 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 1 gp=0xc0000061c0 m=nil [IO wait]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0xc000044a08?, 0x0?, 0xc0?, 0x61?, 0xc000245b60?) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc000245b28 sp=0xc000245b08 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.netpollblock(0xc000245bc0?, 0x413d86?, 0x0?) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/netpoll.go:573 +0xf7 fp=0xc000245b60 sp=0xc000245b28 pc=0x443a17 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.runtime_pollWait(0x7f5b31dbbf20, 0x72) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/netpoll.go:345 +0x85 fp=0xc000245b80 sp=0xc000245b60 pc=0x477785 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.(*pollDesc).wait(0x3?, 0x1?, 0x0) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc000245ba8 sp=0xc000245b80 pc=0x4e1fa7 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.(*pollDesc).waitRead(...) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/internal/poll/fd_poll_runtime.go:89 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.(*FD).Accept(0xc0001f4e00) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/internal/poll/fd_unix.go:611 +0x2ac fp=0xc000245c50 sp=0xc000245ba8 pc=0x4e734c 6:47PM DBG GRPC(-127.0.0.1:39035): stderr net.(*netFD).accept(0xc0001f4e00) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/net/fd_unix.go:172 +0x29 fp=0xc000245d08 sp=0xc000245c50 pc=0x56bdc9 6:47PM DBG GRPC(-127.0.0.1:39035): stderr net.(*TCPListener).accept(0xc0000d45a0) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/net/tcpsock_posix.go:159 +0x1e fp=0xc000245d30 sp=0xc000245d08 pc=0x58317e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr net.(*TCPListener).Accept(0xc0000d45a0) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/net/tcpsock.go:327 
+0x30 fp=0xc000245d60 sp=0xc000245d30 pc=0x582370 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc.(*Server).Serve(0xc00024c1e0, {0xa96930, 0xc0000d45a0}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:852 +0x469 fp=0xc000245e98 sp=0xc000245d60 pc=0x815109 6:47PM DBG GRPC(-127.0.0.1:39035): stderr github.com/go-skynet/LocalAI/pkg/grpc.StartServer({0x7ffd84530990?, 0xc000024280?}, {0xa9d010, 0xc0000376a0}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /build/pkg/grpc/server.go:226 +0x170 fp=0xc000245f20 sp=0xc000245e98 pc=0x83fd90 6:47PM DBG GRPC(-127.0.0.1:39035): stderr main.main() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /build/backend/go/llm/llama-ggml/main.go:16 +0x85 fp=0xc000245f50 sp=0xc000245f20 pc=0x8429c5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.main() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:271 +0x29d fp=0xc000245fe0 sp=0xc000245f50 pc=0x44a7dd 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc000245fe8 sp=0xc000245fe0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 2 gp=0xc000006c40 m=nil [force gc (idle)]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc0000b4fa8 sp=0xc0000b4f88 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goparkunlock(...) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:408 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.forcegchelper() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:326 +0xb3 fp=0xc0000b4fe0 sp=0xc0000b4fa8 pc=0x44aa93 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc0000b4fe8 sp=0xc0000b4fe0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by runtime.init.6 in goroutine 1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:314 +0x1a 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 3 gp=0xc000007180 m=nil [GC sweep wait]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc0000b5780 sp=0xc0000b5760 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goparkunlock(...) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:408 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.bgsweep(0xc0000de000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mgcsweep.go:278 +0x94 fp=0xc0000b57c8 sp=0xc0000b5780 pc=0x436214 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gcenable.gowrap1() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mgc.go:203 +0x25 fp=0xc0000b57e0 sp=0xc0000b57c8 pc=0x42ab65 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc0000b57e8 sp=0xc0000b57e0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by runtime.gcenable in goroutine 1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mgc.go:203 +0x66 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 4 gp=0xc000007340 m=nil [GC scavenge wait]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0xc0000de000?, 0xa8ee10?, 0x1?, 0x0?, 0xc000007340?) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc0000b5f78 sp=0xc0000b5f58 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goparkunlock(...) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:408 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.(*scavengerState).park(0xe240e0) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mgcscavenge.go:425 +0x49 fp=0xc0000b5fa8 sp=0xc0000b5f78 pc=0x433c09 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.bgscavenge(0xc0000de000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mgcscavenge.go:653 +0x3c fp=0xc0000b5fc8 sp=0xc0000b5fa8 pc=0x43419c 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gcenable.gowrap2() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mgc.go:204 +0x25 fp=0xc0000b5fe0 sp=0xc0000b5fc8 pc=0x42ab05 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc0000b5fe8 sp=0xc0000b5fe0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by runtime.gcenable in goroutine 1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mgc.go:204 +0xa5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 5 gp=0xc000007c00 m=nil [finalizer wait]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0xc0000b4648?, 0x41e245?, 0xa8?, 0x1?, 0xc0000061c0?) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc0000b4620 sp=0xc0000b4600 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.runfinq() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mfinal.go:194 +0x107 fp=0xc0000b47e0 sp=0xc0000b4620 pc=0x429ba7 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc0000b47e8 sp=0xc0000b47e0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by runtime.createfing in goroutine 1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/mfinal.go:164 +0x3d 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 34 gp=0xc00043a000 m=nil [select]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0xc00012bf00?, 0x2?, 0x1e?, 0x0?, 0xc00012bed4?) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc00012bd80 sp=0xc00012bd60 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.selectgo(0xc00012bf00, 0xc00012bed0, 0x7afd96?, 0x0, 0xc000410000?, 0x1) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/select.go:327 +0x725 fp=0xc00012bea0 sp=0xc00012bd80 pc=0x45bf85 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc/internal/transport.(*controlBuffer).get(0xc00040e050, 0x1) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/controlbuf.go:418 +0x113 fp=0xc00012bf30 sp=0xc00012bea0 pc=0x78ecb3 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc/internal/transport.(*loopyWriter).run(0xc000122000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/controlbuf.go:552 +0x86 fp=0xc00012bf90 sp=0xc00012bf30 pc=0x78f406 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc/internal/transport.NewServerTransport.func2() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/http2_server.go:336 +0xd5 fp=0xc00012bfe0 sp=0xc00012bf90 pc=0x7a5cf5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc00012bfe8 sp=0xc00012bfe0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by google.golang.org/grpc/internal/transport.NewServerTransport in goroutine 19 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/http2_server.go:333 +0x1a8c 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 35 
gp=0xc00043a1c0 m=nil [select]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0xc000440740?, 0x4?, 0xf0?, 0x5?, 0xc0004406c0?) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc000440558 sp=0xc000440538 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.selectgo(0xc000440740, 0xc0004406b8, 0x0?, 0x0, 0x0?, 0x1) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/select.go:327 +0x725 fp=0xc000440678 sp=0xc000440558 pc=0x45bf85 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc/internal/transport.(*http2Server).keepalive(0xc000426000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/http2_server.go:1152 +0x205 fp=0xc0004407c8 sp=0xc000440678 pc=0x7ace45 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc/internal/transport.NewServerTransport.gowrap1() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/http2_server.go:339 +0x25 fp=0xc0004407e0 sp=0xc0004407c8 pc=0x7a5be5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc0004407e8 sp=0xc0004407e0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by google.golang.org/grpc/internal/transport.NewServerTransport in goroutine 19 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/http2_server.go:339 +0x1ace 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr goroutine 36 gp=0xc00043a380 m=nil [IO wait]: 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.gopark(0x9962c0?, 0xc00011c1e0?, 0xe8?, 0x70?, 0xb?) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/proc.go:402 +0xce fp=0xc00028cab0 sp=0xc00028ca90 pc=0x44ac0e 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.netpollblock(0x4c8078?, 0x413d86?, 0x0?) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/netpoll.go:573 +0xf7 fp=0xc00028cae8 sp=0xc00028cab0 pc=0x443a17 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.runtime_pollWait(0x7f5b31dbbe28, 0x72) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/netpoll.go:345 +0x85 fp=0xc00028cb08 sp=0xc00028cae8 pc=0x477785 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.(*pollDesc).wait(0xc000340400?, 0xc000406000?, 0x0) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc00028cb30 sp=0xc00028cb08 pc=0x4e1fa7 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.(*pollDesc).waitRead(...) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/internal/poll/fd_poll_runtime.go:89 6:47PM DBG GRPC(-127.0.0.1:39035): stderr internal/poll.(*FD).Read(0xc000340400, {0xc000406000, 0x8000, 0x8000}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/internal/poll/fd_unix.go:164 +0x27a fp=0xc00028cbc8 sp=0xc00028cb30 pc=0x4e329a 6:47PM DBG GRPC(-127.0.0.1:39035): stderr net.(*netFD).Read(0xc000340400, {0xc000406000?, 0x1060100000000?, 0x8?}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/net/fd_posix.go:55 +0x25 fp=0xc00028cc10 sp=0xc00028cbc8 pc=0x569de5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr net.(*conn).Read(0xc00033c050, {0xc000406000?, 0x800010601?, 0xc000000000?}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/net/net.go:179 +0x45 fp=0xc00028cc58 sp=0xc00028cc10 pc=0x57a385 6:47PM DBG GRPC(-127.0.0.1:39035): stderr net.(*TCPConn).Read(0x0?, {0xc000406000?, 0xc00028ccb0?, 0x46a5ed?}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr :1 +0x25 fp=0xc00028cc88 sp=0xc00028cc58 pc=0x58c4a5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr bufio.(*Reader).Read(0xc000404000, {0xc000418040, 0x9, 0xc0000bb008?}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/bufio/bufio.go:241 +0x197 fp=0xc00028ccc0 sp=0xc00028cc88 pc=0x52f657 6:47PM DBG GRPC(-127.0.0.1:39035): stderr io.ReadAtLeast({0xa93fa0, 0xc000404000}, {0xc000418040, 0x9, 0x9}, 0x9) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/io/io.go:335 +0x90 fp=0xc00028cd08 sp=0xc00028ccc0 pc=0x4c1eb0 6:47PM DBG GRPC(-127.0.0.1:39035): stderr io.ReadFull(...) 
6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/io/io.go:354 6:47PM DBG GRPC(-127.0.0.1:39035): stderr golang.org/x/net/http2.readFrameHeader({0xc000418040, 0x9, 0xc00042a030?}, {0xa93fa0?, 0xc000404000?}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/x/net@v0.24.0/http2/frame.go:237 +0x65 fp=0xc00028cd58 sp=0xc00028cd08 pc=0x77be25 6:47PM DBG GRPC(-127.0.0.1:39035): stderr golang.org/x/net/http2.(*Framer).ReadFrame(0xc000418000) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/x/net@v0.24.0/http2/frame.go:498 +0x85 fp=0xc00028ce00 sp=0xc00028cd58 pc=0x77c565 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc/internal/transport.(*http2Server).HandleStreams(0xc000426000, 0xc00041c210) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/internal/transport/http2_server.go:636 +0x145 fp=0xc00028cf08 sp=0xc00028ce00 pc=0x7a8d85 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc.(*Server).serveStreams(0xc00024c1e0, {0xa9ad00, 0xc000426000}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:979 +0x1aa fp=0xc00028cf80 sp=0xc00028cf08 pc=0x81624a 6:47PM DBG GRPC(-127.0.0.1:39035): stderr google.golang.org/grpc.(*Server).handleRawConn.func1() 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:920 +0x45 fp=0xc00028cfe0 sp=0xc00028cf80 pc=0x815aa5 6:47PM DBG GRPC(-127.0.0.1:39035): stderr runtime.goexit({}) 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/golang.org/toolchain@v0.0.1-go1.22.2.linux-amd64/src/runtime/asm_amd64.s:1695 +0x1 fp=0xc00028cfe8 sp=0xc00028cfe0 pc=0x47c8c1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr created by google.golang.org/grpc.(*Server).handleRawConn in goroutine 19 6:47PM DBG GRPC(-127.0.0.1:39035): stderr /root/go/pkg/mod/google.golang.org/grpc@v1.59.0/server.go:919 
+0x15b 6:47PM DBG GRPC(-127.0.0.1:39035): stderr 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rax 0x0 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rbx 0xeca420 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rcx 0x18 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rdx 0x2383ec66 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rdi 0x1 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rsi 0x12b0f6 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rbp 0xeea420 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rsp 0x7f5b32df47f0 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r8 0xd 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r9 0x0 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r10 0x7ffd845cf080 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r11 0x7ffd845cf090 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r12 0xf0a420 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r13 0xf2a420 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r14 0xe8a420 6:47PM DBG GRPC(-127.0.0.1:39035): stderr r15 0x0 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rip 0x8af8dd 6:47PM DBG GRPC(-127.0.0.1:39035): stderr rflags 0x10206 6:47PM DBG GRPC(-127.0.0.1:39035): stderr cs 0x33 6:47PM DBG GRPC(-127.0.0.1:39035): stderr fs 0x0 6:47PM DBG GRPC(-127.0.0.1:39035): stderr gs 0x0 6:47PM INF [llama-ggml] Fails: could not load model: rpc error: code = Unavailable desc = error reading from server: EOF 6:47PM INF [gpt4all] Attempting to load 6:47PM INF Loading model with backend gpt4all 6:47PM DBG Loading model in memory from file: /build/models 6:47PM DBG Loading Model with gRPC (file: /build/models) (backend: gpt4all): {backendString:gpt4all model: threads:4 assetDir:/tmp/localai/backend_data context:{emptyCtx:{}} gRPCOptions:0xc000249800 externalBackends:map[autogptq:/build/backend/python/autogptq/run.sh bark:/build/backend/python/bark/run.sh coqui:/build/backend/python/coqui/run.sh diffusers:/build/backend/python/diffusers/run.sh exllama:/build/backend/python/exllama/run.sh exllama2:/build/backend/python/exllama2/run.sh 
huggingface-embeddings:/build/backend/python/sentencetransformers/run.sh mamba:/build/backend/python/mamba/run.sh parler-tts:/build/backend/python/parler-tts/run.sh petals:/build/backend/python/petals/run.sh rerankers:/build/backend/python/rerankers/run.sh sentencetransformers:/build/backend/python/sentencetransformers/run.sh transformers:/build/backend/python/transformers/run.sh transformers-musicgen:/build/backend/python/transformers-musicgen/run.sh vall-e-x:/build/backend/python/vall-e-x/run.sh vllm:/build/backend/python/vllm/run.sh] grpcAttempts:20 grpcAttemptsDelay:2 singleActiveBackend:false parallelRequests:false} 6:47PM DBG Loading GRPC Process: /tmp/localai/backend_data/backend-assets/grpc/gpt4all 6:47PM DBG GRPC Service for will be running at: '127.0.0.1:37251' 6:47PM DBG GRPC Service state dir: /tmp/go-processmanager2469591872 6:47PM DBG GRPC Service Started 6:47PM DBG GRPC(-127.0.0.1:37251): stderr 2024/04/26 18:47:34 gRPC Server listening at 127.0.0.1:37251 6:47PM DBG GRPC Service Ready 6:47PM DBG GRPC: Loading model with options: {state:{NoUnkeyedLiterals:{} DoNotCompare:[] DoNotCopy:[] atomicMessageInfo:} sizeCache:0 unknownFields:[] Model: ContextSize:1024 Seed:318952489 NBatch:512 F16Memory:false MLock:false MMap:true VocabOnly:false LowVRAM:false Embeddings:false NUMA:false NGPULayers:99999999 MainGPU: TensorSplit: Threads:4 LibrarySearchPath:/tmp/localai/backend_data/backend-assets/gpt4all RopeFreqBase:0 RopeFreqScale:0 RMSNormEps:0 NGQA:0 ModelFile:/build/models Device: UseTriton:false ModelBaseName: UseFastTokenizer:false PipelineType: SchedulerType: CUDA:false CFGScale:0 IMG2IMG:false CLIPModel: CLIPSubfolder: CLIPSkip:0 ControlNet: Tokenizer: LoraBase: LoraAdapter: LoraScale:0 NoMulMatQ:false DraftModel: AudioPath: Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0 Type:} 6:47PM DBG 
GRPC(-127.0.0.1:37251): stderr load_model: error 'Is a directory' 6:47PM INF [gpt4all] Fails: could not load model: rpc error: code = Unknown desc = failed loading model 6:47PM INF [bert-embeddings] Attempting to load 6:47PM INF Loading model with backend bert-embeddings 6:47PM DBG Loading model in memory from file: /build/models 6:47PM DBG Loading Model with gRPC (file: /build/models) (backend: bert-embeddings): {backendString:bert-embeddings model: threads:4 assetDir:/tmp/localai/backend_data context:{emptyCtx:{}} gRPCOptions:0xc000249800 externalBackends:map[autogptq:/build/backend/python/autogptq/run.sh bark:/build/backend/python/bark/run.sh coqui:/build/backend/python/coqui/run.sh diffusers:/build/backend/python/diffusers/run.sh exllama:/build/backend/python/exllama/run.sh exllama2:/build/backend/python/exllama2/run.sh huggingface-embeddings:/build/backend/python/sentencetransformers/run.sh mamba:/build/backend/python/mamba/run.sh parler-tts:/build/backend/python/parler-tts/run.sh petals:/build/backend/python/petals/run.sh rerankers:/build/backend/python/rerankers/run.sh sentencetransformers:/build/backend/python/sentencetransformers/run.sh transformers:/build/backend/python/transformers/run.sh transformers-musicgen:/build/backend/python/transformers-musicgen/run.sh vall-e-x:/build/backend/python/vall-e-x/run.sh vllm:/build/backend/python/vllm/run.sh] grpcAttempts:20 grpcAttemptsDelay:2 singleActiveBackend:false parallelRequests:false} 6:47PM DBG Loading GRPC Process: /tmp/localai/backend_data/backend-assets/grpc/bert-embeddings 6:47PM DBG GRPC Service for will be running at: '127.0.0.1:34329' 6:47PM DBG GRPC Service state dir: /tmp/go-processmanager3445786936 6:47PM DBG GRPC Service Started 6:47PM DBG GRPC(-127.0.0.1:34329): stderr 2024/04/26 18:47:36 gRPC Server listening at 127.0.0.1:34329 6:47PM DBG GRPC Service Ready 6:47PM DBG GRPC: Loading model with options: {state:{NoUnkeyedLiterals:{} DoNotCompare:[] DoNotCopy:[] atomicMessageInfo:} sizeCache:0 
unknownFields:[] Model: ContextSize:1024 Seed:318952489 NBatch:512 F16Memory:false MLock:false MMap:true VocabOnly:false LowVRAM:false Embeddings:false NUMA:false NGPULayers:99999999 MainGPU: TensorSplit: Threads:4 LibrarySearchPath:/tmp/localai/backend_data/backend-assets/gpt4all RopeFreqBase:0 RopeFreqScale:0 RMSNormEps:0 NGQA:0 ModelFile:/build/models Device: UseTriton:false ModelBaseName: UseFastTokenizer:false PipelineType: SchedulerType: CUDA:false CFGScale:0 IMG2IMG:false CLIPModel: CLIPSubfolder: CLIPSkip:0 ControlNet: Tokenizer: LoraBase: LoraAdapter: LoraScale:0 NoMulMatQ:false DraftModel: AudioPath: Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0 Type:} 6:47PM DBG GRPC(-127.0.0.1:34329): stderr bert_load_from_file: invalid model file '/build/models' (bad magic) 6:47PM DBG GRPC(-127.0.0.1:34329): stderr bert_bootstrap: failed to load model from '/build/models' 6:47PM INF [bert-embeddings] Fails: could not load model: rpc error: code = Unknown desc = failed loading model 6:47PM INF [rwkv] Attempting to load 6:47PM INF Loading model with backend rwkv 6:47PM DBG Loading model in memory from file: /build/models 6:47PM DBG Loading Model with gRPC (file: /build/models) (backend: rwkv): {backendString:rwkv model: threads:4 assetDir:/tmp/localai/backend_data context:{emptyCtx:{}} gRPCOptions:0xc000249800 externalBackends:map[autogptq:/build/backend/python/autogptq/run.sh bark:/build/backend/python/bark/run.sh coqui:/build/backend/python/coqui/run.sh diffusers:/build/backend/python/diffusers/run.sh exllama:/build/backend/python/exllama/run.sh exllama2:/build/backend/python/exllama2/run.sh huggingface-embeddings:/build/backend/python/sentencetransformers/run.sh mamba:/build/backend/python/mamba/run.sh parler-tts:/build/backend/python/parler-tts/run.sh petals:/build/backend/python/petals/run.sh 
rerankers:/build/backend/python/rerankers/run.sh sentencetransformers:/build/backend/python/sentencetransformers/run.sh transformers:/build/backend/python/transformers/run.sh transformers-musicgen:/build/backend/python/transformers-musicgen/run.sh vall-e-x:/build/backend/python/vall-e-x/run.sh vllm:/build/backend/python/vllm/run.sh] grpcAttempts:20 grpcAttemptsDelay:2 singleActiveBackend:false parallelRequests:false} 6:47PM DBG Loading GRPC Process: /tmp/localai/backend_data/backend-assets/grpc/rwkv 6:47PM DBG GRPC Service for will be running at: '127.0.0.1:37343' 6:47PM DBG GRPC Service state dir: /tmp/go-processmanager3492388391 6:47PM DBG GRPC Service Started 6:47PM DBG GRPC(-127.0.0.1:37343): stderr 2024/04/26 18:47:38 gRPC Server listening at 127.0.0.1:37343 6:47PM DBG GRPC Service Ready 6:47PM DBG GRPC: Loading model with options: {state:{NoUnkeyedLiterals:{} DoNotCompare:[] DoNotCopy:[] atomicMessageInfo:} sizeCache:0 unknownFields:[] Model: ContextSize:1024 Seed:318952489 NBatch:512 F16Memory:false MLock:false MMap:true VocabOnly:false LowVRAM:false Embeddings:false NUMA:false NGPULayers:99999999 MainGPU: TensorSplit: Threads:4 LibrarySearchPath:/tmp/localai/backend_data/backend-assets/gpt4all RopeFreqBase:0 RopeFreqScale:0 RMSNormEps:0 NGQA:0 ModelFile:/build/models Device: UseTriton:false ModelBaseName: UseFastTokenizer:false PipelineType: SchedulerType: CUDA:false CFGScale:0 IMG2IMG:false CLIPModel: CLIPSubfolder: CLIPSkip:0 ControlNet: Tokenizer: LoraBase: LoraAdapter: LoraScale:0 NoMulMatQ:false DraftModel: AudioPath: Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0 Type:} 6:47PM DBG GRPC(-127.0.0.1:37343): stderr 6:47PM DBG GRPC(-127.0.0.1:37343): stderr /build/sources/go-rwkv.cpp/rwkv.cpp/rwkv_file_format.inc:92: rwkv_fread_data(file, sizeof(struct rwkv_file_header), &header) 6:47PM DBG 
GRPC(-127.0.0.1:37343): stderr Invalid file header 6:47PM DBG GRPC(-127.0.0.1:37343): stderr /build/sources/go-rwkv.cpp/rwkv.cpp/rwkv_model_loading.inc:158: rwkv_fread_file_header(file.file, model.header) 6:47PM DBG GRPC(-127.0.0.1:37343): stderr 6:47PM DBG GRPC(-127.0.0.1:37343): stderr /build/sources/go-rwkv.cpp/rwkv.cpp/rwkv.cpp:63: rwkv_load_model_from_file(file_path, *ctx->model) 6:47PM DBG GRPC(-127.0.0.1:37343): stderr 2024/04/26 18:47:40 InitFromFile /build/models failed 6:47PM INF [rwkv] Fails: could not load model: rpc error: code = Unavailable desc = error reading from server: EOF 6:47PM INF [whisper] Attempting to load 6:47PM INF Loading model with backend whisper 6:47PM DBG Loading model in memory from file: /build/models 6:47PM DBG Loading Model with gRPC (file: /build/models) (backend: whisper): {backendString:whisper model: threads:4 assetDir:/tmp/localai/backend_data context:{emptyCtx:{}} gRPCOptions:0xc000249800 externalBackends:map[autogptq:/build/backend/python/autogptq/run.sh bark:/build/backend/python/bark/run.sh coqui:/build/backend/python/coqui/run.sh diffusers:/build/backend/python/diffusers/run.sh exllama:/build/backend/python/exllama/run.sh exllama2:/build/backend/python/exllama2/run.sh huggingface-embeddings:/build/backend/python/sentencetransformers/run.sh mamba:/build/backend/python/mamba/run.sh parler-tts:/build/backend/python/parler-tts/run.sh petals:/build/backend/python/petals/run.sh rerankers:/build/backend/python/rerankers/run.sh sentencetransformers:/build/backend/python/sentencetransformers/run.sh transformers:/build/backend/python/transformers/run.sh transformers-musicgen:/build/backend/python/transformers-musicgen/run.sh vall-e-x:/build/backend/python/vall-e-x/run.sh vllm:/build/backend/python/vllm/run.sh] grpcAttempts:20 grpcAttemptsDelay:2 singleActiveBackend:false parallelRequests:false} 6:47PM DBG Loading GRPC Process: /tmp/localai/backend_data/backend-assets/grpc/whisper 6:47PM DBG GRPC Service for will be running at: 
'127.0.0.1:44093' 6:47PM DBG GRPC Service state dir: /tmp/go-processmanager811867827 6:47PM DBG GRPC Service Started 6:47PM DBG GRPC(-127.0.0.1:44093): stderr 2024/04/26 18:47:40 gRPC Server listening at 127.0.0.1:44093 6:47PM DBG GRPC Service Ready 6:47PM DBG GRPC: Loading model with options: {state:{NoUnkeyedLiterals:{} DoNotCompare:[] DoNotCopy:[] atomicMessageInfo:} sizeCache:0 unknownFields:[] Model: ContextSize:1024 Seed:318952489 NBatch:512 F16Memory:false MLock:false MMap:true VocabOnly:false LowVRAM:false Embeddings:false NUMA:false NGPULayers:99999999 MainGPU: TensorSplit: Threads:4 LibrarySearchPath:/tmp/localai/backend_data/backend-assets/gpt4all RopeFreqBase:0 RopeFreqScale:0 RMSNormEps:0 NGQA:0 ModelFile:/build/models Device: UseTriton:false ModelBaseName: UseFastTokenizer:false PipelineType: SchedulerType: CUDA:false CFGScale:0 IMG2IMG:false CLIPModel: CLIPSubfolder: CLIPSkip:0 ControlNet: Tokenizer: LoraBase: LoraAdapter: LoraScale:0 NoMulMatQ:false DraftModel: AudioPath: Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0 Type:} 6:47PM DBG GRPC(-127.0.0.1:44093): stderr whisper_init_from_file_with_params_no_state: loading model from '/build/models' 6:47PM DBG GRPC(-127.0.0.1:44093): stderr whisper_model_load: loading model 6:47PM DBG GRPC(-127.0.0.1:44093): stderr whisper_model_load: invalid model data (bad magic) 6:47PM DBG GRPC(-127.0.0.1:44093): stderr whisper_init_with_params_no_state: failed to load model 6:47PM INF [whisper] Fails: could not load model: rpc error: code = Unknown desc = unable to load model 6:47PM INF [stablediffusion] Attempting to load 6:47PM INF Loading model with backend stablediffusion 6:47PM DBG Loading model in memory from file: /build/models 6:47PM DBG Loading Model with gRPC (file: /build/models) (backend: stablediffusion): {backendString:stablediffusion model: 
threads:4 assetDir:/tmp/localai/backend_data context:{emptyCtx:{}} gRPCOptions:0xc000249800 externalBackends:map[autogptq:/build/backend/python/autogptq/run.sh bark:/build/backend/python/bark/run.sh coqui:/build/backend/python/coqui/run.sh diffusers:/build/backend/python/diffusers/run.sh exllama:/build/backend/python/exllama/run.sh exllama2:/build/backend/python/exllama2/run.sh huggingface-embeddings:/build/backend/python/sentencetransformers/run.sh mamba:/build/backend/python/mamba/run.sh parler-tts:/build/backend/python/parler-tts/run.sh petals:/build/backend/python/petals/run.sh rerankers:/build/backend/python/rerankers/run.sh sentencetransformers:/build/backend/python/sentencetransformers/run.sh transformers:/build/backend/python/transformers/run.sh transformers-musicgen:/build/backend/python/transformers-musicgen/run.sh vall-e-x:/build/backend/python/vall-e-x/run.sh vllm:/build/backend/python/vllm/run.sh] grpcAttempts:20 grpcAttemptsDelay:2 singleActiveBackend:false parallelRequests:false} 6:47PM DBG Loading GRPC Process: /tmp/localai/backend_data/backend-assets/grpc/stablediffusion 6:47PM DBG GRPC Service for will be running at: '127.0.0.1:37735' 6:47PM DBG GRPC Service state dir: /tmp/go-processmanager3733982432 6:47PM DBG GRPC Service Started 6:47PM DBG GRPC(-127.0.0.1:37735): stderr 2024/04/26 18:47:42 gRPC Server listening at 127.0.0.1:37735 6:47PM DBG GRPC Service Ready 6:47PM DBG GRPC: Loading model with options: {state:{NoUnkeyedLiterals:{} DoNotCompare:[] DoNotCopy:[] atomicMessageInfo:} sizeCache:0 unknownFields:[] Model: ContextSize:1024 Seed:318952489 NBatch:512 F16Memory:false MLock:false MMap:true VocabOnly:false LowVRAM:false Embeddings:false NUMA:false NGPULayers:99999999 MainGPU: TensorSplit: Threads:4 LibrarySearchPath:/tmp/localai/backend_data/backend-assets/gpt4all RopeFreqBase:0 RopeFreqScale:0 RMSNormEps:0 NGQA:0 ModelFile:/build/models Device: UseTriton:false ModelBaseName: UseFastTokenizer:false PipelineType: SchedulerType: CUDA:false 
CFGScale:0 IMG2IMG:false CLIPModel: CLIPSubfolder: CLIPSkip:0 ControlNet: Tokenizer: LoraBase: LoraAdapter: LoraScale:0 NoMulMatQ:false DraftModel: AudioPath: Quantization: GPUMemoryUtilization:0 TrustRemoteCode:false EnforceEager:false SwapSpace:0 MaxModelLen:0 TensorParallelSize:0 MMProj: RopeScaling: YarnExtFactor:0 YarnAttnFactor:0 YarnBetaFast:0 YarnBetaSlow:0 Type:} 6:47PM INF [stablediffusion] Loads OK 6:47PM ERR Server error error="rpc error: code = Unknown desc = unimplemented" ip=192.168.96.1 latency=14.087513709s method=POST status=500 url=/embeddings