Created November 13, 2024 15:55
-
-
Save sshaaf/354d87dcaef7c37cb8a2caf9f604bb03 to your computer and use it in GitHub Desktop.
Jlama, Quarkus, and LangChain4j stack traces.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
┌───────────────────> 🐠 | |
│quarkus-drools-llm is 📦 v1.0.0-SNAPSHOT | |
└─> java --enable-preview --enable-native-access=ALL-UNNAMED --add-modules jdk.incubator.vector -jar target/quarkus-app/quarkus-run.jar (base) | |
WARNING: Using incubator modules: jdk.incubator.vector | |
__ ____ __ _____ ___ __ ____ ______ | |
--/ __ \/ / / / _ | / _ \/ //_/ / / / __/ | |
-/ /_/ / /_/ / __ |/ , _/ ,< / /_/ /\ \ | |
--\___\_\____/_/ |_/_/|_/_/|_|\____/___/ | |
2024-11-13 16:43:16,187 INFO [io.quarkus] (main) quarkus-drools-llm 1.0.0-SNAPSHOT on JVM (powered by Quarkus 3.15.1) started in 0.476s. Listening on: http://0.0.0.0:8080 | |
2024-11-13 16:43:16,191 INFO [io.quarkus] (main) Profile prod activated. | |
2024-11-13 16:43:16,191 INFO [io.quarkus] (main) Installed features: [cdi, langchain4j, langchain4j-jlama, qute, rest, rest-jackson, smallrye-context-propagation, vertx] | |
2024-11-13 16:44:11,678 WARN [com.git.tja.jla.ten.ope.uti.JarSupport] (executor-thread-1) jlama-native shared library not found | |
2024-11-13 16:44:11,680 WARN [com.git.tja.jla.ten.ope.TensorOperationsProvider] (executor-thread-1) Native operations not available. Consider adding 'com.github.tjake:jlama-native' to the classpath | |
2024-11-13 16:44:11,691 INFO [com.git.tja.jla.ten.ope.TensorOperationsProvider] (executor-thread-1) Using Panama Vector Operations (OffHeap) | |
2024-11-13 16:44:11,698 INFO [com.git.tja.jla.mod.AbstractModel] (executor-thread-1) Model type = Q4, Working memory type = F32, Quantized memory type = I8 | |
2024-11-13 16:45:40,422 ERROR [io.qua.ver.htt.run.QuarkusErrorHandler] (executor-thread-1) HTTP Request to /hybridai/password failed, error id: 2c753feb-9c82-478d-89c5-96f08e5b6cf8-1: java.lang.ArrayIndexOutOfBoundsException: Index 65536 out of bounds for length 65536 | |
at com.github.tjake.jlama.model.CausalSelfAttention.lambda$forward$6(CausalSelfAttention.java:260) | |
at java.base/java.util.Optional.ifPresent(Optional.java:178) | |
at com.github.tjake.jlama.model.CausalSelfAttention.forward(CausalSelfAttention.java:242) | |
at com.github.tjake.jlama.model.TransformerBlock.forward(TransformerBlock.java:173) | |
at com.github.tjake.jlama.model.AbstractModel.forward(AbstractModel.java:299) | |
at com.github.tjake.jlama.model.AbstractModel.forward(AbstractModel.java:262) | |
at com.github.tjake.jlama.model.AbstractModel.forward(AbstractModel.java:238) | |
at com.github.tjake.jlama.model.AbstractModel.generate(AbstractModel.java:566) | |
at io.quarkiverse.langchain4j.jlama.JlamaChatModel.generate(JlamaChatModel.java:98) | |
at io.quarkiverse.langchain4j.jlama.JlamaChatModel.generate(JlamaChatModel.java:84) | |
at dev.langchain4j.model.chat.ChatLanguageModel__PxWa8wCyNr7CdT_Jb6ikK30HAo_Synthetic_ClientProxy.generate(Unknown Source) | |
at io.quarkiverse.langchain4j.runtime.aiservice.AiServiceMethodImplementationSupport.doImplement(AiServiceMethodImplementationSupport.java:320) | |
at io.quarkiverse.langchain4j.runtime.aiservice.AiServiceMethodImplementationSupport.implement(AiServiceMethodImplementationSupport.java:129) | |
at org.hybridai.password.PasswordGenerator$$QuarkusImpl.generatePassword(Unknown Source) | |
at org.hybridai.password.PasswordEndpoint.password(PasswordEndpoint.java:29) | |
at org.hybridai.password.PasswordEndpoint$quarkusrestinvoker$password_5b3ee46f2a27aa9a0f9cd9904c089c2b5ff850f4.invoke(Unknown Source) | |
at org.jboss.resteasy.reactive.server.handlers.InvocationHandler.handle(InvocationHandler.java:29) | |
at io.quarkus.resteasy.reactive.server.runtime.QuarkusResteasyReactiveRequestContext.invokeHandler(QuarkusResteasyReactiveRequestContext.java:141) | |
at org.jboss.resteasy.reactive.common.core.AbstractResteasyReactiveContext.run(AbstractResteasyReactiveContext.java:147) | |
at io.quarkus.vertx.core.runtime.VertxCoreRecorder$14.runWith(VertxCoreRecorder.java:635) | |
at org.jboss.threads.EnhancedQueueExecutor$Task.doRunWith(EnhancedQueueExecutor.java:2516) | |
at org.jboss.threads.EnhancedQueueExecutor$Task.run(EnhancedQueueExecutor.java:2495) | |
at org.jboss.threads.EnhancedQueueExecutor$ThreadBody.run(EnhancedQueueExecutor.java:1521) | |
at org.jboss.threads.DelegatingRunnable.run(DelegatingRunnable.java:11) | |
at org.jboss.threads.ThreadLocalResettingRunnable.run(ThreadLocalResettingRunnable.java:11) | |
at io.netty.util.concurrent.FastThreadLocalRunnable.run(FastThreadLocalRunnable.java:30) | |
at java.base/java.lang.Thread.run(Thread.java:1583) | |
2024-11-13 16:50:01,204 INFO [org.hyb.ref.RefundChatbotEndpoint] (executor-thread-1) message = something | |
2024-11-13 16:50:01,205 INFO [org.hyb.ref.RefundChatbotEndpoint] (executor-thread-1) sessionId = ctf1yhv8qn4 | |
2024-11-13 16:50:01,205 INFO [org.hyb.ref.RefundChatbotEndpoint] (executor-thread-1) sessionData = SessionData{customer=null, flight=null} | |
2024-11-13 16:50:01,207 INFO [org.hyb.ref.StateManager] (executor-thread-1) Extracting customer from something | |
2024-11-13 16:50:01,520 INFO [com.git.tja.jla.mod.AbstractModel] (executor-thread-1) Model type = Q4, Working memory type = F32, Quantized memory type = I8 | |
2024-11-13 16:50:01,524 INFO [io.qua.lan.jla.JlamaChatModel] (executor-thread-1) Request: [UserMessage { name = null contents = [TextContent { text = "Extract information about a customer from this text 'something. '. The response must contain only the JSON with customer's data and without any other sentence. | |
You must answer strictly in the following JSON format: { | |
"firstName": (type: string), | |
"lastName": (type: string), | |
"age": (type: integer) | |
}" }] }] | |
2024-11-13 16:50:24,065 INFO [io.qua.lan.jla.JlamaChatModel] (executor-thread-1) Request: [SystemMessage { text = "You are a chat bot of an airline company. Your goal is asking questions to gather information | |
about a customer | |
" }, UserMessage { name = null contents = [TextContent { text = "Ask question to the customer regarding his name and age, also replying to his message 'something' | |
" }] }] | |
2024-11-13 16:50:38,984 ERROR [io.qua.ver.htt.run.QuarkusErrorHandler] (executor-thread-1) HTTP Request to /hybridai/chatbot/ctf1yhv8qn4/refund failed, error id: 2c753feb-9c82-478d-89c5-96f08e5b6cf8-2: java.lang.UnsupportedOperationException: java.lang.UnsupportedOperationException: ARM_128 | |
at java.base/jdk.internal.reflect.DirectConstructorHandleAccessor.newInstance(DirectConstructorHandleAccessor.java:62) | |
at java.base/java.lang.reflect.Constructor.newInstanceWithCaller(Constructor.java:502) | |
at java.base/java.lang.reflect.Constructor.newInstance(Constructor.java:486) | |
at java.base/java.util.concurrent.ForkJoinTask.getThrowableException(ForkJoinTask.java:540) | |
at java.base/java.util.concurrent.ForkJoinTask.reportException(ForkJoinTask.java:567) | |
at java.base/java.util.concurrent.ForkJoinTask.join(ForkJoinTask.java:653) | |
at com.github.tjake.jlama.util.PhysicalCoreExecutor.execute(PhysicalCoreExecutor.java:55) | |
at com.github.tjake.jlama.math.VectorMath.pchunk(VectorMath.java:56) | |
at com.github.tjake.jlama.model.AbstractModel.sample(AbstractModel.java:421) | |
at com.github.tjake.jlama.model.AbstractModel.generate(AbstractModel.java:549) | |
at io.quarkiverse.langchain4j.jlama.JlamaChatModel.generate(JlamaChatModel.java:98) | |
at io.quarkiverse.langchain4j.jlama.JlamaChatModel.generate(JlamaChatModel.java:84) | |
at dev.langchain4j.model.chat.ChatLanguageModel_XNMsOaekknG7BdNZ5YSUkjh1SqE_Synthetic_ClientProxy.generate(Unknown Source) | |
at io.quarkiverse.langchain4j.runtime.aiservice.AiServiceMethodImplementationSupport.doImplement(AiServiceMethodImplementationSupport.java:320) | |
at io.quarkiverse.langchain4j.runtime.aiservice.AiServiceMethodImplementationSupport.implement(AiServiceMethodImplementationSupport.java:129) | |
at org.hybridai.refund.aiservices.CustomerChatService$$QuarkusImpl.chat(Unknown Source) | |
at org.hybridai.refund.StateManager$ChatbotState.chat(StateManager.java:92) | |
at org.hybridai.refund.RefundChatbotEndpoint.chat(RefundChatbotEndpoint.java:48) | |
at org.hybridai.refund.RefundChatbotEndpoint$quarkusrestinvoker$chat_72574ea1f50311db5f7c11ce82a1a35240b9b431.invoke(Unknown Source) | |
at org.jboss.resteasy.reactive.server.handlers.InvocationHandler.handle(InvocationHandler.java:29) | |
at io.quarkus.resteasy.reactive.server.runtime.QuarkusResteasyReactiveRequestContext.invokeHandler(QuarkusResteasyReactiveRequestContext.java:141) | |
at org.jboss.resteasy.reactive.common.core.AbstractResteasyReactiveContext.run(AbstractResteasyReactiveContext.java:147) | |
at io.quarkus.vertx.core.runtime.VertxCoreRecorder$14.runWith(VertxCoreRecorder.java:635) | |
at org.jboss.threads.EnhancedQueueExecutor$Task.doRunWith(EnhancedQueueExecutor.java:2516) | |
at org.jboss.threads.EnhancedQueueExecutor$Task.run(EnhancedQueueExecutor.java:2495) | |
at org.jboss.threads.EnhancedQueueExecutor$ThreadBody.run(EnhancedQueueExecutor.java:1521) | |
at org.jboss.threads.DelegatingRunnable.run(DelegatingRunnable.java:11) | |
at org.jboss.threads.ThreadLocalResettingRunnable.run(ThreadLocalResettingRunnable.java:11) | |
at io.netty.util.concurrent.FastThreadLocalRunnable.run(FastThreadLocalRunnable.java:30) | |
at java.base/java.lang.Thread.run(Thread.java:1583) | |
Caused by: java.lang.UnsupportedOperationException: ARM_128 | |
at com.github.tjake.jlama.tensor.operations.PanamaTensorOperations.batchDotProduct(PanamaTensorOperations.java:125) | |
at com.github.tjake.jlama.tensor.operations.TensorOperations.dotProductChunk(TensorOperations.java:76) | |
at com.github.tjake.jlama.model.AbstractModel.lambda$sample$4(AbstractModel.java:423) | |
at com.github.tjake.jlama.math.VectorMath.lambda$pchunk$1(VectorMath.java:60) | |
at java.base/java.util.stream.ForEachOps$ForEachOp$OfInt.accept(ForEachOps.java:205) | |
at java.base/java.util.stream.Streams$RangeIntSpliterator.forEachRemaining(Streams.java:104) | |
at java.base/java.util.Spliterator$OfInt.forEachRemaining(Spliterator.java:712) | |
at java.base/java.util.stream.AbstractPipeline.copyInto(AbstractPipeline.java:509) | |
at java.base/java.util.stream.ForEachOps$ForEachTask.compute(ForEachOps.java:291) | |
at java.base/java.util.concurrent.CountedCompleter.exec(CountedCompleter.java:754) | |
at java.base/java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:387) | |
at java.base/java.util.concurrent.ForkJoinTask.invoke(ForkJoinTask.java:667) | |
at java.base/java.util.stream.ForEachOps$ForEachOp.evaluateParallel(ForEachOps.java:160) | |
at java.base/java.util.stream.ForEachOps$ForEachOp$OfInt.evaluateParallel(ForEachOps.java:189) | |
at java.base/java.util.stream.AbstractPipeline.evaluate(AbstractPipeline.java:233) | |
at java.base/java.util.stream.IntPipeline.forEach(IntPipeline.java:463) | |
at java.base/java.util.stream.IntPipeline$Head.forEach(IntPipeline.java:620) | |
at com.github.tjake.jlama.math.VectorMath.lambda$pchunk$2(VectorMath.java:59) | |
at java.base/java.util.concurrent.ForkJoinTask$AdaptedRunnableAction.exec(ForkJoinTask.java:1403) | |
at java.base/java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:387) | |
at java.base/java.util.concurrent.ForkJoinPool$WorkQueue.topLevelExec(ForkJoinPool.java:1312) | |
at java.base/java.util.concurrent.ForkJoinPool.scan(ForkJoinPool.java:1843) | |
at java.base/java.util.concurrent.ForkJoinPool.runWorker(ForkJoinPool.java:1808) | |
at java.base/java.util.concurrent.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:188) |
Sign up for free to join this conversation on GitHub.
Already have an account? Sign in to comment.