diff --git a/lib/chatbot/application.ex b/lib/chatbot/application.ex index 6eaa18e..834fb07 100644 --- a/lib/chatbot/application.ex +++ b/lib/chatbot/application.ex @@ -8,12 +8,6 @@ defmodule Chatbot.Application do @impl true def start(_type, _args) do children = [ - {Nx.Serving, - [ - serving: Chatbot.Rag.Serving.build_llm_serving(), - name: Rag.LLMServing, - batch_timeout: 100 - ]}, {Nx.Serving, [ serving: Chatbot.Rag.Serving.build_embedding_serving(), diff --git a/lib/chatbot/rag.ex b/lib/chatbot/rag.ex index 745516d..3b2602e 100644 --- a/lib/chatbot/rag.ex +++ b/lib/chatbot/rag.ex @@ -5,7 +5,7 @@ defmodule Chatbot.Rag do import Ecto.Query import Pgvector.Ecto.Query - @provider Ai.Nx.new(%{embeddings_serving: Rag.EmbeddingServing, text_serving: Rag.LLMServing}) + @provider Ai.Nx.new(%{embeddings_serving: Rag.EmbeddingServing}) def ingest(path) do path