Was soll ich tun, um die Startzeit meines Kafka-Workers und der FastAPI-App zu verkürzen?
Code: Select all
@asynccontextmanager
async def lifespan(app: FastAPI):
    """Application lifespan hook: start a background warm-up, then serve.

    On startup the embeddings model, the LLM client and the vector store are
    initialised in a worker thread so that the application can begin
    accepting requests immediately.  On shutdown a still-pending warm-up wait
    is cancelled and a shutdown message is logged.

    Args:
        app: The FastAPI application this lifespan is attached to (unused
            here, but required by the lifespan signature).

    Yields:
        None. Control returns to the framework while the app is running.
    """
    logger.info("Starting up RecallAI...")
    start = time.time()

    def warmup():
        # The get_* helpers are plain synchronous calls.  Running them inside
        # a coroutine would block the event loop for the whole load, so this
        # function is executed in a worker thread instead.
        try:
            logger.info("Warming up models and vector store...")
            get_embeddings_model()
            get_llm()
            get_vectorstore()
            logger.info(f"Warmup complete in {time.time() - start:.2f} seconds")
        except Exception:
            # Warm-up is best-effort: log the failure instead of leaving an
            # unretrieved task exception; the helpers run again on first use.
            logger.exception("Warmup failed")

    # Keep a reference to the task: the event loop only holds weak references
    # to tasks, so an unreferenced task may be garbage-collected mid-run.
    warmup_task = asyncio.create_task(asyncio.to_thread(warmup))

    yield

    if not warmup_task.done():
        # Cancelling only stops waiting on the thread; the thread itself
        # cannot be interrupted and finishes on its own.
        warmup_task.cancel()
    logger.info("Shutting down RecallAI...")
Code: Select all
@cache
def get_embeddings_model():
    """Return the HuggingFace embeddings model for ``BAAI/bge-small-en-v1.5``.

    The function is wrapped in ``@cache`` (presumably ``functools.cache`` --
    confirm against the file's imports), so the model object is expected to
    be constructed once and reused by later calls.
    """
    embeddings_model = HuggingFaceEmbeddings(model_name="BAAI/bge-small-en-v1.5")
    return embeddings_model
@cache
def get_llm():
    """Return the Groq chat client configured for the ``llama-3-70b`` model.

    The API key is read from the ``GROQ_API_KEY`` environment variable; if
    the variable is unset, ``None`` is passed through to ``ChatGroq``.
    Wrapped in ``@cache`` (presumably ``functools.cache`` -- confirm against
    the file's imports), so repeated calls are expected to share one client.
    """
    api_key = os.getenv("GROQ_API_KEY")
    return ChatGroq(
        groq_api_key=api_key,
        model_name="llama-3-70b",
    )
def get_vectorstore():
    """Load the FAISS index stored under ``img_vector_store``.

    The index is loaded with the embeddings model returned by
    ``get_embeddings_model()``.

    NOTE(review): unlike the sibling ``get_*`` helpers this function carries
    no ``@cache`` decorator, so every call loads the index again and a
    warm-up call that discards the result does not speed up later calls.
    Confirm whether reloading on each call is intentional (e.g. to pick up
    an index rewritten by another process) before memoizing it.
    """
    # NOTE(security): allow_dangerous_deserialization=True permits
    # pickle-based loading; only use it with index files from a trusted
    # source.
    return FAISS.load_local(
        "img_vector_store",
        get_embeddings_model(),
        allow_dangerous_deserialization=True,
    )
< /code>
Hier ist der Kafka-Worker:
from recall_ai.vector_embeddings.store_vector_embedding import store_embeddings
def insert_batch(batch):
try:
res = store_embeddings()
...