docker run --rm -p 8081:80 michaelf34/infinity:latest --model-name-or-path Xenova/bge-large-en-v1.5 --port 80
WARNING 2024-01-11 16:49:24,197 SentenceTransformer.py:805
sentence_transformers.SentenceTransformer
WARNING: No sentence-transformers model
found with name
/app/.cache/torch/Xenova_bge-large-en-v1.5.
Creating a new one with MEAN pooling.
ERROR: Traceback (most recent call last):
File "/app/.venv/lib/python3.10/site-packages/starlette/routing.py", line 677, in lifespan
async with self.lifespan_context(app) as maybe_state:
File "/app/.venv/lib/python3.10/site-packages/starlette/routing.py", line 566, in __aenter__
await self._router.startup()
File "/app/.venv/lib/python3.10/site-packages/starlette/routing.py", line 654, in startup
await handler()
File "/app/infinity_emb/infinity_server.py", line 67, in _startup
app.model = AsyncEmbeddingEngine(
File "/app/infinity_emb/engine.py", line 60, in __init__
self._model, self._min_inference_t = select_model(
File "/app/infinity_emb/inference/select_model.py", line 64, in select_model
loaded_engine = unloaded_engine.value(model_name_or_path, device=device.value)
File "/app/infinity_emb/transformer/embedder/sentence_transformer.py", line 47, in __init__
super().__init__(model_name_or_path, **kwargs)
File "/app/.venv/lib/python3.10/site-packages/sentence_transformers/SentenceTransformer.py", line 97, in __init__
modules = self._load_auto_model(model_path)
File "/app/.venv/lib/python3.10/site-packages/sentence_transformers/SentenceTransformer.py", line 806, in _load_auto_model
transformer_model = Transformer(model_name_or_path)
File "/app/.venv/lib/python3.10/site-packages/sentence_transformers/models/Transformer.py", line 29, in __init__
self._load_model(model_name_or_path, config, cache_dir)
File "/app/.venv/lib/python3.10/site-packages/sentence_transformers/models/Transformer.py", line 49, in _load_model
self.auto_model = AutoModel.from_pretrained(model_name_or_path, config=config, cache_dir=cache_dir)
File "/app/.venv/lib/python3.10/site-packages/transformers/models/auto/auto_factory.py", line 566, in from_pretrained
return model_class.from_pretrained(
File "/app/.venv/lib/python3.10/site-packages/transformers/modeling_utils.py", line 3206, in from_pretrained
raise EnvironmentError(
OSError: Error no file named pytorch_model.bin, tf_model.h5, model.ckpt.index or flax_model.msgpack found in directory /app/.cache/torch/Xenova_bge-large-en-v1.5.