mirror of
https://github.com/tcsenpai/pensieve.git
synced 2025-06-10 04:57:12 +00:00
feat: update default config for embedding and vlm
This commit is contained in:
parent
9db92908a6
commit
75bb7aeef9
@ -3,10 +3,14 @@ from pathlib import Path
|
|||||||
from pydantic_settings import BaseSettings, SettingsConfigDict
|
from pydantic_settings import BaseSettings, SettingsConfigDict
|
||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
|
|
||||||
|
|
||||||
class VLMSettings(BaseModel):
|
class VLMSettings(BaseModel):
|
||||||
enabled: bool = False
|
enabled: bool = True
|
||||||
modelname: str = "internvl-1.5"
|
modelname: str = "moondream"
|
||||||
endpoint: str = "http://localhost:11434"
|
endpoint: str = "https://localhost:11434"
|
||||||
|
token: str = ""
|
||||||
|
concurrency: int = 4
|
||||||
|
|
||||||
|
|
||||||
class OCRSettings(BaseModel):
|
class OCRSettings(BaseModel):
|
||||||
enabled: bool = True
|
enabled: bool = True
|
||||||
@ -16,9 +20,9 @@ class OCRSettings(BaseModel):
|
|||||||
|
|
||||||
|
|
||||||
class EmbeddingSettings(BaseModel):
|
class EmbeddingSettings(BaseModel):
|
||||||
num_dim: int = 1536
|
num_dim: int = 768
|
||||||
ollama_endpoint: str = "http://host.docker.internal:11434"
|
ollama_endpoint: str = "http://localhost:11434"
|
||||||
ollama_model: str = "arkohut/gte-qwen2-1.5b-instruct:q8_0"
|
ollama_model: str = "jina/jina-embeddings-v2-base-en"
|
||||||
|
|
||||||
|
|
||||||
class Settings(BaseSettings):
|
class Settings(BaseSettings):
|
||||||
@ -34,8 +38,9 @@ class Settings(BaseSettings):
|
|||||||
typesense_port: str = "8108"
|
typesense_port: str = "8108"
|
||||||
typesense_protocol: str = "http"
|
typesense_protocol: str = "http"
|
||||||
typesense_api_key: str = "xyz"
|
typesense_api_key: str = "xyz"
|
||||||
typesense_connection_timeout_seconds: int = 2
|
typesense_connection_timeout_seconds: int = 10
|
||||||
typesense_collection_name: str = "entities"
|
typesense_collection_name: str = "entities"
|
||||||
|
|
||||||
# Server settings
|
# Server settings
|
||||||
server_port: int = 8080
|
server_port: int = 8080
|
||||||
|
|
||||||
|
@ -62,7 +62,7 @@ def get_embeddings(texts: List[str]) -> List[List[float]]:
|
|||||||
for embedding in response.json()["embeddings"]
|
for embedding in response.json()["embeddings"]
|
||||||
]
|
]
|
||||||
else:
|
else:
|
||||||
raise Exception(f"Failed to get embeddings: {response.text}")
|
raise Exception(f"Failed to get embeddings: {response.text} {response.status_code}")
|
||||||
|
|
||||||
|
|
||||||
def generate_metadata_text(metadata_entries):
|
def generate_metadata_text(metadata_entries):
|
||||||
|
Loading…
x
Reference in New Issue
Block a user