Skip to content

Commit 1b7c424

Browse files
committed
Merge branch 'main' into bump-11-2
2 parents b529b1e + e141a40 commit 1b7c424

File tree

16 files changed

+2395
-91
lines changed

16 files changed

+2395
-91
lines changed

.github/workflows/notify-letta-cloud.yml

Lines changed: 0 additions & 19 deletions
This file was deleted.

examples/files/README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -31,4 +31,4 @@ The demo will:
3131
3. Create an agent named "Clippy"
3232
4. Start an interactive chat session
3333

34-
Type 'quit' or 'exit' to end the conversation.
34+
Type 'quit' or 'exit' to end the conversation.

examples/files/main.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -63,7 +63,6 @@
6363
# 1. From an existing file
6464
# 2. From a string by encoding it into a base64 string
6565
#
66-
#
6766

6867
# 1. From an existing file
6968
# "rb" means "read binary"

letta/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
__version__ = version("letta")
66
except PackageNotFoundError:
77
# Fallback for development installations
8-
__version__ = "0.10.0"
8+
__version__ = "0.11.0"
99

1010
if os.environ.get("LETTA_VERSION"):
1111
__version__ = os.environ["LETTA_VERSION"]

letta/constants.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@
1010

1111
ADMIN_PREFIX = "/v1/admin"
1212
API_PREFIX = "/v1"
13+
OLLAMA_API_PREFIX = "/v1"
1314
OPENAI_API_PREFIX = "/openai"
1415

1516
COMPOSIO_ENTITY_ENV_VAR_KEY = "COMPOSIO_ENTITY"
@@ -50,8 +51,9 @@
5051
# Max steps for agent loop
5152
DEFAULT_MAX_STEPS = 50
5253

53-
# minimum context window size
54+
# context window size
5455
MIN_CONTEXT_WINDOW = 4096
56+
DEFAULT_CONTEXT_WINDOW = 32000
5557

5658
# number of concurrent embedding requests to send
5759
EMBEDDING_BATCH_SIZE = 200
@@ -63,6 +65,7 @@
6365
# embeddings
6466
MAX_EMBEDDING_DIM = 4096 # maximum supported embedding size - do NOT change or else DBs will need to be reset
6567
DEFAULT_EMBEDDING_CHUNK_SIZE = 300
68+
DEFAULT_EMBEDDING_DIM = 1024
6669

6770
# tokenizers
6871
EMBEDDING_TO_TOKENIZER_MAP = {

letta/embeddings.py

Lines changed: 6 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -139,10 +139,11 @@ def get_text_embedding(self, text: str):
139139

140140
class OllamaEmbeddings:
141141

142+
# Uses OpenAI API standard
142143
# Format:
143-
# curl http://localhost:11434/api/embeddings -d '{
144+
# curl http://localhost:11434/v1/embeddings -d '{
144145
# "model": "mxbai-embed-large",
145-
# "prompt": "Llamas are members of the camelid family"
146+
# "input": "Llamas are members of the camelid family"
146147
# }'
147148

148149
def __init__(self, model: str, base_url: str, ollama_additional_kwargs: dict):
@@ -154,18 +155,18 @@ def get_text_embedding(self, text: str):
154155
import httpx
155156

156157
headers = {"Content-Type": "application/json"}
157-
json_data = {"model": self.model, "prompt": text}
158+
json_data = {"model": self.model, "input": text}
158159
json_data.update(self.ollama_additional_kwargs)
159160

160161
with httpx.Client() as client:
161162
response = client.post(
162-
f"{self.base_url}/api/embeddings",
163+
f"{self.base_url}/embeddings",
163164
headers=headers,
164165
json=json_data,
165166
)
166167

167168
response_json = response.json()
168-
return response_json["embedding"]
169+
return response_json["data"][0]["embedding"]
169170

170171

171172
class GoogleEmbeddings:

0 commit comments

Comments (0)