Release 0.7.3 (#1357 )

Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: himself65 <himself65@users.noreply.github.com>
fix(core): inline python-format-js (#1356 )
2026-07-01 22:14:03 -04:00 · 2024-10-20 20:15:51 -07:00 · 2024-10-20 20:07:48 -07:00 · 2024-10-20 19:22:59 -07:00 · 2024-10-20 17:11:09 -07:00 · 2024-10-20 15:29:19 -07:00
182 changed files with 7607 additions and 5988 deletions
@@ -25,4 +25,4 @@ jobs:
        run: pnpm run build

      - name: Pre Release
-        run: pnpx pkg-pr-new publish ./packages/*
+        run: pnpx pkg-pr-new publish ./packages/* ./packages/providers/*
@@ -136,27 +136,26 @@ jobs:
        run: pnpm run build
      - name: Copy examples
        run: rsync -rv --exclude=node_modules ./examples ${{ runner.temp }}
-      - name: Pack @llamaindex/cloud
-        run: pnpm pack --pack-destination ${{ runner.temp }}
-        working-directory: packages/cloud
-      - name: Pack @llamaindex/openai
-        run: pnpm pack --pack-destination ${{ runner.temp }}
-        working-directory: packages/llm/openai
-      - name: Pack @llamaindex/groq
-        run: pnpm pack --pack-destination ${{ runner.temp }}
-        working-directory: packages/llm/groq
-      - name: Pack @llamaindex/ollama
-        run: pnpm pack --pack-destination ${{ runner.temp }}
-        working-directory: packages/llm/ollama
-      - name: Pack @llamaindex/core
-        run: pnpm pack --pack-destination ${{ runner.temp }}
-        working-directory: packages/core
-      - name: Pack @llamaindex/env
-        run: pnpm pack --pack-destination ${{ runner.temp }}
-        working-directory: packages/env
-      - name: Pack llamaindex
-        run: pnpm pack --pack-destination ${{ runner.temp }}
-        working-directory: packages/llamaindex
+      - name: Pack packages
+        run: |
+          for dir in packages/*; do
+            if [ -d "$dir" ] && [ -f "$dir/package.json" ] && [[ ! "$dir" =~ autotool ]]; then
+              echo "Packing $dir"
+              pnpm pack --pack-destination ${{ runner.temp }} -C $dir
+            else
+              echo "Skipping $dir, no package.json found"
+            fi
+          done
+      - name: Pack provider packages
+        run: |
+          for dir in packages/providers/*; do
+            if [ -d "$dir" ] && [ -f "$dir/package.json" ]; then
+              echo "Packing $dir"
+              pnpm pack --pack-destination ${{ runner.temp }} -C $dir
+            else
+              echo "Skipping $dir, no package.json found"
+            fi
+          done
      - name: Install
        run: npm add ${{ runner.temp }}/*.tgz
        working-directory: ${{ runner.temp }}/examples
@@ -1,5 +1,59 @@
 # docs

+## 0.0.95
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 0.0.94
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 0.0.93
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 0.0.92
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+  - @llamaindex/examples@0.0.9
+
+## 0.0.91
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 0.0.90
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 0.0.89
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 0.0.88

 ### Patch Changes
@@ -1,6 +1,6 @@
 {
  "name": "docs",
-  "version": "0.0.88",
+  "version": "0.0.95",
  "private": true,
  "scripts": {
    "docusaurus": "docusaurus",
@@ -1,5 +1,16 @@
 # examples

+## 0.0.9
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [96fc69c]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+  - @llamaindex/core@0.3.0
+
 ## 0.0.8

 ### Patch Changes
@@ -1,6 +1,7 @@
 import {
  AstraDBVectorStore,
  Document,
+  MetadataFilters,
  storageContextFromDefaults,
  VectorStoreIndex,
 } from "llamaindex";
@@ -42,8 +43,10 @@ async function main() {
    const index = await VectorStoreIndex.fromDocuments(docs, {
      storageContext: ctx,
    });
-
-    const queryEngine = index.asQueryEngine();
+    const preFilters: MetadataFilters = {
+      filters: [{ key: "id", operator: "in", value: [123, 789] }],
+    }; // try changing the filters to see the different results
+    const queryEngine = index.asQueryEngine({ preFilters });
    const response = await queryEngine.query({
      query: "Describe AstraDB.",
    });
@@ -1,57 +1,83 @@
 import {
  ChromaVectorStore,
  Document,
+  MetadataFilters,
  VectorStoreIndex,
  storageContextFromDefaults,
 } from "llamaindex";

-const collectionName = "dog_colors";
+const collectionName = "dogs_with_color";

 async function main() {
  try {
-    const docs = [
-      new Document({
-        text: "The dog is brown",
-        metadata: {
-          dogId: "1",
-        },
-      }),
-      new Document({
-        text: "The dog is red",
-        metadata: {
-          dogId: "2",
-        },
-      }),
-    ];
-
-    console.log("Creating ChromaDB vector store");
    const chromaVS = new ChromaVectorStore({ collectionName });
-    const ctx = await storageContextFromDefaults({ vectorStore: chromaVS });
+    const index = await VectorStoreIndex.fromVectorStore(chromaVS);

-    console.log("Embedding documents and adding to index");
-    const index = await VectorStoreIndex.fromDocuments(docs, {
-      storageContext: ctx,
-    });
+    const queryFn = async (filters?: MetadataFilters) => {
+      console.log("\nQuerying dogs by filters: ", JSON.stringify(filters));
+      const query = "List all colors of dogs";
+      const queryEngine = index.asQueryEngine({
+        preFilters: filters,
+        similarityTopK: 3,
+      });
+      const response = await queryEngine.query({ query });
+      console.log(response.toString());
+    };

-    console.log("Querying index");
-    const queryEngine = index.asQueryEngine({
-      preFilters: {
-        filters: [
-          {
-            key: "dogId",
-            value: "2",
-            operator: "==",
-          },
-        ],
-      },
-    });
-    const response = await queryEngine.query({
-      query: "What is the color of the dog?",
-    });
-    console.log(response.toString());
+    await queryFn(); // red, brown, yellow
+    await queryFn({ filters: [{ key: "dogId", value: "1", operator: "==" }] }); // brown
+    await queryFn({ filters: [{ key: "dogId", value: "1", operator: "!=" }] }); // red, yellow
+    await queryFn({
+      filters: [
+        { key: "dogId", value: "1", operator: "==" },
+        { key: "dogId", value: "3", operator: "==" },
+      ],
+      condition: "or",
+    }); // brown, yellow
+    await queryFn({
+      filters: [{ key: "dogId", value: ["1", "2"], operator: "in" }],
+    }); // red, brown
  } catch (e) {
    console.error(e);
  }
 }

-void main();
+async function generate() {
+  const docs = [
+    new Document({
+      id_: "doc1",
+      text: "The dog is brown",
+      metadata: {
+        dogId: "1",
+      },
+    }),
+    new Document({
+      id_: "doc2",
+      text: "The dog is red",
+      metadata: {
+        dogId: "2",
+      },
+    }),
+    new Document({
+      id_: "doc3",
+      text: "The dog is yellow",
+      metadata: {
+        dogId: "3",
+      },
+    }),
+  ];
+
+  console.log("Creating ChromaDB vector store");
+  const chromaVS = new ChromaVectorStore({ collectionName });
+  const ctx = await storageContextFromDefaults({ vectorStore: chromaVS });
+
+  console.log("Embedding documents and adding to index");
+  await VectorStoreIndex.fromDocuments(docs, {
+    storageContext: ctx,
+  });
+}
+
+(async () => {
+  await generate();
+  await main();
+})();
@@ -1,12 +1,12 @@
 {
  "name": "@llamaindex/examples",
  "private": true,
-  "version": "0.0.8",
+  "version": "0.0.9",
  "dependencies": {
    "@aws-crypto/sha256-js": "^5.2.0",
    "@azure/identity": "^4.4.1",
    "@datastax/astra-db-ts": "^1.4.1",
-    "@llamaindex/core": "^0.2.0",
+    "@llamaindex/core": "^0.3.0",
    "@notionhq/client": "^2.2.15",
    "@pinecone-database/pinecone": "^3.0.2",
    "@vercel/postgres": "^0.10.0",
@@ -15,7 +15,7 @@
    "commander": "^12.1.0",
    "dotenv": "^16.4.5",
    "js-tiktoken": "^1.0.14",
-    "llamaindex": "^0.6.0",
+    "llamaindex": "^0.7.0",
    "mongodb": "^6.7.0",
    "pathe": "^1.1.2",
    "postgres": "^3.4.4"
@@ -1,4 +1,5 @@
 import {
+  BaseVectorStore,
  getResponseSynthesizer,
  OpenAI,
  OpenAIEmbedding,
@@ -6,7 +7,6 @@ import {
  Settings,
  TextNode,
  VectorIndexRetriever,
-  VectorStore,
  VectorStoreIndex,
  VectorStoreQuery,
  VectorStoreQueryResult,
@@ -24,7 +24,7 @@ Settings.llm = new OpenAI({
 * Please do not use this class in production; it's only for demonstration purposes.
 */
 class PineconeVectorStore<T extends RecordMetadata = RecordMetadata>
-  implements VectorStore
+  implements BaseVectorStore
 {
  storesText = true;
  isEmbeddingQuery = false;
@@ -39,9 +39,6 @@
    "overrides": {
      "trim": "1.0.1",
      "protobufjs": "7.2.6"
-    },
-    "patchedDependencies": {
-      "python-format-js@1.4.3": "patches/python-format-js@1.4.3.patch"
    }
  },
  "lint-staged": {
@@ -1,5 +1,59 @@
 # @llamaindex/autotool

+## 4.0.3
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 4.0.2
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 4.0.1
+
+### Patch Changes
+
+- a75af83: refactor: move some llm and embedding to single package
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 4.0.0
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+
+## 3.0.22
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 3.0.21
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 3.0.20
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 3.0.19

 ### Patch Changes
@@ -1,5 +1,65 @@
 # @llamaindex/autotool-01-node-example

+## 0.0.35
+
+### Patch Changes
+
+- llamaindex@0.7.3
+- @llamaindex/autotool@4.0.3
+
+## 0.0.34
+
+### Patch Changes
+
+- llamaindex@0.7.2
+- @llamaindex/autotool@4.0.2
+
+## 0.0.33
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+  - @llamaindex/autotool@4.0.1
+
+## 0.0.32
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+  - @llamaindex/autotool@4.0.0
+
+## 0.0.31
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+  - @llamaindex/autotool@3.0.22
+
+## 0.0.30
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+  - @llamaindex/autotool@3.0.21
+
+## 0.0.29
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+  - @llamaindex/autotool@3.0.20
+
 ## 0.0.28

 ### Patch Changes
@@ -13,5 +13,5 @@
  "scripts": {
    "start": "node --import tsx --import @llamaindex/autotool/node ./src/index.ts"
  },
-  "version": "0.0.28"
+  "version": "0.0.35"
 }
@@ -1,5 +1,65 @@
 # @llamaindex/autotool-02-next-example

+## 0.1.79
+
+### Patch Changes
+
+- llamaindex@0.7.3
+- @llamaindex/autotool@4.0.3
+
+## 0.1.78
+
+### Patch Changes
+
+- llamaindex@0.7.2
+- @llamaindex/autotool@4.0.2
+
+## 0.1.77
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+  - @llamaindex/autotool@4.0.1
+
+## 0.1.76
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+  - @llamaindex/autotool@4.0.0
+
+## 0.1.75
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+  - @llamaindex/autotool@3.0.22
+
+## 0.1.74
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+  - @llamaindex/autotool@3.0.21
+
+## 0.1.73
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+  - @llamaindex/autotool@3.0.20
+
 ## 0.1.72

 ### Patch Changes
@@ -1,7 +1,7 @@
 {
  "name": "@llamaindex/autotool-02-next-example",
  "private": true,
-  "version": "0.1.72",
+  "version": "0.1.79",
  "scripts": {
    "dev": "next dev",
    "build": "next build",
@@ -1,7 +1,7 @@
 {
  "name": "@llamaindex/autotool",
  "type": "module",
-  "version": "3.0.19",
+  "version": "4.0.3",
  "description": "auto transpile your JS function to LLM Agent compatible",
  "files": [
    "dist",
@@ -70,7 +70,7 @@
    "@swc/types": "^0.1.12",
    "@types/json-schema": "^7.0.15",
    "@types/node": "^22.5.1",
-    "bunchee": "5.3.2",
+    "bunchee": "5.5.1",
    "llamaindex": "workspace:*",
    "next": "14.2.11",
    "rollup": "^4.21.2",
@@ -1,5 +1,40 @@
 # @llamaindex/cloud

+## 1.0.3
+
+### Patch Changes
+
+- Updated dependencies [0493f67]
+  - @llamaindex/core@0.3.3
+
+## 1.0.2
+
+### Patch Changes
+
+- Updated dependencies [4ba2cfe]
+  - @llamaindex/env@0.1.15
+  - @llamaindex/core@0.3.2
+
+## 1.0.1
+
+### Patch Changes
+
+- 4c38c1b: fix(cloud): do not detect file type in llama parse
+- 24d065f: Log Parse Job Errors when verbose is enabled
+- a75af83: refactor: move some llm and embedding to single package
+- Updated dependencies [ae49ff4]
+- Updated dependencies [a75af83]
+  - @llamaindex/env@0.1.14
+  - @llamaindex/core@0.3.1
+
+## 1.0.0
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [96fc69c]
+  - @llamaindex/core@0.3.0
+
 ## 0.2.14

 ### Patch Changes
@@ -1,6 +1,6 @@
 {
  "name": "@llamaindex/cloud",
-  "version": "0.2.14",
+  "version": "1.0.3",
  "type": "module",
  "license": "MIT",
  "scripts": {
@@ -53,13 +53,10 @@
    "@hey-api/openapi-ts": "^0.53.0",
    "@llamaindex/core": "workspace:*",
    "@llamaindex/env": "workspace:*",
-    "bunchee": "5.3.2"
+    "bunchee": "5.5.1"
  },
  "peerDependencies": {
    "@llamaindex/core": "workspace:*",
    "@llamaindex/env": "workspace:*"
-  },
-  "dependencies": {
-    "magic-bytes.js": "^1.10.0"
  }
 }
@@ -1,7 +1,6 @@
 import { type Client, createClient, createConfig } from "@hey-api/client-fetch";
 import { Document, FileReader } from "@llamaindex/core/schema";
 import { fs, getEnv, path } from "@llamaindex/env";
-import { filetypeinfo } from "magic-bytes.js";
 import {
  type Body_upload_file_api_v1_parsing_upload_post,
  type ParserLanguages,
@@ -13,99 +12,6 @@ export type Language = ParserLanguages;

 export type ResultType = "text" | "markdown" | "json";

-const SUPPORT_FILE_EXT: string[] = [
-  ".pdf",
-  // document and presentations
-  ".602",
-  ".abw",
-  ".cgm",
-  ".cwk",
-  ".doc",
-  ".docx",
-  ".docm",
-  ".dot",
-  ".dotm",
-  ".hwp",
-  ".key",
-  ".lwp",
-  ".mw",
-  ".mcw",
-  ".pages",
-  ".pbd",
-  ".ppt",
-  ".pptm",
-  ".pptx",
-  ".pot",
-  ".potm",
-  ".potx",
-  ".rtf",
-  ".sda",
-  ".sdd",
-  ".sdp",
-  ".sdw",
-  ".sgl",
-  ".sti",
-  ".sxi",
-  ".sxw",
-  ".stw",
-  ".sxg",
-  ".txt",
-  ".uof",
-  ".uop",
-  ".uot",
-  ".vor",
-  ".wpd",
-  ".wps",
-  ".xml",
-  ".zabw",
-  ".epub",
-  // images
-  ".jpg",
-  ".jpeg",
-  ".png",
-  ".gif",
-  ".bmp",
-  ".svg",
-  ".tiff",
-  ".webp",
-  // web
-  ".htm",
-  ".html",
-  // spreadsheets
-  ".xlsx",
-  ".xls",
-  ".xlsm",
-  ".xlsb",
-  ".xlw",
-  ".csv",
-  ".dif",
-  ".sylk",
-  ".slk",
-  ".prn",
-  ".numbers",
-  ".et",
-  ".ods",
-  ".fods",
-  ".uos1",
-  ".uos2",
-  ".dbf",
-  ".wk1",
-  ".wk2",
-  ".wk3",
-  ".wk4",
-  ".wks",
-  ".123",
-  ".wq1",
-  ".wq2",
-  ".wb1",
-  ".wb2",
-  ".wb3",
-  ".qpw",
-  ".xlr",
-  ".eth",
-  ".tsv",
-];
-
 //todo: should move into @llamaindex/env
 type WriteStream = {
  write: (text: string) => void;
@@ -239,17 +145,12 @@ export class LlamaParseReader extends FileReader {

  // Create a job for the LlamaParse API
  private async createJob(data: Uint8Array): Promise<string> {
-    // Load data, set the mime type
-    const { mime } = await LlamaParseReader.getMimeType(data);
-
    if (this.verbose) {
      console.log("Started uploading the file");
    }

    const body = {
-      file: new Blob([data], {
-        type: mime,
-      }),
+      file: new Blob([data]),
      language: this.language,
      parsing_instruction: this.parsingInstruction,
      skip_diagonal_text: this.skipDiagonalText,
@@ -368,6 +269,11 @@ export class LlamaParseReader extends FileReader {
        }
        tries++;
      } else {
+        if (this.verbose) {
+          console.error(
+            `Recieved Error response ${status} for job ${jobId}.  Got Error Code: ${data.error_code} and Error Message: ${data.error_message}`,
+          );
+        }
        throw new Error(
          `Failed to parse the file: ${jobId}, status: ${status}`,
        );
@@ -564,24 +470,4 @@ export class LlamaParseReader extends FileReader {
        }),
    );
  }
-
-  static async getMimeType(
-    data: Uint8Array,
-  ): Promise<{ mime: string; extension: string }> {
-    const typeinfos = filetypeinfo(data);
-    // find the first type info that matches the supported MIME types
-    // It could be happened that docx file is recognized as zip file, so we need to check the mime type
-    const info = typeinfos.find((info) => {
-      if (info.extension && SUPPORT_FILE_EXT.includes(`.${info.extension}`)) {
-        return info;
-      }
-    });
-    if (!info || !info.mime || !info.extension) {
-      const ext = SUPPORT_FILE_EXT.join(", ");
-      throw new Error(
-        `File has type which does not match supported MIME Types. Supported formats include: ${ext}`,
-      );
-    }
-    return { mime: info.mime, extension: info.extension };
-  }
 }
@@ -1,5 +1,38 @@
 # @llamaindex/community

+## 0.0.51
+
+### Patch Changes
+
+- Updated dependencies [0493f67]
+  - @llamaindex/core@0.3.3
+
+## 0.0.50
+
+### Patch Changes
+
+- Updated dependencies [4ba2cfe]
+  - @llamaindex/env@0.1.15
+  - @llamaindex/core@0.3.2
+
+## 0.0.49
+
+### Patch Changes
+
+- a75af83: refactor: move some llm and embedding to single package
+- Updated dependencies [ae49ff4]
+- Updated dependencies [a75af83]
+  - @llamaindex/env@0.1.14
+  - @llamaindex/core@0.3.1
+
+## 0.0.48
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [96fc69c]
+  - @llamaindex/core@0.3.0
+
 ## 0.0.47

 ### Patch Changes
@@ -1,7 +1,7 @@
 {
  "name": "@llamaindex/community",
  "description": "Community package for LlamaIndexTS",
-  "version": "0.0.47",
+  "version": "0.0.51",
  "type": "module",
  "types": "dist/type/index.d.ts",
  "main": "dist/cjs/index.js",
@@ -43,11 +43,11 @@
  },
  "devDependencies": {
    "@types/node": "^22.5.1",
-    "bunchee": "5.3.2"
+    "bunchee": "5.5.1"
  },
  "dependencies": {
-    "@aws-sdk/client-bedrock-runtime": "^3.642.0",
    "@aws-sdk/client-bedrock-agent-runtime": "^3.642.0",
+    "@aws-sdk/client-bedrock-runtime": "^3.642.0",
    "@llamaindex/core": "workspace:*",
    "@llamaindex/env": "workspace:*"
  }
@@ -1,5 +1,34 @@
 # @llamaindex/core

+## 0.3.3
+
+### Patch Changes
+
+- 0493f67: fix(core): inline `python-format-js`
+
+## 0.3.2
+
+### Patch Changes
+
+- Updated dependencies [4ba2cfe]
+  - @llamaindex/env@0.1.15
+
+## 0.3.1
+
+### Patch Changes
+
+- a75af83: refactor: move some llm and embedding to single package
+- Updated dependencies [ae49ff4]
+- Updated dependencies [a75af83]
+  - @llamaindex/env@0.1.14
+
+## 0.3.0
+
+### Minor Changes
+
+- 1364e8e: update metadata extractors to use PromptTemplate
+- 96fc69c: add defaultQuestionExtractPrompt
+
 ## 0.2.12

 ### Patch Changes
@@ -0,0 +1,8 @@
+{
+  "type": "module",
+  "main": "./dist/index.cjs",
+  "module": "./dist/index.js",
+  "types": "./dist/index.d.ts",
+  "exports": "./dist/index.js",
+  "private": true
+}
@@ -1,7 +1,7 @@
 {
  "name": "@llamaindex/core",
  "type": "module",
-  "version": "0.2.12",
+  "version": "0.3.3",
  "description": "LlamaIndex Core Module",
  "exports": {
    "./agent": {
@@ -258,16 +258,44 @@
    },
    "./vector-store": {
      "require": {
-        "types": "./dist/vector-store/index.d.cts",
-        "default": "./dist/vector-store/index.cjs"
+        "types": "./vector-store/dist/index.d.cts",
+        "default": "./vector-store/dist/index.cjs"
      },
      "import": {
-        "types": "./dist/vector-store/index.d.ts",
-        "default": "./dist/vector-store/index.js"
+        "types": "./vector-store/dist/index.d.ts",
+        "default": "./vector-store/dist/index.js"
      },
      "default": {
-        "types": "./dist/vector-store/index.d.ts",
-        "default": "./dist/vector-store/index.js"
+        "types": "./vector-store/dist/index.d.ts",
+        "default": "./vector-store/dist/index.js"
+      }
+    },
+    "./tools": {
+      "require": {
+        "types": "./tools/dist/index.d.cts",
+        "default": "./tools/dist/index.cjs"
+      },
+      "import": {
+        "types": "./tools/dist/index.d.ts",
+        "default": "./tools/dist/index.js"
+      },
+      "default": {
+        "types": "./tools/dist/index.d.ts",
+        "default": "./tools/dist/index.js"
+      }
+    },
+    "./data-structs": {
+      "require": {
+        "types": "./data-structs/dist/index.d.cts",
+        "default": "./data-structs/dist/index.cjs"
+      },
+      "import": {
+        "types": "./data-structs/dist/index.d.ts",
+        "default": "./data-structs/dist/index.js"
+      },
+      "default": {
+        "types": "./data-structs/dist/index.d.ts",
+        "default": "./data-structs/dist/index.js"
      }
    }
  },
@@ -289,7 +317,10 @@
    "./storage",
    "./response-synthesizers",
    "./chat-engine",
-    "./retriever"
+    "./retriever",
+    "./vector-store",
+    "./tools",
+    "./data-structs"
  ],
  "scripts": {
    "dev": "bunchee --watch",
@@ -303,15 +334,15 @@
  "devDependencies": {
    "@edge-runtime/vm": "^4.0.3",
    "ajv": "^8.17.1",
-    "bunchee": "5.3.2",
+    "bunchee": "5.5.1",
    "happy-dom": "^15.7.4",
-    "natural": "^8.0.1",
-    "python-format-js": "^1.4.3"
+    "natural": "^8.0.1"
  },
  "dependencies": {
    "@llamaindex/env": "workspace:*",
    "@types/node": "^22.5.1",
    "magic-bytes.js": "^1.10.0",
-    "zod": "^3.23.8"
+    "zod": "^3.23.8",
+    "zod-to-json-schema": "^3.23.3"
  }
 }
@@ -0,0 +1,67 @@
+import { randomUUID } from "@llamaindex/env";
+import type { UUID } from "../global";
+import { IndexStructType } from "./struct-type";
+
+export abstract class IndexStruct {
+  indexId: string;
+  summary: string | undefined;
+
+  constructor(
+    indexId: UUID = randomUUID(),
+    summary: string | undefined = undefined,
+  ) {
+    this.indexId = indexId;
+    this.summary = summary;
+  }
+
+  toJson(): Record<string, unknown> {
+    return {
+      indexId: this.indexId,
+      summary: this.summary,
+    };
+  }
+
+  getSummary(): string {
+    if (this.summary === undefined) {
+      throw new Error("summary field of the index struct is not set");
+    }
+    return this.summary;
+  }
+}
+
+// A table of keywords mapping keywords to text chunks.
+export class KeywordTable extends IndexStruct {
+  table: Map<string, Set<string>> = new Map();
+  type: IndexStructType = IndexStructType.KEYWORD_TABLE;
+
+  addNode(keywords: string[], nodeId: string): void {
+    keywords.forEach((keyword) => {
+      if (!this.table.has(keyword)) {
+        this.table.set(keyword, new Set());
+      }
+      this.table.get(keyword)!.add(nodeId);
+    });
+  }
+
+  deleteNode(keywords: string[], nodeId: string) {
+    keywords.forEach((keyword) => {
+      if (this.table.has(keyword)) {
+        this.table.get(keyword)!.delete(nodeId);
+      }
+    });
+  }
+
+  toJson(): Record<string, unknown> {
+    return {
+      ...super.toJson(),
+      table: Array.from(this.table.entries()).reduce(
+        (acc, [keyword, nodeIds]) => {
+          acc[keyword] = Array.from(nodeIds);
+          return acc;
+        },
+        {} as Record<string, string[]>,
+      ),
+      type: this.type,
+    };
+  }
+}
@@ -0,0 +1,2 @@
+export { IndexStruct, KeywordTable } from "./data-structs";
+export { IndexStructType } from "./struct-type";
@@ -0,0 +1,39 @@
+export const IndexStructType = {
+  NODE: "node",
+  TREE: "tree",
+  LIST: "list",
+  KEYWORD_TABLE: "keyword_table",
+  DICT: "dict",
+  SIMPLE_DICT: "simple_dict",
+  WEAVIATE: "weaviate",
+  PINECONE: "pinecone",
+  QDRANT: "qdrant",
+  LANCEDB: "lancedb",
+  MILVUS: "milvus",
+  CHROMA: "chroma",
+  MYSCALE: "myscale",
+  CLICKHOUSE: "clickhouse",
+  VECTOR_STORE: "vector_store",
+  OPENSEARCH: "opensearch",
+  DASHVECTOR: "dashvector",
+  CHATGPT_RETRIEVAL_PLUGIN: "chatgpt_retrieval_plugin",
+  DEEPLAKE: "deeplake",
+  EPSILLA: "epsilla",
+  MULTIMODAL_VECTOR_STORE: "multimodal",
+  SQL: "sql",
+  KG: "kg",
+  SIMPLE_KG: "simple_kg",
+  SIMPLE_LPG: "simple_lpg",
+  NEBULAGRAPH: "nebulagraph",
+  FALKORDB: "falkordb",
+  EMPTY: "empty",
+  COMPOSITE: "composite",
+  PANDAS: "pandas",
+  DOCUMENT_SUMMARY: "document_summary",
+  VECTARA: "vectara",
+  ZILLIZ_CLOUD_PIPELINE: "zilliz_cloud_pipeline",
+  POSTGRESML: "postgresml",
+} as const;
+
+export type IndexStructType =
+  (typeof IndexStructType)[keyof typeof IndexStructType];
@@ -1,7 +1,7 @@
-import format from "python-format-js";
 import type { ChatMessage } from "../llms";
 import type { BaseOutputParser, Metadata } from "../schema";
 import { objectEntries } from "../utils";
+import { format } from "./format";
 import { PromptType } from "./prompt-type";

 type MappingFn<TemplatesVar extends string[] = string[]> = (
@@ -0,0 +1,207 @@
+/**
+ * MIT License
+ *
+ * Copyright (c) 2019 jhonararipe
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in all
+ * copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+"use strict";
+function formatImpl(this: string, ...args_: any[]) {
+  // Create variables
+  let self = this;
+  const __patterns__ = self.match(/({.*?})/g);
+  const {
+    REF,
+    FILL_CHAR,
+    MASK_NUMBER,
+    ALIGN_OP,
+    CROP_SIZE,
+    DOT,
+    FRACTION,
+    TYPE_VAR,
+  } = {
+    REF: 1,
+    FILL_CHAR: 2,
+    MASK_NUMBER: 3,
+    ALIGN_OP: 4,
+    CROP_SIZE: 5,
+    DOT: 6,
+    FRACTION: 7,
+    TYPE_VAR: 8,
+  };
+  const DEFAULT_PLACE = 6;
+  const ALL_REGEXP =
+    /{(\w+)?:([^>\^<\d#]|0)?([#%,])?([>^<\.])?(\d+)?(\.)?(\d+)?([eEfFgGdxXobn#%])?}/g;
+  const regExpBasic = /{\[?(\w+)\]?}/; // it's not best solution
+  const isObject = typeof args_[0] === "object";
+  // types/use logic
+  __patterns__?.map((pattern, patt_index) => {
+    const kargs = ALL_REGEXP.exec(pattern) || ALL_REGEXP.exec(pattern);
+    const wargs = regExpBasic.exec(pattern);
+
+    // Insert values (one 2 one / array / object)
+    const INDEX_VAR =
+      (wargs ? wargs[REF] : kargs ? kargs[REF] : patt_index) || patt_index;
+    // @ts-expect-error
+    const NATUAL_VALUE = isObject ? args_[0][INDEX_VAR] : args_[INDEX_VAR];
+    // @ts-expect-error
+    let ACTUAL_VALUE = isObject ? args_[0][INDEX_VAR] : args_[INDEX_VAR];
+
+    // Verify sintax/semantic
+    if (ACTUAL_VALUE === null || ACTUAL_VALUE === undefined)
+      throw new Error(
+        `Replacement index ${INDEX_VAR} out of range for positional args tuple`,
+      );
+    if (kargs) {
+      // If TYPE_VAR is not defined and the first argument is a number, pad a string should from left, so set TYPE_VAR to "d"
+      if (kargs[TYPE_VAR] === undefined && typeof ACTUAL_VALUE === "number") {
+        kargs[TYPE_VAR] = "d";
+      }
+      const LETTER =
+        (!kargs[FILL_CHAR]
+          ? false
+          : !kargs[ALIGN_OP] &&
+              [..."FfbefoxXn"].includes(kargs[FILL_CHAR].toLowerCase())
+            ? kargs[FILL_CHAR]
+            : kargs[TYPE_VAR]) || kargs[TYPE_VAR];
+      //  padronaze
+      if (LETTER) {
+        const floatSize = pattern.includes(".")
+          ? Number(kargs[FRACTION] || kargs[CROP_SIZE])
+          : DEFAULT_PLACE;
+        switch (LETTER) {
+          case "E":
+            ACTUAL_VALUE =
+              ACTUAL_VALUE.toExponential(DEFAULT_PLACE).toUpperCase();
+            break;
+          case "e":
+            ACTUAL_VALUE = ACTUAL_VALUE.toExponential(DEFAULT_PLACE);
+            break;
+          case "X":
+            ACTUAL_VALUE = ACTUAL_VALUE.toString(16).toUpperCase();
+            break;
+          case "x":
+            ACTUAL_VALUE = ACTUAL_VALUE.toString(16); // Hexadecimal
+            break;
+          case "b":
+            ACTUAL_VALUE = ACTUAL_VALUE.toString(2); // Binary
+            break;
+          case "f":
+          case "F":
+            ACTUAL_VALUE = ACTUAL_VALUE.toFixed(floatSize);
+            break;
+          case "o":
+            ACTUAL_VALUE = ACTUAL_VALUE.toString(8); // Octal
+            break;
+          default:
+            break;
+        }
+        //  mask
+        switch (kargs[MASK_NUMBER]) {
+          case "#":
+            const MASK = {
+              x: "0x",
+              X: "0X",
+              o: "0o",
+              b: "0b",
+            }[LETTER];
+            ACTUAL_VALUE = MASK + ACTUAL_VALUE;
+            break;
+        }
+      }
+      // signal
+      if (
+        // @ts-expect-error
+        [..." +-,%"].includes(kargs[FILL_CHAR]) &&
+        typeof NATUAL_VALUE === "number"
+      ) {
+        ACTUAL_VALUE = ACTUAL_VALUE.toString().replace("-", "");
+        if (NATUAL_VALUE >= 0)
+          switch (kargs[FILL_CHAR]) {
+            case "+":
+              ACTUAL_VALUE = "+" + ACTUAL_VALUE;
+              break;
+            case " ":
+              ACTUAL_VALUE = " " + ACTUAL_VALUE;
+              break;
+            case ",":
+              ACTUAL_VALUE = NATUAL_VALUE.toString()
+                .split(/(?=(?:...)*$)/)
+                .join(kargs[FILL_CHAR]);
+              break;
+            case "%":
+              ACTUAL_VALUE =
+                (NATUAL_VALUE * 100).toFixed(
+                  // @ts-expect-error
+                  kargs[FRACTION] || DEFAULT_PLACE,
+                ) + "%";
+              break;
+          }
+        else ACTUAL_VALUE = "-" + ACTUAL_VALUE;
+      }
+      // space / order / trim
+      if (kargs[CROP_SIZE]) {
+        ACTUAL_VALUE = ACTUAL_VALUE.toString();
+        const FILL_ELEMENT = kargs[FILL_CHAR] || " ";
+        const SIZE_STRING = ACTUAL_VALUE.length;
+        const SIZE_ARG = kargs[CROP_SIZE];
+        const FILL_LENGTH = SIZE_STRING > SIZE_ARG ? SIZE_STRING : SIZE_ARG;
+        const FILL = FILL_ELEMENT.repeat(FILL_LENGTH);
+
+        switch (kargs[ALIGN_OP] || kargs[FILL_CHAR]) {
+          case "<":
+            ACTUAL_VALUE = ACTUAL_VALUE.padEnd(FILL_LENGTH, FILL_ELEMENT);
+            break;
+          case ".":
+            if (!(LETTER && /[fF]/.test(LETTER)))
+              ACTUAL_VALUE = ACTUAL_VALUE.slice(0, SIZE_ARG);
+            break;
+          case ">":
+            ACTUAL_VALUE = ACTUAL_VALUE.padStart(FILL_LENGTH, FILL_ELEMENT);
+            break;
+          case "^":
+            const length_start = Math.floor((FILL_LENGTH - SIZE_STRING) / 2);
+            const string_start =
+              length_start > 0
+                ? FILL_ELEMENT.repeat(length_start) + ACTUAL_VALUE
+                : ACTUAL_VALUE;
+
+            ACTUAL_VALUE = FILL.replace(
+              RegExp(`.{${string_start.length}}`),
+              string_start,
+            );
+            break;
+          default:
+            ACTUAL_VALUE = LETTER
+              ? ACTUAL_VALUE.padStart(FILL_LENGTH, FILL_ELEMENT)
+              : ACTUAL_VALUE.padEnd(FILL_LENGTH, FILL_ELEMENT);
+            break;
+        }
+      }
+    }
+
+    // SET Definitive value
+    self = self.replace(pattern, ACTUAL_VALUE);
+  });
+
+  return self;
+}
+
+export const format = (inputString: string, ...param: any[]) =>
+  formatImpl.apply(inputString, param);
@@ -12,11 +12,15 @@ export {
  defaultCondenseQuestionPrompt,
  defaultContextSystemPrompt,
  defaultKeywordExtractPrompt,
+  defaultNodeTextTemplate,
  defaultQueryKeywordExtractPrompt,
+  defaultQuestionExtractPrompt,
  defaultRefinePrompt,
  defaultSubQuestionPrompt,
  defaultSummaryPrompt,
  defaultTextQAPrompt,
+  defaultTitleCombinePromptTemplate,
+  defaultTitleExtractorPromptTemplate,
  defaultTreeSummarizePrompt,
 } from "./prompt";
 export type {
@@ -25,9 +29,12 @@ export type {
  ContextSystemPrompt,
  KeywordExtractPrompt,
  QueryKeywordExtractPrompt,
+  QuestionExtractPrompt,
  RefinePrompt,
  SubQuestionPrompt,
  SummaryPrompt,
  TextQAPrompt,
+  TitleCombinePrompt,
+  TitleExtractorPrompt,
  TreeSummarizePrompt,
 } from "./prompt";
@@ -13,8 +13,12 @@ export type CondenseQuestionPrompt = PromptTemplate<
  ["chatHistory", "question"]
 >;
 export type ContextSystemPrompt = PromptTemplate<["context"]>;
-export type KeywordExtractPrompt = PromptTemplate<["context"]>;
+export type KeywordExtractPrompt = PromptTemplate<["context", "maxKeywords"]>;
 export type QueryKeywordExtractPrompt = PromptTemplate<["question"]>;
+export type QuestionExtractPrompt = PromptTemplate<["context", "numQuestions"]>;
+export type TitleExtractorPrompt = PromptTemplate<["context"]>;
+export type TitleCombinePrompt = PromptTemplate<["context"]>;
+export type KeywordExtractorPrompt = PromptTemplate<["context", "numKeywords"]>;

 export const defaultTextQAPrompt: TextQAPrompt = new PromptTemplate({
  templateVars: ["context", "query"],
@@ -253,3 +257,55 @@ export const defaultQueryKeywordExtractPrompt = new PromptTemplate({
 }).partialFormat({
  maxKeywords: "10",
 });
+
+export const defaultQuestionExtractPrompt = new PromptTemplate({
+  templateVars: ["numQuestions", "context"],
+  template: `(
+  "Given the contextual informations below, generate {numQuestions} questions this context can provides specific answers to which are unlikely to be found else where. Higher-level summaries of surrounding context may be provided as well. "
+  "Try using these summaries to generate better questions that this context can answer."
+  "---------------------"
+  "{context}"
+  "---------------------"
+  "Provide questions in the following format: 'QUESTIONS: <questions>'"
+)`,
+}).partialFormat({
+  numQuestions: "5",
+});
+
+export const defaultTitleExtractorPromptTemplate = new PromptTemplate({
+  templateVars: ["context"],
+  template: `{context}
+Give a title that summarizes all of the unique entities, titles or themes found in the context. 
+Title: `,
+});
+
+export const defaultTitleCombinePromptTemplate = new PromptTemplate({
+  templateVars: ["context"],
+  template: `{context} 
+Based on the above candidate titles and contents, what is the comprehensive title for this document? 
+Title: `,
+});
+
+export const defaultKeywordExtractorPromptTemplate = new PromptTemplate({
+  templateVars: ["context", "numKeywords"],
+  template: `{context}
+Give {numKeywords} unique keywords for this document. 
+Format as comma separated. 
+Keywords: `,
+}).partialFormat({
+  keywordCount: "5",
+});
+
+export const defaultNodeTextTemplate = new PromptTemplate({
+  templateVars: ["metadataStr", "content"],
+  template: `[Excerpt from document]
+{metadataStr}
+Excerpt:
+-----
+{content}
+-----
+`,
+}).partialFormat({
+  metadataStr: "",
+  content: "",
+});
@@ -0,0 +1,62 @@
+import type { JSONSchemaType } from "ajv";
+import { z } from "zod";
+import { zodToJsonSchema } from "zod-to-json-schema";
+import type { JSONValue } from "../global";
+import type { BaseTool, ToolMetadata } from "../llms";
+
+const kOriginalFn = Symbol("originalFn");
+
+export class FunctionTool<T, R extends JSONValue | Promise<JSONValue>>
+  implements BaseTool<T>
+{
+  [kOriginalFn]?: (input: T) => R;
+
+  #fn: (input: T) => R;
+  #metadata: ToolMetadata<JSONSchemaType<T>>;
+  // todo: for the future, we can use zod to validate the input parameters
+  #zodType: z.ZodType<T> | null = null;
+  constructor(
+    fn: (input: T) => R,
+    metadata: ToolMetadata<JSONSchemaType<T>>,
+    zodType?: z.ZodType<T>,
+  ) {
+    this.#fn = fn;
+    this.#metadata = metadata;
+    if (zodType) {
+      this.#zodType = zodType;
+    }
+  }
+
+  static from<T>(
+    fn: (input: T) => JSONValue | Promise<JSONValue>,
+    schema: ToolMetadata<JSONSchemaType<T>>,
+  ): FunctionTool<T, JSONValue | Promise<JSONValue>>;
+  static from<T, R extends z.ZodType<T>>(
+    fn: (input: T) => JSONValue | Promise<JSONValue>,
+    schema: Omit<ToolMetadata, "parameters"> & {
+      parameters: R;
+    },
+  ): FunctionTool<T, JSONValue>;
+  static from(fn: any, schema: any): any {
+    if (schema.parameter instanceof z.ZodSchema) {
+      const jsonSchema = zodToJsonSchema(schema.parameter);
+      return new FunctionTool(
+        fn,
+        {
+          ...schema,
+          parameters: jsonSchema,
+        },
+        schema.parameter,
+      );
+    }
+    return new FunctionTool(fn, schema);
+  }
+
+  get metadata(): BaseTool<T>["metadata"] {
+    return this.#metadata as BaseTool<T>["metadata"];
+  }
+
+  call(input: T) {
+    return this.#fn.call(null, input);
+  }
+}
@@ -0,0 +1 @@
+export { FunctionTool } from "./function-tool";
@@ -0,0 +1,35 @@
+import { FunctionTool } from "@llamaindex/core/tools";
+import { describe, test } from "vitest";
+import { z } from "zod";
+
+describe("FunctionTool", () => {
+  test("type system", () => {
+    FunctionTool.from((input: string) => input, {
+      name: "test",
+      description: "test",
+    });
+    FunctionTool.from(({ input }: { input: string }) => input, {
+      name: "test",
+      description: "test",
+      parameters: {
+        type: "object",
+        properties: {
+          input: {
+            type: "string",
+          },
+        },
+        required: ["input"],
+      },
+    });
+    const inputSchema = z
+      .object({
+        input: z.string(),
+      })
+      .required();
+    FunctionTool.from(({ input }: { input: string }) => input, {
+      name: "test",
+      description: "test",
+      parameters: inputSchema,
+    });
+  });
+});
@@ -0,0 +1,8 @@
+{
+  "type": "module",
+  "main": "./dist/index.cjs",
+  "module": "./dist/index.js",
+  "types": "./dist/index.d.ts",
+  "exports": "./dist/index.js",
+  "private": true
+}
@@ -0,0 +1,8 @@
+{
+  "type": "module",
+  "main": "./dist/index.cjs",
+  "module": "./dist/index.js",
+  "types": "./dist/index.d.ts",
+  "exports": "./dist/index.js",
+  "private": true
+}
@@ -1,5 +1,18 @@
 # @llamaindex/env

+## 0.1.15
+
+### Patch Changes
+
+- 4ba2cfe: fix(env): align export APIs
+
+## 0.1.14
+
+### Patch Changes
+
+- ae49ff4: feat: use `gpt-tokenizer`
+- a75af83: refactor: move some llm and embedding to single package
+
 ## 0.1.13

 ### Patch Changes
@@ -1,10 +1,11 @@
 {
  "name": "@llamaindex/env",
  "description": "environment wrapper, supports all JS environment including node, deno, bun, edge runtime, and cloudflare worker",
-  "version": "0.1.13",
+  "version": "0.1.15",
  "type": "module",
-  "types": "dist/type/index.d.ts",
-  "main": "dist/cjs/index.js",
+  "types": "dist/index.d.ts",
+  "module": "dist/index.js",
+  "main": "dist/index.cjs",
  "keywords": [
    "llm",
    "llama",
@@ -24,29 +25,30 @@
  "exports": {
    ".": {
      "node": {
-        "types": "./dist/type/index.d.ts",
+        "types": "./dist/index.d.ts",
        "import": "./dist/index.js",
-        "default": "./dist/cjs/index.js"
+        "require": "./dist/index.cjs",
+        "default": "./dist/index.cjs"
      },
      "workerd": {
-        "types": "./dist/type/index.workerd.d.ts",
+        "types": "./dist/index.workerd.d.ts",
        "default": "./dist/index.workerd.js"
      },
      "edge-light": {
-        "types": "./dist/type/index.edge-light.d.ts",
+        "types": "./dist/index.edge-light.d.ts",
        "default": "./dist/index.edge-light.js"
      },
      "browser": {
-        "types": "./dist/type/index.browser.d.ts",
+        "types": "./dist/index.browser.d.ts",
        "default": "./dist/index.browser.js"
      },
      "import": {
-        "types": "./dist/type/index.d.ts",
+        "types": "./dist/index.d.ts",
        "default": "./dist/index.js"
      },
      "require": {
-        "types": "./dist/type/index.d.ts",
-        "default": "./dist/cjs/index.js"
+        "types": "./dist/index.d.cts",
+        "default": "./dist/index.cjs"
      }
    }
  },
@@ -61,33 +63,25 @@
    "directory": "packages/env"
  },
  "scripts": {
-    "build": "rm -rf ./dist && pnpm run build:esm && pnpm run build:cjs && pnpm run build:type",
-    "build:esm": "swc src -d dist --strip-leading-paths --config-file ../../.swcrc",
-    "build:cjs": "swc src -d dist/cjs --strip-leading-paths --config-file ../../.cjs.swcrc",
-    "build:type": "tsc -p tsconfig.json",
-    "postbuild": "node -e \"require('fs').writeFileSync('./dist/cjs/package.json', JSON.stringify({ type: 'commonjs' }))\"",
-    "dev": "concurrently \"pnpm run build:esm --watch\" \"pnpm run build:cjs --watch\" \"pnpm run build:type --watch\"",
+    "dev": "bunchee --watch",
+    "build": "bunchee",
    "test": "vitest"
  },
  "devDependencies": {
-    "@aws-crypto/sha256-js": "^5.2.0",
-    "@swc/cli": "^0.4.0",
-    "@swc/core": "^1.7.22",
+    "@types/node": "^22.5.1",
+    "@types/readable-stream": "^4.0.15",
    "@xenova/transformers": "^2.17.2",
-    "concurrently": "^8.2.2",
+    "bunchee": "5.5.1",
+    "gpt-tokenizer": "^2.5.0",
    "pathe": "^1.1.2",
-    "tiktoken": "^1.0.16",
    "vitest": "^2.0.5"
  },
-  "dependencies": {
-    "@types/node": "^22.5.1"
-  },
  "peerDependencies": {
    "@aws-crypto/sha256-js": "^5.2.0",
    "@xenova/transformers": "^2.17.2",
+    "gpt-tokenizer": "^2.5.0",
    "js-tiktoken": "^1.0.12",
-    "pathe": "^1.1.2",
-    "tiktoken": "^1.0.15"
+    "pathe": "^1.1.2"
  },
  "peerDependenciesMeta": {
    "@aws-crypto/sha256-js": {
@@ -5,4 +5,7 @@
 */
 import memFS from "./memfs/index.js";

+export function createWriteStream() {
+  throw new Error("Not supported in this environment.");
+}
 export const fs = memFS.promises;
@@ -4,7 +4,6 @@
 * @module
 */
 import "./global-check.js";
-export * from "./web-polyfill.js";

 export { consoleLogger, emptyLogger, type Logger } from "./logger/index.js";
 export {
@@ -14,7 +13,8 @@ export {
  type OnLoad,
 } from "./multi-model/index.browser.js";
 export { Tokenizers, tokenizers, type Tokenizer } from "./tokenizers/js.js";
-
+export { NotSupportCurrentRuntimeClass } from "./utils/shared.js";
+export * from "./web-polyfill.js";
 // @ts-expect-error
 if (typeof window === "undefined") {
  console.warn(
@@ -4,8 +4,6 @@
 * @module
 */
 import "./global-check.js";
-export * from "./node-polyfill.js";
-
 export { consoleLogger, emptyLogger, type Logger } from "./logger/index.js";
 export {
  loadTransformers,
@@ -13,4 +11,6 @@ export {
  type LoadTransformerEvent,
  type OnLoad,
 } from "./multi-model/index.non-nodejs.js";
+export * from "./node-polyfill.js";
 export { Tokenizers, tokenizers, type Tokenizer } from "./tokenizers/js.js";
+export { NotSupportCurrentRuntimeClass } from "./utils/shared.js";
@@ -47,6 +47,7 @@ export {
  getEnv,
  setEnvs,
 } from "./utils/index.js";
+export { NotSupportCurrentRuntimeClass } from "./utils/shared.js";
 export {
  createWriteStream,
  EOL,
@@ -7,6 +7,8 @@
 */
 import { INTERNAL_ENV } from "./utils/index.js";

+export { NotSupportCurrentRuntimeClass } from "./utils/shared.js";
+
 export * from "./node-polyfill.js";

 export function getEnv(name: string): string | undefined {
@@ -9,9 +9,12 @@
 */
 import { Sha256 } from "@aws-crypto/sha256-js";
 import pathe from "pathe";
-import { fs } from "./fs/memory.js";
+import { NotSupportCurrentRuntimeClass } from "./utils/shared.js";

-export { fs, pathe as path };
+export { createWriteStream, fs } from "./fs/memory.js";
+export { fileURLToPath } from "./url/index.js";
+export { pathe as path };
+export const Readable = NotSupportCurrentRuntimeClass.bind("non-Node.js");

 export interface SHA256 {
  update(data: string | Uint8Array): void;
@@ -2,21 +2,18 @@
 import type { Tokenizer } from "./types.js";
 import { Tokenizers } from "./types.js";

-import { get_encoding } from "tiktoken";
+import cl100kBase from "gpt-tokenizer";

 class TokenizerSingleton {
-  private defaultTokenizer: Tokenizer;
+  #defaultTokenizer: Tokenizer;

  constructor() {
-    const encoding = get_encoding("cl100k_base");
-
-    this.defaultTokenizer = {
-      encode: (text: string) => {
-        return encoding.encode(text);
+    this.#defaultTokenizer = {
+      encode: (text: string): Uint32Array => {
+        return new Uint32Array(cl100kBase.encode(text));
      },
      decode: (tokens: Uint32Array) => {
-        const text = encoding.decode(tokens);
-        return new TextDecoder().decode(text);
+        return cl100kBase.decode(tokens);
      },
    };
  }
@@ -26,7 +23,7 @@ class TokenizerSingleton {
      throw new Error(`Tokenizer encoding ${encoding} not yet supported`);
    }

-    return this.defaultTokenizer;
+    return this.#defaultTokenizer;
  }
 }

@@ -0,0 +1,172 @@
+// Copyright (c) 2000-2006, The Perl Foundation.
+//
+// 	Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed.
+//
+// 	Preamble
+//
+// This license establishes the terms under which a given free software Package may be copied, modified, distributed, and/or redistributed. The intent is that the Copyright Holder maintains some artistic control over the development of that Package while still keeping the Package available as open source and free software.
+//
+// 	You are always permitted to make arrangements wholly outside of this license directly with the Copyright Holder of a given Package.  If the terms of this license do not permit the full use that you propose to make of the Package, you should contact the Copyright Holder and seek a different licensing arrangement.
+//
+// 	Definitions
+//
+// "Copyright Holder" means the individual(s) or organization(s) named in the copyright notice for the entire Package.
+//
+// "Contributor" means any party that has contributed code or other material to the Package, in accordance with the Copyright Holder's procedures.
+//
+// "You" and "your" means any person who would like to copy, distribute, or modify the Package.
+//
+// "Package" means the collection of files distributed by the Copyright Holder, and derivatives of that collection and/or of those files. A given Package may consist of either the Standard Version, or a Modified Version.
+//
+// "Distribute" means providing a copy of the Package or making it accessible to anyone else, or in the case of a company or organization, to others outside of your company or organization.
+//
+// "Distributor Fee" means any fee that you charge for Distributing this Package or providing support for this Package to another party.  It does not mean licensing fees.
+//
+// "Standard Version" refers to the Package if it has not been modified, or has been modified only in ways explicitly requested by the Copyright Holder.
+//
+// "Modified Version" means the Package, if it has been changed, and such changes were not explicitly requested by the Copyright Holder.
+//
+// "Original License" means this Artistic License as Distributed with the Standard Version of the Package, in its current version or as it may be modified by The Perl Foundation in the future.
+//
+// "Source" form means the source code, documentation source, and configuration files for the Package.
+//
+// "Compiled" form means the compiled bytecode, object code, binary, or any other form resulting from mechanical transformation or translation of the Source form.
+//
+// 	Permission for Use and Modification Without Distribution
+//
+// (1) You are permitted to use the Standard Version and create and use Modified Versions for any purpose without restriction, provided that you do not Distribute the Modified Version.
+//
+// 	Permissions for Redistribution of the Standard Version
+//
+// (2) You may Distribute verbatim copies of the Source form of the Standard Version of this Package in any medium without restriction, either gratis or for a Distributor Fee, provided that you duplicate all of the original copyright notices and associated disclaimers.  At your discretion, such verbatim copies may or may not include a Compiled form of the Package.
+//
+// 	(3) You may apply any bug fixes, portability changes, and other modifications made available from the Copyright Holder.  The resulting Package will still be considered the Standard Version, and as such will be subject to the Original License.
+//
+// 	Distribution of Modified Versions of the Package as Source
+//
+// (4) You may Distribute your Modified Version as Source (either gratis or for a Distributor Fee, and with or without a Compiled form of the Modified Version) provided that you clearly document how it differs from the Standard Version, including, but not limited to, documenting any non-standard features, executables, or modules, and provided that you do at least ONE of the following:
+//
+// 	(a) make the Modified Version available to the Copyright Holder of the Standard Version, under the Original License, so that the Copyright Holder may include your modifications in the Standard Version.
+// 	(b) ensure that installation of your Modified Version does not prevent the user installing or running the Standard Version. In addition, the Modified Version must bear a name that is different from the name of the Standard Version.
+// 	(c) allow anyone who receives a copy of the Modified Version to make the Source form of the Modified Version available to others under
+//
+// (i) the Original License or
+// (ii) a license that permits the licensee to freely copy, modify and redistribute the Modified Version using the same licensing terms that apply to the copy that the licensee received, and requires that the Source form of the Modified Version, and of any works derived from it, be made freely available in that license fees are prohibited but Distributor Fees are allowed.
+//
+// 	Distribution of Compiled Forms of the Standard Version or Modified Versions without the Source
+//
+// (5)  You may Distribute Compiled forms of the Standard Version without the Source, provided that you include complete instructions on how to get the Source of the Standard Version.  Such instructions must be valid at the time of your distribution.  If these instructions, at any time while you are carrying out such distribution, become invalid, you must provide new instructions on demand or cease further distribution. If you provide valid instructions or cease distribution within thirty days after you become aware that the instructions are invalid, then you do not forfeit any of your rights under this license.
+//
+// 	(6)  You may Distribute a Modified Version in Compiled form without the Source, provided that you comply with Section 4 with respect to the Source of the Modified Version.
+//
+// 	Aggregating or Linking the Package
+//
+// (7)  You may aggregate the Package (either the Standard Version or Modified Version) with other packages and Distribute the resulting aggregation provided that you do not charge a licensing fee for the Package.  Distributor Fees are permitted, and licensing fees for other components in the aggregation are permitted. The terms of this license apply to the use and Distribution of the Standard or Modified Versions as included in the aggregation.
+//
+// 	(8) You are permitted to link Modified and Standard Versions with other works, to embed the Package in a larger work of your own, or to build stand-alone binary or bytecode versions of applications that include the Package, and Distribute the result without restriction, provided the result does not expose a direct interface to the Package.
+//
+// 	Items That are Not Considered Part of a Modified Version
+//
+// (9) Works (including, but not limited to, modules and scripts) that merely extend or make use of the Package, do not, by themselves, cause the Package to be a Modified Version.  In addition, such works are not considered parts of the Package itself, and are not subject to the terms of this license.
+//
+// 	General Provisions
+//
+// (10)  Any use, modification, and distribution of the Standard or Modified Versions is governed by this Artistic License. By using, modifying or distributing the Package, you accept this license. Do not use, modify, or distribute the Package, if you do not accept this license.
+//
+// 	(11)  If your Modified Version has been derived from a Modified Version made by someone other than you, you are nevertheless required to ensure that your Modified Version complies with the requirements of this license.
+//
+// 	(12)  This license does not grant you the right to use any trademark, service mark, tradename, or logo of the Copyright Holder.
+//
+// 	(13)  This license includes the non-exclusive, worldwide, free-of-charge patent license to make, have made, use, offer to sell, sell, import and otherwise transfer the Package with respect to any patent claims licensable by the Copyright Holder that are necessarily infringed by the Package. If you institute patent litigation (including a cross-claim or counterclaim) against any party alleging that the Package constitutes direct or contributory patent infringement, then this Artistic License to you shall terminate on the date that such litigation is filed.
+//
+// 	(14)  Disclaimer of Warranty:
+// 	THE PACKAGE IS PROVIDED BY THE COPYRIGHT HOLDER AND CONTRIBUTORS "AS IS" AND WITHOUT ANY EXPRESS OR IMPLIED WARRANTIES. THE IMPLIED WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, OR NON-INFRINGEMENT ARE DISCLAIMED TO THE EXTENT PERMITTED BY YOUR LOCAL LAW. UNLESS REQUIRED BY LAW, NO COPYRIGHT HOLDER OR CONTRIBUTOR WILL BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, OR CONSEQUENTIAL DAMAGES ARISING IN ANY WAY OUT OF THE USE OF THE PACKAGE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+/**
+ * This function ensures the correct decodings of percent-encoded characters as
+ * well as ensuring a cross-platform valid absolute path string.
+ */
+export function fileURLToPath(href: string, separator: string): string {
+  // conform with Node.js fileURLToPath
+  if (!href.includes(":/")) {
+    const error = new Error("Invalid URL") as any;
+    error.code = "ERR_INVALID_URL";
+    throw error;
+  }
+  if (!href.startsWith("file:")) {
+    const error = new Error("The URL must be of scheme file") as any;
+    error.code = "ERR_INVALID_URL_SCHEME";
+    throw error;
+  }
+
+  // https://en.wikipedia.org/wiki/File_URI_scheme#Examples
+  // https://nodejs.org/api/url.html#urlfileurltopathurl
+  // file:/path (no hostname)
+  // file://hostname/path
+  // file:///path (empty hostname)
+  let file;
+  if (separator === "\\") {
+    // is windows
+    if (href.startsWith("file:///")) {
+      // is full path, e.g. file:///foo
+      file = href.substring(8);
+      if (file[1] !== ":") {
+        const error = new Error("File URL path must be absolute") as any;
+        error.code = "ERR_INVALID_FILE_URL_PATH";
+        throw error;
+      }
+    } else if (href.startsWith("file://localhost/")) {
+      // is localhost path, e.g. file://localhost/foo
+      // conform with Node.js fileURLToPath
+      file = href.substring(17); // trim leading slash
+      if (file[1] !== ":") {
+        const error = new Error("File URL path must be absolute") as any;
+        error.code = "ERR_INVALID_FILE_URL_PATH";
+        throw error;
+      }
+    } else if (href.startsWith("file://")) {
+      // is host path, e.g. file://hostname/foo
+      // conform with Node.js fileURLToPath, which does not error
+      file = href.substring(7);
+      file = separator + separator + file;
+    } else if (href.startsWith("file:/")) {
+      // is full path with unknown drive letter
+      // conform with Node.js fileURLToPath
+      file = href.substring(6);
+      if (file[1] !== ":") {
+        const error = new Error("File URL path must be absolute") as any;
+        error.code = "ERR_INVALID_FILE_URL_PATH";
+        throw error;
+      }
+    } else {
+      file = href;
+    }
+
+    // replace slashes with backslashes
+    file = file.replace(/[/]/g, separator);
+  } else if (separator === "/") {
+    // is posix
+    if (href.startsWith("file:///")) {
+      // is full path, e.g. file:///foo
+      file = href.substring(7); // keep leading slash
+    } else if (href.startsWith("file://")) {
+      // is host path, e.g. file://localhost/foo
+      if (!href.startsWith("file://localhost/")) {
+        const error = new Error(
+          'File URL host must be "localhost" or empty',
+        ) as any;
+        error.code = "ERR_INVALID_FILE_URL_HOST";
+        throw error;
+      }
+      file = href.substring(16); // keep leading slash
+    } else if (href.startsWith("file:/")) {
+      // is full path, e.g. file:/foo
+      file = href.substring(5); // keep leading slash
+    } else {
+      file = href;
+    }
+  } else {
+    file = href;
+  }
+  return file;
+}
@@ -0,0 +1,13 @@
+export class NotSupportCurrentRuntimeClass {
+  constructor(runtime: string) {
+    throw new Error(`Current environment ${runtime} is not supported`);
+  }
+
+  static bind(runtime: string) {
+    return class extends NotSupportCurrentRuntimeClass {
+      constructor(...args: any[]) {
+        super(runtime);
+      }
+    } as any;
+  }
+}
@@ -9,9 +9,12 @@
 */
 import { Sha256 } from "@aws-crypto/sha256-js";
 import pathe from "pathe";
-import { fs } from "./fs/memory.js";
+import { NotSupportCurrentRuntimeClass } from "./utils/shared.js";

-export { fs, pathe as path };
+export { createWriteStream, fs } from "./fs/memory.js";
+export { fileURLToPath } from "./url/index.js";
+export { pathe as path };
+export const Readable = NotSupportCurrentRuntimeClass.bind("browser");

 export interface SHA256 {
  update(data: string | Uint8Array): void;
@@ -0,0 +1,11 @@
+import { describe, expect, it } from "vitest";
+import { tokenizers } from "../src/tokenizers/node.js";
+
+describe("tokenizer", () => {
+  it("should tokenize text", () => {
+    const tokenizer = tokenizers.tokenizer();
+    expect(tokenizer.decode(tokenizer.encode("hello world"))).toBe(
+      "hello world",
+    );
+  });
+});
@@ -1,5 +1,59 @@
 # @llamaindex/experimental

+## 0.0.104
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 0.0.103
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 0.0.102
+
+### Patch Changes
+
+- a75af83: refactor: move some llm and embedding to single package
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 0.0.101
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+
+## 0.0.100
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 0.0.99
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 0.0.98
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 0.0.97

 ### Patch Changes
@@ -1,7 +1,7 @@
 {
  "name": "@llamaindex/experimental",
  "description": "Experimental package for LlamaIndexTS",
-  "version": "0.0.97",
+  "version": "0.0.104",
  "type": "module",
  "types": "dist/type/index.d.ts",
  "main": "dist/cjs/index.js",
@@ -1,5 +1,105 @@
 # llamaindex

+## 0.7.3
+
+### Patch Changes
+
+- Updated dependencies [0493f67]
+  - @llamaindex/core@0.3.3
+  - @llamaindex/cloud@1.0.3
+  - @llamaindex/anthropic@0.0.4
+  - @llamaindex/clip@0.0.4
+  - @llamaindex/deepinfra@0.0.4
+  - @llamaindex/huggingface@0.0.4
+  - @llamaindex/ollama@0.0.11
+  - @llamaindex/openai@0.1.20
+  - @llamaindex/portkey-ai@0.0.4
+  - @llamaindex/replicate@0.0.4
+  - @llamaindex/groq@0.0.19
+
+## 0.7.2
+
+### Patch Changes
+
+- Updated dependencies [4ba2cfe]
+  - @llamaindex/env@0.1.15
+  - @llamaindex/cloud@1.0.2
+  - @llamaindex/core@0.3.2
+  - @llamaindex/anthropic@0.0.3
+  - @llamaindex/clip@0.0.3
+  - @llamaindex/deepinfra@0.0.3
+  - @llamaindex/groq@0.0.18
+  - @llamaindex/huggingface@0.0.3
+  - @llamaindex/ollama@0.0.10
+  - @llamaindex/openai@0.1.19
+  - @llamaindex/portkey-ai@0.0.3
+  - @llamaindex/replicate@0.0.3
+
+## 0.7.1
+
+### Patch Changes
+
+- ae49ff4: feat: use `gpt-tokenizer`
+- 4c38c1b: fix(cloud): do not detect file type in llama parse
+- a75af83: feat: allow passing perform setup in pg vector store
+- a75af83: refactor: move some llm and embedding to single package
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [24d065f]
+- Updated dependencies [a75af83]
+  - @llamaindex/env@0.1.14
+  - @llamaindex/cloud@1.0.1
+  - @llamaindex/huggingface@0.0.2
+  - @llamaindex/portkey-ai@0.0.2
+  - @llamaindex/anthropic@0.0.2
+  - @llamaindex/deepinfra@0.0.2
+  - @llamaindex/replicate@0.0.2
+  - @llamaindex/ollama@0.0.9
+  - @llamaindex/openai@0.1.18
+  - @llamaindex/clip@0.0.2
+  - @llamaindex/groq@0.0.17
+  - @llamaindex/core@0.3.1
+
+## 0.7.0
+
+### Minor Changes
+
+- 1364e8e: update metadata extractors to use PromptTemplate
+- 96fc69c: Correct initialization of QuestionsAnsweredExtractor so that it uses the promptTemplate arg when passed in
+
+### Patch Changes
+
+- 3b7736f: feat: added gemini 002 support
+- Updated dependencies [1364e8e]
+- Updated dependencies [96fc69c]
+  - @llamaindex/core@0.3.0
+  - @llamaindex/cloud@1.0.0
+  - @llamaindex/ollama@0.0.8
+  - @llamaindex/openai@0.1.17
+  - @llamaindex/groq@0.0.16
+
+## 0.6.22
+
+### Patch Changes
+
+- 5729bd9: Fix LlamaCloud API calls for ensuring an index and for file uploads
+
+## 0.6.21
+
+### Patch Changes
+
+- 6f75306: feat: support metadata filters for AstraDB
+- 94cb4ad: feat: Add metadata filters to ChromaDb and update to 1.9.2
+
+## 0.6.20
+
+### Patch Changes
+
+- 6a9a7b1: fix: take init api key into account
+- Updated dependencies [6a9a7b1]
+  - @llamaindex/openai@0.1.16
+  - @llamaindex/groq@0.0.15
+
 ## 0.6.19

 ### Patch Changes
@@ -1,5 +1,58 @@
 # @llamaindex/cloudflare-worker-agent-test

+## 0.0.88
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 0.0.87
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 0.0.86
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 0.0.85
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+
+## 0.0.84
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 0.0.83
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 0.0.82
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 0.0.81

 ### Patch Changes
@@ -1,6 +1,6 @@
 {
  "name": "@llamaindex/cloudflare-worker-agent-test",
-  "version": "0.0.81",
+  "version": "0.0.88",
  "type": "module",
  "private": true,
  "scripts": {
@@ -1,5 +1,32 @@
 # @llamaindex/llama-parse-browser-test

+## 0.0.14
+
+### Patch Changes
+
+- @llamaindex/cloud@1.0.3
+
+## 0.0.13
+
+### Patch Changes
+
+- @llamaindex/cloud@1.0.2
+
+## 0.0.12
+
+### Patch Changes
+
+- Updated dependencies [4c38c1b]
+- Updated dependencies [24d065f]
+- Updated dependencies [a75af83]
+  - @llamaindex/cloud@1.0.1
+
+## 0.0.11
+
+### Patch Changes
+
+- @llamaindex/cloud@1.0.0
+
 ## 0.0.10

 ### Patch Changes
@@ -1,7 +1,7 @@
 {
  "name": "@llamaindex/llama-parse-browser-test",
  "private": true,
-  "version": "0.0.10",
+  "version": "0.0.14",
  "type": "module",
  "scripts": {
    "dev": "vite",
@@ -1,5 +1,58 @@
 # @llamaindex/next-agent-test

+## 0.1.88
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 0.1.87
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 0.1.86
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 0.1.85
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+
+## 0.1.84
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 0.1.83
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 0.1.82
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 0.1.81

 ### Patch Changes
@@ -1,6 +1,6 @@
 {
  "name": "@llamaindex/next-agent-test",
-  "version": "0.1.81",
+  "version": "0.1.88",
  "private": true,
  "scripts": {
    "dev": "next dev",
@@ -1,5 +1,58 @@
 # test-edge-runtime

+## 0.1.87
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 0.1.86
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 0.1.85
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 0.1.84
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+
+## 0.1.83
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 0.1.82
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 0.1.81
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 0.1.80

 ### Patch Changes
@@ -1,6 +1,6 @@
 {
  "name": "@llamaindex/nextjs-edge-runtime-test",
-  "version": "0.1.80",
+  "version": "0.1.87",
  "private": true,
  "scripts": {
    "dev": "next dev",
@@ -1,19 +1,12 @@
-import { tokenizerResultPromise } from "@/utils/llm";
-import { use } from "react";
+import "@/utils/llm";

 export const runtime = "edge";

 export default function Home() {
-  const result = use(tokenizerResultPromise);
  return (
    <main>
      <div>
        <h1>Next.js Edge Runtime</h1>
-        <div>
-          {result.map((value, index) => (
-            <span key={index}>{value}</span>
-          ))}
-        </div>
      </div>
    </main>
  );
@@ -1,23 +1,8 @@
 // test runtime
 import "llamaindex";
-import { ClipEmbedding } from "llamaindex";
 import "llamaindex/readers/SimpleDirectoryReader";

 // @ts-expect-error
 if (typeof EdgeRuntime !== "string") {
  throw new Error("Expected run in EdgeRuntime");
 }
-
-export const tokenizerResultPromise = new Promise<number[]>(
-  (resolve, reject) => {
-    const embedding = new ClipEmbedding();
-    //#region make sure @xenova/transformers is working in edge runtime
-    embedding
-      .getTokenizer()
-      .then((tokenizer) => {
-        resolve(tokenizer.encode("hello world"));
-      })
-      .catch(reject);
-    //#endregion
-  },
-);
@@ -1,5 +1,58 @@
 # @llamaindex/next-node-runtime

+## 0.0.69
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 0.0.68
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 0.0.67
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 0.0.66
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+
+## 0.0.65
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 0.0.64
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 0.0.63
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 0.0.62

 ### Patch Changes
@@ -1,6 +1,6 @@
 {
  "name": "@llamaindex/next-node-runtime-test",
-  "version": "0.0.62",
+  "version": "0.0.69",
  "private": true,
  "scripts": {
    "dev": "next dev",
@@ -1,5 +1,58 @@
 # @llamaindex/waku-query-engine-test

+## 0.0.88
+
+### Patch Changes
+
+- llamaindex@0.7.3
+
+## 0.0.87
+
+### Patch Changes
+
+- llamaindex@0.7.2
+
+## 0.0.86
+
+### Patch Changes
+
+- Updated dependencies [ae49ff4]
+- Updated dependencies [4c38c1b]
+- Updated dependencies [a75af83]
+- Updated dependencies [a75af83]
+  - llamaindex@0.7.1
+
+## 0.0.85
+
+### Patch Changes
+
+- Updated dependencies [1364e8e]
+- Updated dependencies [3b7736f]
+- Updated dependencies [96fc69c]
+  - llamaindex@0.7.0
+
+## 0.0.84
+
+### Patch Changes
+
+- Updated dependencies [5729bd9]
+  - llamaindex@0.6.22
+
+## 0.0.83
+
+### Patch Changes
+
+- Updated dependencies [6f75306]
+- Updated dependencies [94cb4ad]
+  - llamaindex@0.6.21
+
+## 0.0.82
+
+### Patch Changes
+
+- Updated dependencies [6a9a7b1]
+  - llamaindex@0.6.20
+
 ## 0.0.81

 ### Patch Changes
@@ -1,6 +1,6 @@
 {
  "name": "@llamaindex/waku-query-engine-test",
-  "version": "0.0.81",
+  "version": "0.0.88",
  "type": "module",
  "private": true,
  "scripts": {
@@ -10,17 +10,16 @@
  },
  "dependencies": {
    "llamaindex": "workspace:*",
-    "react": "19.0.0-rc-7771d3a7-20240827",
-    "react-dom": "19.0.0-rc-7771d3a7-20240827",
-    "react-server-dom-webpack": "19.0.0-rc-7771d3a7-20240827",
-    "waku": "0.21.1"
+    "react": "19.0.0-rc-bf7e210c-20241017",
+    "react-dom": "19.0.0-rc-bf7e210c-20241017",
+    "react-server-dom-webpack": "19.0.0-rc-bf7e210c-20241017",
+    "waku": "0.21.4"
  },
  "devDependencies": {
-    "@types/react": "18.3.5",
-    "@types/react-dom": "18.3.0",
-    "autoprefixer": "10.4.20",
-    "tailwindcss": "3.4.10",
-    "typescript": "5.6.2",
-    "vite-plugin-wasm": "^3.3.0"
+    "@types/react": "18.3.11",
+    "@types/react-dom": "18.3.1",
+    "autoprefixer": "^10.4.20",
+    "tailwindcss": "^3.4.14",
+    "typescript": "5.6.2"
  }
 }
@@ -1,8 +0,0 @@
-import wasm from "vite-plugin-wasm";
-
-export default {
-  plugins: [wasm()],
-  ssr: {
-    external: ["tiktoken"],
-  },
-};
@@ -105,3 +105,22 @@ await test("simple node", async (t) => {
    assert.deepStrictEqual(result.nodes, []);
  }
 });
+
+await test("no setup", async (t) => {
+  // @ts-expect-error private method
+  assert.ok(PGVectorStore.prototype.checkSchema);
+  // @ts-expect-error private method
+  const Mock = class extends PGVectorStore {
+    private override async checkSchema(): Promise<any> {
+      throw new Error("should not be called");
+    }
+  };
+  const vectorStore = new Mock({
+    clientConfig: pgConfig,
+    performSetup: false,
+  });
+  const db = await vectorStore.client();
+  t.after(async () => {
+    await db.close();
+  });
+});
@@ -1,6 +1,6 @@
 {
  "name": "llamaindex",
-  "version": "0.6.19",
+  "version": "0.7.3",
  "license": "MIT",
  "type": "module",
  "keywords": [
@@ -29,13 +29,18 @@
    "@google-cloud/vertexai": "1.2.0",
    "@google/generative-ai": "0.12.0",
    "@grpc/grpc-js": "^1.11.1",
-    "@huggingface/inference": "^2.8.0",
+    "@llamaindex/anthropic": "workspace:*",
+    "@llamaindex/clip": "workspace:*",
    "@llamaindex/cloud": "workspace:*",
    "@llamaindex/core": "workspace:*",
+    "@llamaindex/deepinfra": "workspace:*",
    "@llamaindex/env": "workspace:*",
    "@llamaindex/groq": "workspace:*",
+    "@llamaindex/huggingface": "workspace:*",
    "@llamaindex/ollama": "workspace:*",
    "@llamaindex/openai": "workspace:*",
+    "@llamaindex/portkey-ai": "workspace:*",
+    "@llamaindex/replicate": "workspace:^0.0.4",
    "@mistralai/mistralai": "^1.0.4",
    "@mixedbread-ai/sdk": "^2.2.11",
    "@pinecone-database/pinecone": "^3.0.2",
@@ -48,9 +53,11 @@
    "@zilliz/milvus2-sdk-node": "^2.4.6",
    "ajv": "^8.17.1",
    "assemblyai": "^4.7.0",
-    "chromadb": "1.8.1",
+    "chromadb": "1.9.2",
+    "chromadb-default-embed": "^2.13.2",
    "cohere-ai": "7.13.0",
    "discord-api-types": "^0.37.98",
+    "gpt-tokenizer": "^2.5.0",
    "groq-sdk": "^0.6.1",
    "js-tiktoken": "^1.0.14",
    "lodash": "^4.17.21",
@@ -62,10 +69,8 @@
    "openai": "^4.60.0",
    "papaparse": "^5.4.1",
    "pathe": "^1.1.2",
-    "portkey-ai": "0.1.16",
    "rake-modified": "^1.0.8",
    "string-strip-html": "^13.4.8",
-    "tiktoken": "^1.0.15",
    "unpdf": "^0.11.0",
    "weaviate-client": "^3.1.4",
    "wikipedia": "^2.1.2",
@@ -11,7 +11,6 @@ import {
  type NodeParser,
  SentenceSplitter,
 } from "@llamaindex/core/node-parser";
-import type { LoadTransformerEvent } from "@llamaindex/env";
 import { AsyncLocalStorage } from "@llamaindex/env";
 import type { ServiceContext } from "./ServiceContext.js";
 import {
@@ -20,12 +19,6 @@ import {
  withEmbeddedModel,
 } from "./internal/settings/EmbedModel.js";

-declare module "@llamaindex/core/global" {
-  interface LlamaIndexEventMaps {
-    "load-transformers": LoadTransformerEvent;
-  }
-}
-
 export type PromptConfig = {
  llm?: string;
  lang?: string;
@@ -1,43 +1 @@
-import {
-  LLMAgent,
-  LLMAgentWorker,
-  type LLMAgentParams,
-} from "@llamaindex/core/agent";
-import type {
-  NonStreamingChatEngineParams,
-  StreamingChatEngineParams,
-} from "@llamaindex/core/chat-engine";
-import type { EngineResponse } from "@llamaindex/core/schema";
-import { Settings } from "../Settings.js";
-import { Anthropic } from "../llm/anthropic.js";
-
-export type AnthropicAgentParams = LLMAgentParams;
-
-export class AnthropicAgentWorker extends LLMAgentWorker {}
-
-export class AnthropicAgent extends LLMAgent {
-  constructor(params: AnthropicAgentParams) {
-    const llm =
-      params.llm ??
-      (Settings.llm instanceof Anthropic
-        ? (Settings.llm as Anthropic)
-        : new Anthropic());
-    super({
-      ...params,
-      llm,
-    });
-  }
-
-  async chat(params: NonStreamingChatEngineParams): Promise<EngineResponse>;
-  async chat(params: StreamingChatEngineParams): Promise<never>;
-  override async chat(
-    params: NonStreamingChatEngineParams | StreamingChatEngineParams,
-  ) {
-    const { stream } = params;
-    if (stream) {
-      // Anthropic does support this, but looks like it's not supported in the LITS LLM
-      throw new Error("Anthropic does not support streaming");
-    }
-    return super.chat(params);
-  }
-}
+export * from "@llamaindex/anthropic";
@@ -41,7 +41,7 @@ export class LLamaCloudFileService {
  ) {
    initService();
    const { data: file } = await FilesService.uploadFileApiV1FilesPost({
-      path: { project_id: projectId },
+      query: { project_id: projectId },
      body: {
        upload_file: uploadFile,
      },
@@ -378,7 +378,7 @@ export class LlamaCloudIndex {

      const { data: pipeline } =
        await PipelinesService.upsertPipelineApiV1PipelinesPut({
-          path: {
+          query: {
            project_id: projectId,
          },
          body: {
@@ -1,139 +1 @@
-import { MultiModalEmbedding } from "@llamaindex/core/embeddings";
-import type { ImageType } from "@llamaindex/core/schema";
-import _ from "lodash";
-// only import type, to avoid bundling error
-import { loadTransformers } from "@llamaindex/env";
-import type {
-  CLIPTextModelWithProjection,
-  CLIPVisionModelWithProjection,
-  PreTrainedTokenizer,
-  Processor,
-} from "@xenova/transformers";
-import { Settings } from "../Settings.js";
-
-async function readImage(input: ImageType) {
-  const { RawImage } = await loadTransformers((transformer) => {
-    Settings.callbackManager.dispatchEvent(
-      "load-transformers",
-      {
-        transformer,
-      },
-      true,
-    );
-  });
-  if (input instanceof Blob) {
-    return await RawImage.fromBlob(input);
-  } else if (_.isString(input) || input instanceof URL) {
-    return await RawImage.fromURL(input);
-  } else {
-    throw new Error(`Unsupported input type: ${typeof input}`);
-  }
-}
-
-export enum ClipEmbeddingModelType {
-  XENOVA_CLIP_VIT_BASE_PATCH32 = "Xenova/clip-vit-base-patch32",
-  XENOVA_CLIP_VIT_BASE_PATCH16 = "Xenova/clip-vit-base-patch16",
-}
-
-export class ClipEmbedding extends MultiModalEmbedding {
-  modelType: ClipEmbeddingModelType =
-    ClipEmbeddingModelType.XENOVA_CLIP_VIT_BASE_PATCH16;
-
-  private tokenizer: PreTrainedTokenizer | null = null;
-  private processor: Processor | null = null;
-  private visionModel: CLIPVisionModelWithProjection | null = null;
-  private textModel: CLIPTextModelWithProjection | null = null;
-
-  constructor() {
-    super();
-  }
-
-  async getTokenizer() {
-    const { AutoTokenizer } = await loadTransformers((transformer) => {
-      Settings.callbackManager.dispatchEvent(
-        "load-transformers",
-        {
-          transformer,
-        },
-        true,
-      );
-    });
-    if (!this.tokenizer) {
-      this.tokenizer = await AutoTokenizer.from_pretrained(this.modelType);
-    }
-    return this.tokenizer;
-  }
-
-  async getProcessor() {
-    const { AutoProcessor } = await loadTransformers((transformer) => {
-      Settings.callbackManager.dispatchEvent(
-        "load-transformers",
-        {
-          transformer,
-        },
-        true,
-      );
-    });
-    if (!this.processor) {
-      this.processor = await AutoProcessor.from_pretrained(this.modelType);
-    }
-    return this.processor;
-  }
-
-  async getVisionModel() {
-    const { CLIPVisionModelWithProjection } = await loadTransformers(
-      (transformer) => {
-        Settings.callbackManager.dispatchEvent(
-          "load-transformers",
-          {
-            transformer,
-          },
-          true,
-        );
-      },
-    );
-    if (!this.visionModel) {
-      this.visionModel = await CLIPVisionModelWithProjection.from_pretrained(
-        this.modelType,
-      );
-    }
-
-    return this.visionModel;
-  }
-
-  async getTextModel() {
-    const { CLIPTextModelWithProjection } = await loadTransformers(
-      (transformer) => {
-        Settings.callbackManager.dispatchEvent(
-          "load-transformers",
-          {
-            transformer,
-          },
-          true,
-        );
-      },
-    );
-    if (!this.textModel) {
-      this.textModel = await CLIPTextModelWithProjection.from_pretrained(
-        this.modelType,
-      );
-    }
-
-    return this.textModel;
-  }
-
-  async getImageEmbedding(image: ImageType): Promise<number[]> {
-    const loadedImage = await readImage(image);
-    const imageInputs = await (await this.getProcessor())(loadedImage);
-    const { image_embeds } = await (await this.getVisionModel())(imageInputs);
-    return Array.from(image_embeds.data);
-  }
-
-  async getTextEmbedding(text: string): Promise<number[]> {
-    const textInputs = await (
-      await this.getTokenizer()
-    )([text], { padding: true, truncation: true });
-    const { text_embeds } = await (await this.getTextModel())(textInputs);
-    return text_embeds.data;
-  }
-}
+export * from "@llamaindex/clip";
@@ -1,17 +0,0 @@
-import { MultiModalEmbedding } from "@llamaindex/core/embeddings";
-import type { ImageType } from "@llamaindex/core/schema";
-
-/**
- * Cloudflare worker doesn't support image embeddings for now
- */
-export class CloudflareWorkerMultiModalEmbedding extends MultiModalEmbedding {
-  constructor() {
-    super();
-  }
-  getImageEmbedding(images: ImageType): Promise<number[]> {
-    throw new Error("Method not implemented.");
-  }
-  getTextEmbedding(text: string): Promise<number[]> {
-    throw new Error("Method not implemented.");
-  }
-}
@@ -1,152 +1 @@
-import { BaseEmbedding } from "@llamaindex/core/embeddings";
-import type { MessageContentDetail } from "@llamaindex/core/llms";
-import { extractSingleText } from "@llamaindex/core/utils";
-import { getEnv } from "@llamaindex/env";
-
-const DEFAULT_MODEL = "sentence-transformers/clip-ViT-B-32";
-
-const API_TOKEN_ENV_VARIABLE_NAME = "DEEPINFRA_API_TOKEN";
-
-const API_ROOT = "https://api.deepinfra.com/v1/inference";
-
-const DEFAULT_TIMEOUT = 60 * 1000;
-
-const DEFAULT_MAX_RETRIES = 5;
-
-export interface DeepInfraEmbeddingResponse {
-  embeddings: number[][];
-  request_id: string;
-  inference_status: InferenceStatus;
-}
-
-export interface InferenceStatus {
-  status: string;
-  runtime_ms: number;
-  cost: number;
-  tokens_input: number;
-}
-
-const mapPrefixWithInputs = (prefix: string, inputs: string[]): string[] => {
-  return inputs.map((input) => (prefix ? `${prefix} ${input}` : input));
-};
-
-/**
- * DeepInfraEmbedding is an alias for DeepInfra that implements the BaseEmbedding interface.
- */
-export class DeepInfraEmbedding extends BaseEmbedding {
-  /**
-   * DeepInfra model to use
-   * @default "sentence-transformers/clip-ViT-B-32"
-   * @see https://deepinfra.com/models/embeddings
-   */
-  model: string;
-
-  /**
-   * DeepInfra API token
-   * @see https://deepinfra.com/dash/api_keys
-   * If not provided, it will try to get the token from the environment variable `DEEPINFRA_API_TOKEN`
-   *
-   */
-  apiToken: string;
-
-  /**
-   * Prefix to add to the query
-   * @default ""
-   */
-  queryPrefix: string;
-
-  /**
-   * Prefix to add to the text
-   * @default ""
-   */
-  textPrefix: string;
-
-  /**
-   *
-   * @default 5
-   */
-  maxRetries: number;
-
-  /**
-   *
-   * @default 60 * 1000
-   */
-  timeout: number;
-
-  constructor(init?: Partial<DeepInfraEmbedding>) {
-    super();
-
-    this.model = init?.model ?? DEFAULT_MODEL;
-    this.apiToken = init?.apiToken ?? getEnv(API_TOKEN_ENV_VARIABLE_NAME) ?? "";
-    this.queryPrefix = init?.queryPrefix ?? "";
-    this.textPrefix = init?.textPrefix ?? "";
-    this.maxRetries = init?.maxRetries ?? DEFAULT_MAX_RETRIES;
-    this.timeout = init?.timeout ?? DEFAULT_TIMEOUT;
-  }
-
-  async getTextEmbedding(text: string): Promise<number[]> {
-    const texts = mapPrefixWithInputs(this.textPrefix, [text]);
-    const embeddings = await this.getDeepInfraEmbedding(texts);
-    return embeddings[0]!;
-  }
-
-  async getQueryEmbedding(
-    query: MessageContentDetail,
-  ): Promise<number[] | null> {
-    const text = extractSingleText(query);
-    if (text) {
-      const queries = mapPrefixWithInputs(this.queryPrefix, [text]);
-      const embeddings = await this.getDeepInfraEmbedding(queries);
-      return embeddings[0]!;
-    } else {
-      return null;
-    }
-  }
-
-  getTextEmbeddings = async (texts: string[]): Promise<number[][]> => {
-    const textsWithPrefix = mapPrefixWithInputs(this.textPrefix, texts);
-    return this.getDeepInfraEmbedding(textsWithPrefix);
-  };
-
-  async getQueryEmbeddings(queries: string[]): Promise<number[][]> {
-    const queriesWithPrefix = mapPrefixWithInputs(this.queryPrefix, queries);
-    return await this.getDeepInfraEmbedding(queriesWithPrefix);
-  }
-
-  private async getDeepInfraEmbedding(inputs: string[]): Promise<number[][]> {
-    const url = this.getUrl(this.model);
-
-    for (let attempt = 0; attempt < this.maxRetries; attempt++) {
-      const controller = new AbortController();
-      const id = setTimeout(() => controller.abort(), this.timeout);
-
-      try {
-        const response = await fetch(url, {
-          method: "POST",
-          headers: {
-            "Content-Type": "application/json",
-            Authorization: `Bearer ${this.apiToken}`,
-          },
-          body: JSON.stringify({ inputs }),
-          signal: controller.signal,
-        });
-        if (!response.ok) {
-          throw new Error(`Request failed with status ${response.status}`);
-        }
-
-        const responseJson: DeepInfraEmbeddingResponse = await response.json();
-        return responseJson.embeddings;
-      } catch (error) {
-        console.error(`Attempt ${attempt + 1} failed: ${error}`);
-      } finally {
-        clearTimeout(id);
-      }
-    }
-
-    throw new Error("Exceeded maximum retries");
-  }
-
-  private getUrl(model: string): string {
-    return `${API_ROOT}/${model}`;
-  }
-}
+export * from "@llamaindex/deepinfra";
@@ -1,110 +1 @@
-import { HfInference } from "@huggingface/inference";
-import { BaseEmbedding } from "@llamaindex/core/embeddings";
-import { loadTransformers } from "@llamaindex/env";
-import { Settings } from "../Settings.js";
-
-export enum HuggingFaceEmbeddingModelType {
-  XENOVA_ALL_MINILM_L6_V2 = "Xenova/all-MiniLM-L6-v2",
-  XENOVA_ALL_MPNET_BASE_V2 = "Xenova/all-mpnet-base-v2",
-}
-
-/**
- * Uses feature extraction from '@xenova/transformers' to generate embeddings.
- * Per default the model [XENOVA_ALL_MINILM_L6_V2](https://huggingface.co/Xenova/all-MiniLM-L6-v2) is used.
- *
- * Can be changed by setting the `modelType` parameter in the constructor, e.g.:
- * ```
- * new HuggingFaceEmbedding({
- *     modelType: HuggingFaceEmbeddingModelType.XENOVA_ALL_MPNET_BASE_V2,
- * });
- * ```
- *
- * @extends BaseEmbedding
- */
-export class HuggingFaceEmbedding extends BaseEmbedding {
-  modelType: string = HuggingFaceEmbeddingModelType.XENOVA_ALL_MINILM_L6_V2;
-  quantized: boolean = true;
-
-  private extractor: any;
-
-  constructor(init?: Partial<HuggingFaceEmbedding>) {
-    super();
-    Object.assign(this, init);
-  }
-
-  async getExtractor() {
-    if (!this.extractor) {
-      const { pipeline } = await loadTransformers((transformer) => {
-        Settings.callbackManager.dispatchEvent(
-          "load-transformers",
-          {
-            transformer,
-          },
-          true,
-        );
-      });
-      this.extractor = await pipeline("feature-extraction", this.modelType, {
-        quantized: this.quantized,
-      });
-    }
-    return this.extractor;
-  }
-
-  override async getTextEmbedding(text: string): Promise<number[]> {
-    const extractor = await this.getExtractor();
-    const output = await extractor(text, { pooling: "mean", normalize: true });
-    return Array.from(output.data);
-  }
-}
-
-// Workaround to get the Options type from @huggingface/inference@2.7.0
-type HfInferenceOptions = ConstructorParameters<typeof HfInference>[1];
-
-export type HFConfig = HfInferenceOptions & {
-  model: string;
-  accessToken: string;
-  endpoint?: string;
-};
-
-/**
- * Uses feature extraction from Hugging Face's Inference API to generate embeddings.
- *
- * Set the `model` and `accessToken` parameter in the constructor, e.g.:
- * ```
- * new HuggingFaceInferenceAPIEmbedding({
- *     model: HuggingFaceEmbeddingModelType.XENOVA_ALL_MPNET_BASE_V2,
- *     accessToken: "<your-access-token>"
- * });
- * ```
- *
- * @extends BaseEmbedding
- */
-export class HuggingFaceInferenceAPIEmbedding extends BaseEmbedding {
-  model: string;
-  hf: HfInference;
-
-  constructor(init: HFConfig) {
-    super();
-    const { model, accessToken, endpoint, ...hfInferenceOpts } = init;
-
-    this.hf = new HfInference(accessToken, hfInferenceOpts);
-    this.model = model;
-    if (endpoint) this.hf.endpoint(endpoint);
-  }
-
-  async getTextEmbedding(text: string): Promise<number[]> {
-    const res = await this.hf.featureExtraction({
-      model: this.model,
-      inputs: text,
-    });
-    return res as number[];
-  }
-
-  getTextEmbeddings = async (texts: string[]): Promise<Array<number[]>> => {
-    const res = await this.hf.featureExtraction({
-      model: this.model,
-      inputs: texts,
-    });
-    return res as number[][];
-  };
-}
+export * from "@llamaindex/huggingface";
@@ -1,4 +1,5 @@
 export * from "@llamaindex/core/embeddings";
+export { ClipEmbedding, ClipEmbeddingModelType } from "./ClipEmbedding.js";
 export { DeepInfraEmbedding } from "./DeepInfraEmbedding.js";
 export { FireworksEmbedding } from "./fireworks.js";
 export * from "./GeminiEmbedding.js";
@@ -9,5 +10,3 @@ export * from "./MixedbreadAIEmbeddings.js";
 export { OllamaEmbedding } from "./OllamaEmbedding.js";
 export * from "./OpenAIEmbedding.js";
 export { TogetherEmbedding } from "./together.js";
-// ClipEmbedding might not work in non-node.js runtime, but it doesn't have side effects
-export { ClipEmbedding, ClipEmbeddingModelType } from "./ClipEmbedding.js";
@@ -1,14 +1,20 @@
 import type { LLM } from "@llamaindex/core/llms";
+import {
+  PromptTemplate,
+  defaultKeywordExtractPrompt,
+  defaultQuestionExtractPrompt,
+  defaultSummaryPrompt,
+  defaultTitleCombinePromptTemplate,
+  defaultTitleExtractorPromptTemplate,
+  type KeywordExtractPrompt,
+  type QuestionExtractPrompt,
+  type SummaryPrompt,
+  type TitleCombinePrompt,
+  type TitleExtractorPrompt,
+} from "@llamaindex/core/prompts";
 import type { BaseNode } from "@llamaindex/core/schema";
 import { MetadataMode, TextNode } from "@llamaindex/core/schema";
 import { OpenAI } from "@llamaindex/openai";
-import {
-  defaultKeywordExtractorPromptTemplate,
-  defaultQuestionAnswerPromptTemplate,
-  defaultSummaryExtractorPromptTemplate,
-  defaultTitleCombinePromptTemplate,
-  defaultTitleExtractorPromptTemplate,
-} from "./prompts.js";
 import { BaseExtractor } from "./types.js";

 const STRIP_REGEX = /(\r\n|\n|\r)/gm;
@@ -16,6 +22,7 @@ const STRIP_REGEX = /(\r\n|\n|\r)/gm;
 type KeywordExtractArgs = {
  llm?: LLM;
  keywords?: number;
+  promptTemplate?: KeywordExtractPrompt["template"];
 };

 type ExtractKeyword = {
@@ -39,6 +46,12 @@ export class KeywordExtractor extends BaseExtractor {
   */
  keywords: number = 5;

+  /**
+   * The prompt template to use for the question extractor.
+   * @type {string}
+   */
+  promptTemplate: KeywordExtractPrompt;
+
  /**
   * Constructor for the KeywordExtractor class.
   * @param {LLM} llm LLM instance.
@@ -53,6 +66,12 @@ export class KeywordExtractor extends BaseExtractor {

    this.llm = options?.llm ?? new OpenAI();
    this.keywords = options?.keywords ?? 5;
+    this.promptTemplate = options?.promptTemplate
+      ? new PromptTemplate({
+          templateVars: ["context", "maxKeywords"],
+          template: options.promptTemplate,
+        })
+      : defaultKeywordExtractPrompt;
  }

  /**
@@ -66,9 +85,9 @@ export class KeywordExtractor extends BaseExtractor {
    }

    const completion = await this.llm.complete({
-      prompt: defaultKeywordExtractorPromptTemplate({
-        contextStr: node.getContent(MetadataMode.ALL),
-        keywords: this.keywords,
+      prompt: this.promptTemplate.format({
+        context: node.getContent(MetadataMode.ALL),
+        maxKeywords: this.keywords.toString(),
      }),
    });

@@ -93,8 +112,8 @@ export class KeywordExtractor extends BaseExtractor {
 type TitleExtractorsArgs = {
  llm?: LLM;
  nodes?: number;
-  nodeTemplate?: string;
-  combineTemplate?: string;
+  nodeTemplate?: TitleExtractorPrompt["template"];
+  combineTemplate?: TitleCombinePrompt["template"];
 };

 type ExtractTitle = {
@@ -129,19 +148,19 @@ export class TitleExtractor extends BaseExtractor {
   * The prompt template to use for the title extractor.
   * @type {string}
   */
-  nodeTemplate: string;
+  nodeTemplate: TitleExtractorPrompt;

  /**
   * The prompt template to merge title with..
   * @type {string}
   */
-  combineTemplate: string;
+  combineTemplate: TitleCombinePrompt;

  /**
   * Constructor for the TitleExtractor class.
   * @param {LLM} llm LLM instance.
   * @param {number} nodes Number of nodes to extract titles from.
-   * @param {string} nodeTemplate The prompt template to use for the title extractor.
+   * @param {TitleExtractorPrompt} nodeTemplate The prompt template to use for the title extractor.
   * @param {string} combineTemplate The prompt template to merge title with..
   */
  constructor(options?: TitleExtractorsArgs) {
@@ -150,10 +169,19 @@ export class TitleExtractor extends BaseExtractor {
    this.llm = options?.llm ?? new OpenAI();
    this.nodes = options?.nodes ?? 5;

-    this.nodeTemplate =
-      options?.nodeTemplate ?? defaultTitleExtractorPromptTemplate();
-    this.combineTemplate =
-      options?.combineTemplate ?? defaultTitleCombinePromptTemplate();
+    this.nodeTemplate = options?.nodeTemplate
+      ? new PromptTemplate({
+          templateVars: ["context"],
+          template: options.nodeTemplate,
+        })
+      : defaultTitleExtractorPromptTemplate;
+
+    this.combineTemplate = options?.combineTemplate
+      ? new PromptTemplate({
+          templateVars: ["context"],
+          template: options.combineTemplate,
+        })
+      : defaultTitleCombinePromptTemplate;
  }

  /**
@@ -218,8 +246,8 @@ export class TitleExtractor extends BaseExtractor {
      const titleCandidates = await this.getTitlesCandidates(nodes);
      const combinedTitles = titleCandidates.join(", ");
      const completion = await this.llm.complete({
-        prompt: defaultTitleCombinePromptTemplate({
-          contextStr: combinedTitles,
+        prompt: this.combineTemplate.format({
+          context: combinedTitles,
        }),
      });

@@ -232,8 +260,8 @@ export class TitleExtractor extends BaseExtractor {
  private async getTitlesCandidates(nodes: BaseNode[]): Promise<string[]> {
    const titleJobs = nodes.map(async (node) => {
      const completion = await this.llm.complete({
-        prompt: defaultTitleExtractorPromptTemplate({
-          contextStr: node.getContent(MetadataMode.ALL),
+        prompt: this.nodeTemplate.format({
+          context: node.getContent(MetadataMode.ALL),
        }),
      });

@@ -247,7 +275,7 @@ export class TitleExtractor extends BaseExtractor {
 type QuestionAnswerExtractArgs = {
  llm?: LLM;
  questions?: number;
-  promptTemplate?: string;
+  promptTemplate?: QuestionExtractPrompt["template"];
  embeddingOnly?: boolean;
 };

@@ -276,7 +304,7 @@ export class QuestionsAnsweredExtractor extends BaseExtractor {
   * The prompt template to use for the question extractor.
   * @type {string}
   */
-  promptTemplate: string;
+  promptTemplate: QuestionExtractPrompt;

  /**
   * Wheter to use metadata for embeddings only
@@ -289,7 +317,7 @@ export class QuestionsAnsweredExtractor extends BaseExtractor {
   * Constructor for the QuestionsAnsweredExtractor class.
   * @param {LLM} llm LLM instance.
   * @param {number} questions Number of questions to generate.
-   * @param {string} promptTemplate The prompt template to use for the question extractor.
+   * @param {TextQAPrompt} promptTemplate The prompt template to use for the question extractor.
   * @param {boolean} embeddingOnly Wheter to use metadata for embeddings only.
   */
  constructor(options?: QuestionAnswerExtractArgs) {
@@ -300,12 +328,14 @@ export class QuestionsAnsweredExtractor extends BaseExtractor {

    this.llm = options?.llm ?? new OpenAI();
    this.questions = options?.questions ?? 5;
-    this.promptTemplate =
-      options?.promptTemplate ??
-      defaultQuestionAnswerPromptTemplate({
-        numQuestions: this.questions,
-        contextStr: "",
-      });
+    this.promptTemplate = options?.promptTemplate
+      ? new PromptTemplate({
+          templateVars: ["numQuestions", "context"],
+          template: options.promptTemplate,
+        }).partialFormat({
+          numQuestions: "5",
+        })
+      : defaultQuestionExtractPrompt;
    this.embeddingOnly = options?.embeddingOnly ?? false;
  }

@@ -323,9 +353,9 @@ export class QuestionsAnsweredExtractor extends BaseExtractor {

    const contextStr = node.getContent(this.metadataMode);

-    const prompt = defaultQuestionAnswerPromptTemplate({
-      contextStr,
-      numQuestions: this.questions,
+    const prompt = this.promptTemplate.format({
+      context: contextStr,
+      numQuestions: this.questions.toString(),
    });

    const questions = await this.llm.complete({
@@ -356,7 +386,7 @@ export class QuestionsAnsweredExtractor extends BaseExtractor {
 type SummaryExtractArgs = {
  llm?: LLM;
  summaries?: string[];
-  promptTemplate?: string;
+  promptTemplate?: SummaryPrompt["template"];
 };

 type ExtractSummary = {
@@ -385,7 +415,7 @@ export class SummaryExtractor extends BaseExtractor {
   * The prompt template to use for the summary extractor.
   * @type {string}
   */
-  promptTemplate: string;
+  promptTemplate: SummaryPrompt;

  private selfSummary: boolean;
  private prevSummary: boolean;
@@ -404,8 +434,12 @@ export class SummaryExtractor extends BaseExtractor {

    this.llm = options?.llm ?? new OpenAI();
    this.summaries = summaries;
-    this.promptTemplate =
-      options?.promptTemplate ?? defaultSummaryExtractorPromptTemplate();
+    this.promptTemplate = options?.promptTemplate
+      ? new PromptTemplate({
+          templateVars: ["context"],
+          template: options.promptTemplate,
+        })
+      : defaultSummaryPrompt;

    this.selfSummary = summaries?.includes("self") ?? false;
    this.prevSummary = summaries?.includes("prev") ?? false;
@@ -422,10 +456,10 @@ export class SummaryExtractor extends BaseExtractor {
      return "";
    }

-    const contextStr = node.getContent(this.metadataMode);
+    const context = node.getContent(this.metadataMode);

-    const prompt = defaultSummaryExtractorPromptTemplate({
-      contextStr,
+    const prompt = this.promptTemplate.format({
+      context,
    });

    const summary = await this.llm.complete({
@@ -1,74 +0,0 @@
-export interface DefaultPromptTemplate {
-  contextStr: string;
-}
-
-export interface DefaultKeywordExtractorPromptTemplate
-  extends DefaultPromptTemplate {
-  keywords: number;
-}
-
-export interface DefaultQuestionAnswerPromptTemplate
-  extends DefaultPromptTemplate {
-  numQuestions: number;
-}
-
-export interface DefaultNodeTextTemplate {
-  metadataStr: string;
-  content: string;
-}
-
-export const defaultKeywordExtractorPromptTemplate = ({
-  contextStr = "",
-  keywords = 5,
-}: DefaultKeywordExtractorPromptTemplate) => `${contextStr} 
-Give ${keywords} unique keywords for this document. 
-Format as comma separated. 
-Keywords: `;
-
-export const defaultTitleExtractorPromptTemplate = (
-  { contextStr = "" }: DefaultPromptTemplate = {
-    contextStr: "",
-  },
-) => `${contextStr}
-Give a title that summarizes all of the unique entities, titles or themes found in the context. 
-Title: `;
-
-export const defaultTitleCombinePromptTemplate = (
-  { contextStr = "" }: DefaultPromptTemplate = {
-    contextStr: "",
-  },
-) => `${contextStr} 
-Based on the above candidate titles and contents, what is the comprehensive title for this document? 
-Title: `;
-
-export const defaultQuestionAnswerPromptTemplate = (
-  { contextStr = "", numQuestions = 5 }: DefaultQuestionAnswerPromptTemplate = {
-    contextStr: "",
-    numQuestions: 5,
-  },
-) => `${contextStr}
-Given the contextual informations, generate ${numQuestions} questions this context can provides specific answers to which are unlikely to be found else where. Higher-level summaries of surrounding context may be provideds as well. 
-Try using these summaries to generate better questions that this context can answer.
-`;
-
-export const defaultSummaryExtractorPromptTemplate = (
-  { contextStr = "" }: DefaultPromptTemplate = {
-    contextStr: "",
-  },
-) => `${contextStr}
-Summarize the key topics and entities of the sections.
-Summary: `;
-
-export const defaultNodeTextTemplate = ({
-  metadataStr = "",
-  content = "",
-}: {
-  metadataStr?: string;
-  content?: string;
-} = {}) => `[Excerpt from document]
-${metadataStr}
-Excerpt:
-----
-${content}
-----
-`;
@@ -1,10 +1,10 @@
+import { defaultNodeTextTemplate } from "@llamaindex/core/prompts";
 import {
  BaseNode,
  MetadataMode,
  TextNode,
  TransformComponent,
 } from "@llamaindex/core/schema";
-import { defaultNodeTextTemplate } from "./prompts.js";

 /*
 * Abstract class for all extractors.
@@ -71,7 +71,7 @@ export abstract class BaseExtractor extends TransformComponent {
        if (newNodes[idx] instanceof TextNode) {
          newNodes[idx] = new TextNode({
            ...newNodes[idx],
-            textTemplate: defaultNodeTextTemplate(),
+            textTemplate: defaultNodeTextTemplate.format(),
          });
        }
      }
@@ -8,39 +8,6 @@ import { runTransformations } from "../ingestion/IngestionPipeline.js";
 import type { StorageContext } from "../storage/StorageContext.js";
 import type { BaseDocumentStore } from "../storage/docStore/types.js";
 import type { BaseIndexStore } from "../storage/indexStore/types.js";
-import { IndexStruct } from "./IndexStruct.js";
-import { IndexStructType } from "./json-to-index-struct.js";
-
-// A table of keywords mapping keywords to text chunks.
-export class KeywordTable extends IndexStruct {
-  table: Map<string, Set<string>> = new Map();
-  type: IndexStructType = IndexStructType.KEYWORD_TABLE;
-
-  addNode(keywords: string[], nodeId: string): void {
-    keywords.forEach((keyword) => {
-      if (!this.table.has(keyword)) {
-        this.table.set(keyword, new Set());
-      }
-      this.table.get(keyword)!.add(nodeId);
-    });
-  }
-
-  deleteNode(keywords: string[], nodeId: string) {
-    keywords.forEach((keyword) => {
-      if (this.table.has(keyword)) {
-        this.table.get(keyword)!.delete(nodeId);
-      }
-    });
-  }
-
-  toJson(): Record<string, unknown> {
-    return {
-      ...super.toJson(),
-      table: this.table,
-      type: this.type,
-    };
-  }
-}

 export interface BaseIndexInit<T> {
  serviceContext?: ServiceContext | undefined;
@@ -13,7 +13,7 @@ import type { StorageContext } from "../../storage/StorageContext.js";
 import { storageContextFromDefaults } from "../../storage/StorageContext.js";
 import type { BaseDocumentStore } from "../../storage/docStore/types.js";
 import type { BaseIndexInit } from "../BaseIndex.js";
-import { BaseIndex, KeywordTable } from "../BaseIndex.js";
+import { BaseIndex } from "../BaseIndex.js";
 import { IndexStructType } from "../json-to-index-struct.js";
 import {
  extractKeywordsGivenResponse,
@@ -21,6 +21,7 @@ import {
  simpleExtractKeywords,
 } from "./utils.js";

+import { KeywordTable } from "@llamaindex/core/data-structs";
 import type { LLM } from "@llamaindex/core/llms";
 import {
  defaultKeywordExtractPrompt,
@@ -31,8 +31,8 @@ import type { StorageContext } from "../../storage/StorageContext.js";
 import { storageContextFromDefaults } from "../../storage/StorageContext.js";
 import type { BaseIndexStore } from "../../storage/indexStore/types.js";
 import type {
+  BaseVectorStore,
  MetadataFilters,
-  VectorStore,
  VectorStoreByType,
  VectorStoreQueryResult,
 } from "../../vector-store/index.js";
@@ -264,7 +264,7 @@ export class VectorStoreIndex extends BaseIndex<IndexDict> {
  }

  static async fromVectorStore(
-    vectorStore: VectorStore,
+    vectorStore: BaseVectorStore,
    serviceContext?: ServiceContext,
  ) {
    return this.fromVectorStores(
@@ -307,7 +307,7 @@ export class VectorStoreIndex extends BaseIndex<IndexDict> {
  protected async insertNodesToStore(
    newIds: string[],
    nodes: BaseNode[],
-    vectorStore: VectorStore,
+    vectorStore: BaseVectorStore,
  ): Promise<void> {
    // NOTE: if the vector store doesn't store text,
    // we need to add the nodes to the index struct and document store
@@ -357,7 +357,7 @@ export class VectorStoreIndex extends BaseIndex<IndexDict> {
  }

  protected async deleteRefDocFromStore(
-    vectorStore: VectorStore,
+    vectorStore: BaseVectorStore,
    refDocId: string,
  ): Promise<void> {
    await vectorStore.delete(refDocId);
@@ -425,7 +425,7 @@ export class VectorIndexRetriever extends BaseRetriever {
    let nodesWithScores: NodeWithScore[] = [];

    for (const type in vectorStores) {
-      const vectorStore: VectorStore = vectorStores[type as ModalityType]!;
+      const vectorStore: BaseVectorStore = vectorStores[type as ModalityType]!;
      nodesWithScores = nodesWithScores.concat(
        await this.retrieveQuery(query, type as ModalityType, vectorStore),
      );
@@ -436,7 +436,7 @@ export class VectorIndexRetriever extends BaseRetriever {
  protected async retrieveQuery(
    query: MessageContent,
    type: ModalityType,
-    vectorStore: VectorStore,
+    vectorStore: BaseVectorStore,
    filters?: MetadataFilters,
  ): Promise<NodeWithScore[]> {
    // convert string message to multi-modal format
@@ -7,7 +7,10 @@ import {
  type Metadata,
 } from "@llamaindex/core/schema";
 import type { BaseDocumentStore } from "../storage/docStore/types.js";
-import type { VectorStore, VectorStoreByType } from "../vector-store/types.js";
+import type {
+  BaseVectorStore,
+  VectorStoreByType,
+} from "../vector-store/types.js";
 import { IngestionCache, getTransformationHash } from "./IngestionCache.js";
 import {
  DocStoreStrategy,
@@ -59,7 +62,7 @@ export class IngestionPipeline {
  transformations: TransformComponent[] = [];
  documents?: Document[] | undefined;
  reader?: BaseReader | undefined;
-  vectorStore?: VectorStore | undefined;
+  vectorStore?: BaseVectorStore | undefined;
  vectorStores?: VectorStoreByType | undefined;
  docStore?: BaseDocumentStore;
  docStoreStrategy: DocStoreStrategy = DocStoreStrategy.UPSERTS;
@@ -133,7 +136,7 @@ export async function addNodesToVectorStores(
  nodesAdded?: (
    newIds: string[],
    nodes: BaseNode<Metadata>[],
-    vectorStore: VectorStore,
+    vectorStore: BaseVectorStore,
  ) => Promise<void>,
 ) {
  const nodeMap = splitNodesByType(nodes);
@@ -1,6 +1,6 @@
 import { BaseNode, TransformComponent } from "@llamaindex/core/schema";
 import type { BaseDocumentStore } from "../../storage/docStore/types.js";
-import type { VectorStore } from "../../vector-store/types.js";
+import type { BaseVectorStore } from "../../vector-store/types.js";
 import { classify } from "./classify.js";

 /**
@@ -9,9 +9,9 @@ import { classify } from "./classify.js";
 */
 export class UpsertsAndDeleteStrategy extends TransformComponent {
  protected docStore: BaseDocumentStore;
-  protected vectorStores: VectorStore[] | undefined;
+  protected vectorStores: BaseVectorStore[] | undefined;

-  constructor(docStore: BaseDocumentStore, vectorStores?: VectorStore[]) {
+  constructor(docStore: BaseDocumentStore, vectorStores?: BaseVectorStore[]) {
    super(async (nodes: BaseNode[]): Promise<BaseNode[]> => {
      const { dedupedNodes, missingDocs, unusedDocs } = await classify(
        this.docStore,
@@ -1,6 +1,6 @@
 import { BaseNode, TransformComponent } from "@llamaindex/core/schema";
 import type { BaseDocumentStore } from "../../storage/docStore/types.js";
-import type { VectorStore } from "../../vector-store/types.js";
+import type { BaseVectorStore } from "../../vector-store/types.js";
 import { classify } from "./classify.js";

 /**
@@ -8,9 +8,9 @@ import { classify } from "./classify.js";
 */
 export class UpsertsStrategy extends TransformComponent {
  protected docStore: BaseDocumentStore;
-  protected vectorStores: VectorStore[] | undefined;
+  protected vectorStores: BaseVectorStore[] | undefined;

-  constructor(docStore: BaseDocumentStore, vectorStores?: VectorStore[]) {
+  constructor(docStore: BaseDocumentStore, vectorStores?: BaseVectorStore[]) {
    super(async (nodes: BaseNode[]): Promise<BaseNode[]> => {
      const { dedupedNodes, unusedDocs } = await classify(this.docStore, nodes);
      // remove unused docs
@@ -1,6 +1,6 @@
 import { TransformComponent } from "@llamaindex/core/schema";
 import type { BaseDocumentStore } from "../../storage/docStore/types.js";
-import type { VectorStore } from "../../vector-store/types.js";
+import type { BaseVectorStore } from "../../vector-store/types.js";
 import { DuplicatesStrategy } from "./DuplicatesStrategy.js";
 import { UpsertsAndDeleteStrategy } from "./UpsertsAndDeleteStrategy.js";
 import { UpsertsStrategy } from "./UpsertsStrategy.js";
@@ -28,7 +28,7 @@ class NoOpStrategy extends TransformComponent {
 export function createDocStoreStrategy(
  docStoreStrategy: DocStoreStrategy,
  docStore?: BaseDocumentStore,
-  vectorStores: VectorStore[] = [],
+  vectorStores: BaseVectorStore[] = [],
 ): TransformComponent {
  if (docStoreStrategy === DocStoreStrategy.NONE) {
    return new NoOpStrategy();
@@ -1,305 +0,0 @@
-type Status = "starting" | "processing" | "succeeded" | "failed" | "canceled";
-type Visibility = "public" | "private";
-type WebhookEventType = "start" | "output" | "logs" | "completed";
-
-export interface ApiError extends Error {
-  request: Request;
-  response: Response;
-}
-
-export interface Account {
-  type: "user" | "organization";
-  username: string;
-  name: string;
-  github_url?: string;
-}
-
-export interface Collection {
-  name: string;
-  slug: string;
-  description: string;
-  models?: Model[];
-}
-
-export interface Deployment {
-  owner: string;
-  name: string;
-  current_release: {
-    number: number;
-    model: string;
-    version: string;
-    created_at: string;
-    created_by: Account;
-    configuration: {
-      hardware: string;
-      min_instances: number;
-      max_instances: number;
-    };
-  };
-}
-
-export interface Hardware {
-  sku: string;
-  name: string;
-}
-
-export interface Model {
-  url: string;
-  owner: string;
-  name: string;
-  description?: string;
-  visibility: "public" | "private";
-  github_url?: string;
-  paper_url?: string;
-  license_url?: string;
-  run_count: number;
-  cover_image_url?: string;
-  default_example?: Prediction;
-  latest_version?: ModelVersion;
-}
-
-export interface ModelVersion {
-  id: string;
-  created_at: string;
-  cog_version: string;
-  openapi_schema: object;
-}
-
-export interface Prediction {
-  id: string;
-  status: Status;
-  model: string;
-  version: string;
-  input: object;
-  output?: any;
-  source: "api" | "web";
-  error?: any;
-  logs?: string;
-  metrics?: {
-    predict_time?: number;
-  };
-  webhook?: string;
-  webhook_events_filter?: WebhookEventType[];
-  created_at: string;
-  started_at?: string;
-  completed_at?: string;
-  urls: {
-    get: string;
-    cancel: string;
-    stream?: string;
-  };
-}
-
-export type Training = Prediction;
-
-export interface Page<T> {
-  previous?: string;
-  next?: string;
-  results: T[];
-}
-
-export interface ServerSentEvent {
-  event: string;
-  data: string;
-  id?: string;
-  retry?: number;
-}
-
-export interface WebhookSecret {
-  key: string;
-}
-
-export default class Replicate {
-  constructor(options?: {
-    auth?: string;
-    userAgent?: string;
-    baseUrl?: string;
-    fetch?: (input: Request | string, init?: RequestInit) => Promise<Response>;
-  });
-
-  auth: string;
-  userAgent?: string;
-  baseUrl?: string;
-  fetch: (input: Request | string, init?: RequestInit) => Promise<Response>;
-
-  run(
-    identifier: `${string}/${string}` | `${string}/${string}:${string}`,
-    options: {
-      input: object;
-      wait?: { interval?: number };
-      webhook?: string;
-      webhook_events_filter?: WebhookEventType[];
-      signal?: AbortSignal;
-    },
-    progress?: (prediction: Prediction) => void,
-  ): Promise<object>;
-
-  stream(
-    identifier: `${string}/${string}` | `${string}/${string}:${string}`,
-    options: {
-      input: object;
-      webhook?: string;
-      webhook_events_filter?: WebhookEventType[];
-      signal?: AbortSignal;
-    },
-  ): AsyncGenerator<ServerSentEvent>;
-
-  request(
-    route: string | URL,
-    options: {
-      method?: string;
-      headers?: object | Headers;
-      params?: object;
-      data?: object;
-    },
-  ): Promise<Response>;
-
-  paginate<T>(endpoint: () => Promise<Page<T>>): AsyncGenerator<[T]>;
-
-  wait(
-    prediction: Prediction,
-    options?: {
-      interval?: number;
-    },
-    stop?: (prediction: Prediction) => Promise<boolean>,
-  ): Promise<Prediction>;
-
-  accounts: {
-    current(): Promise<Account>;
-  };
-
-  collections: {
-    list(): Promise<Page<Collection>>;
-    get(collection_slug: string): Promise<Collection>;
-  };
-
-  deployments: {
-    predictions: {
-      create(
-        deployment_owner: string,
-        deployment_name: string,
-        options: {
-          input: object;
-          stream?: boolean;
-          webhook?: string;
-          webhook_events_filter?: WebhookEventType[];
-        },
-      ): Promise<Prediction>;
-    };
-    get(deployment_owner: string, deployment_name: string): Promise<Deployment>;
-    create(deployment_config: {
-      name: string;
-      model: string;
-      version: string;
-      hardware: string;
-      min_instances: number;
-      max_instances: number;
-    }): Promise<Deployment>;
-    update(
-      deployment_owner: string,
-      deployment_name: string,
-      deployment_config: {
-        version?: string;
-        hardware?: string;
-        min_instances?: number;
-        max_instances?: number;
-      } & (
-        | { version: string }
-        | { hardware: string }
-        | { min_instances: number }
-        | { max_instances: number }
-      ),
-    ): Promise<Deployment>;
-    list(): Promise<Page<Deployment>>;
-  };
-
-  hardware: {
-    list(): Promise<Hardware[]>;
-  };
-
-  models: {
-    get(model_owner: string, model_name: string): Promise<Model>;
-    list(): Promise<Page<Model>>;
-    create(
-      model_owner: string,
-      model_name: string,
-      options: {
-        visibility: Visibility;
-        hardware: string;
-        description?: string;
-        github_url?: string;
-        paper_url?: string;
-        license_url?: string;
-        cover_image_url?: string;
-      },
-    ): Promise<Model>;
-    versions: {
-      list(model_owner: string, model_name: string): Promise<ModelVersion[]>;
-      get(
-        model_owner: string,
-        model_name: string,
-        version_id: string,
-      ): Promise<ModelVersion>;
-    };
-  };
-
-  predictions: {
-    create(
-      options: {
-        model?: string;
-        version?: string;
-        input: object;
-        stream?: boolean;
-        webhook?: string;
-        webhook_events_filter?: WebhookEventType[];
-      } & ({ version: string } | { model: string }),
-    ): Promise<Prediction>;
-    get(prediction_id: string): Promise<Prediction>;
-    cancel(prediction_id: string): Promise<Prediction>;
-    list(): Promise<Page<Prediction>>;
-  };
-
-  trainings: {
-    create(
-      model_owner: string,
-      model_name: string,
-      version_id: string,
-      options: {
-        destination: `${string}/${string}`;
-        input: object;
-        webhook?: string;
-        webhook_events_filter?: WebhookEventType[];
-      },
-    ): Promise<Training>;
-    get(training_id: string): Promise<Training>;
-    cancel(training_id: string): Promise<Training>;
-    list(): Promise<Page<Training>>;
-  };
-
-  webhooks: {
-    default: {
-      secret: {
-        get(): Promise<WebhookSecret>;
-      };
-    };
-  };
-}
-
-export function validateWebhook(
-  requestData:
-    | Request
-    | {
-        id?: string;
-        timestamp?: string;
-        body: string;
-        secret?: string;
-        signature?: string;
-      },
-  secret: string,
-): Promise<boolean>;
-
-export function parseProgressFromLogs(logs: Prediction | string): {
-  percentage: number;
-  current: number;
-  total: number;
-} | null;
@@ -1,201 +0,0 @@
-                                 Apache License
-                           Version 2.0, January 2004
-                        http://www.apache.org/licenses/
-
-TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-1.  Definitions.
-
-    "License" shall mean the terms and conditions for use, reproduction,
-    and distribution as defined by Sections 1 through 9 of this document.
-
-    "Licensor" shall mean the copyright owner or entity authorized by
-    the copyright owner that is granting the License.
-
-    "Legal Entity" shall mean the union of the acting entity and all
-    other entities that control, are controlled by, or are under common
-    control with that entity. For the purposes of this definition,
-    "control" means (i) the power, direct or indirect, to cause the
-    direction or management of such entity, whether by contract or
-    otherwise, or (ii) ownership of fifty percent (50%) or more of the
-    outstanding shares, or (iii) beneficial ownership of such entity.
-
-    "You" (or "Your") shall mean an individual or Legal Entity
-    exercising permissions granted by this License.
-
-    "Source" form shall mean the preferred form for making modifications,
-    including but not limited to software source code, documentation
-    source, and configuration files.
-
-    "Object" form shall mean any form resulting from mechanical
-    transformation or translation of a Source form, including but
-    not limited to compiled object code, generated documentation,
-    and conversions to other media types.
-
-    "Work" shall mean the work of authorship, whether in Source or
-    Object form, made available under the License, as indicated by a
-    copyright notice that is included in or attached to the work
-    (an example is provided in the Appendix below).
-
-    "Derivative Works" shall mean any work, whether in Source or Object
-    form, that is based on (or derived from) the Work and for which the
-    editorial revisions, annotations, elaborations, or other modifications
-    represent, as a whole, an original work of authorship. For the purposes
-    of this License, Derivative Works shall not include works that remain
-    separable from, or merely link (or bind by name) to the interfaces of,
-    the Work and Derivative Works thereof.
-
-    "Contribution" shall mean any work of authorship, including
-    the original version of the Work and any modifications or additions
-    to that Work or Derivative Works thereof, that is intentionally
-    submitted to Licensor for inclusion in the Work by the copyright owner
-    or by an individual or Legal Entity authorized to submit on behalf of
-    the copyright owner. For the purposes of this definition, "submitted"
-    means any form of electronic, verbal, or written communication sent
-    to the Licensor or its representatives, including but not limited to
-    communication on electronic mailing lists, source code control systems,
-    and issue tracking systems that are managed by, or on behalf of, the
-    Licensor for the purpose of discussing and improving the Work, but
-    excluding communication that is conspicuously marked or otherwise
-    designated in writing by the copyright owner as "Not a Contribution."
-
-    "Contributor" shall mean Licensor and any individual or Legal Entity
-    on behalf of whom a Contribution has been received by Licensor and
-    subsequently incorporated within the Work.
-
-2.  Grant of Copyright License. Subject to the terms and conditions of
-    this License, each Contributor hereby grants to You a perpetual,
-    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-    copyright license to reproduce, prepare Derivative Works of,
-    publicly display, publicly perform, sublicense, and distribute the
-    Work and such Derivative Works in Source or Object form.
-
-3.  Grant of Patent License. Subject to the terms and conditions of
-    this License, each Contributor hereby grants to You a perpetual,
-    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-    (except as stated in this section) patent license to make, have made,
-    use, offer to sell, sell, import, and otherwise transfer the Work,
-    where such license applies only to those patent claims licensable
-    by such Contributor that are necessarily infringed by their
-    Contribution(s) alone or by combination of their Contribution(s)
-    with the Work to which such Contribution(s) was submitted. If You
-    institute patent litigation against any entity (including a
-    cross-claim or counterclaim in a lawsuit) alleging that the Work
-    or a Contribution incorporated within the Work constitutes direct
-    or contributory patent infringement, then any patent licenses
-    granted to You under this License for that Work shall terminate
-    as of the date such litigation is filed.
-
-4.  Redistribution. You may reproduce and distribute copies of the
-    Work or Derivative Works thereof in any medium, with or without
-    modifications, and in Source or Object form, provided that You
-    meet the following conditions:
-
-    (a) You must give any other recipients of the Work or
-    Derivative Works a copy of this License; and
-
-    (b) You must cause any modified files to carry prominent notices
-    stating that You changed the files; and
-
-    (c) You must retain, in the Source form of any Derivative Works
-    that You distribute, all copyright, patent, trademark, and
-    attribution notices from the Source form of the Work,
-    excluding those notices that do not pertain to any part of
-    the Derivative Works; and
-
-    (d) If the Work includes a "NOTICE" text file as part of its
-    distribution, then any Derivative Works that You distribute must
-    include a readable copy of the attribution notices contained
-    within such NOTICE file, excluding those notices that do not
-    pertain to any part of the Derivative Works, in at least one
-    of the following places: within a NOTICE text file distributed
-    as part of the Derivative Works; within the Source form or
-    documentation, if provided along with the Derivative Works; or,
-    within a display generated by the Derivative Works, if and
-    wherever such third-party notices normally appear. The contents
-    of the NOTICE file are for informational purposes only and
-    do not modify the License. You may add Your own attribution
-    notices within Derivative Works that You distribute, alongside
-    or as an addendum to the NOTICE text from the Work, provided
-    that such additional attribution notices cannot be construed
-    as modifying the License.
-
-    You may add Your own copyright statement to Your modifications and
-    may provide additional or different license terms and conditions
-    for use, reproduction, or distribution of Your modifications, or
-    for any such Derivative Works as a whole, provided Your use,
-    reproduction, and distribution of the Work otherwise complies with
-    the conditions stated in this License.
-
-5.  Submission of Contributions. Unless You explicitly state otherwise,
-    any Contribution intentionally submitted for inclusion in the Work
-    by You to the Licensor shall be under the terms and conditions of
-    this License, without any additional terms or conditions.
-    Notwithstanding the above, nothing herein shall supersede or modify
-    the terms of any separate license agreement you may have executed
-    with Licensor regarding such Contributions.
-
-6.  Trademarks. This License does not grant permission to use the trade
-    names, trademarks, service marks, or product names of the Licensor,
-    except as required for reasonable and customary use in describing the
-    origin of the Work and reproducing the content of the NOTICE file.
-
-7.  Disclaimer of Warranty. Unless required by applicable law or
-    agreed to in writing, Licensor provides the Work (and each
-    Contributor provides its Contributions) on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-    implied, including, without limitation, any warranties or conditions
-    of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-    PARTICULAR PURPOSE. You are solely responsible for determining the
-    appropriateness of using or redistributing the Work and assume any
-    risks associated with Your exercise of permissions under this License.
-
-8.  Limitation of Liability. In no event and under no legal theory,
-    whether in tort (including negligence), contract, or otherwise,
-    unless required by applicable law (such as deliberate and grossly
-    negligent acts) or agreed to in writing, shall any Contributor be
-    liable to You for damages, including any direct, indirect, special,
-    incidental, or consequential damages of any character arising as a
-    result of this License or out of the use or inability to use the
-    Work (including but not limited to damages for loss of goodwill,
-    work stoppage, computer failure or malfunction, or any and all
-    other commercial damages or losses), even if such Contributor
-    has been advised of the possibility of such damages.
-
-9.  Accepting Warranty or Additional Liability. While redistributing
-    the Work or Derivative Works thereof, You may choose to offer,
-    and charge a fee for, acceptance of support, warranty, indemnity,
-    or other liability obligations and/or rights consistent with this
-    License. However, in accepting such obligations, You may act only
-    on Your own behalf and on Your sole responsibility, not on behalf
-    of any other Contributor, and only if You agree to indemnify,
-    defend, and hold each Contributor harmless for any liability
-    incurred by, or claims asserted against, such Contributor by reason
-    of your accepting any such warranty or additional liability.
-
-END OF TERMS AND CONDITIONS
-
-APPENDIX: How to apply the Apache License to your work.
-
-      To apply the Apache License to your work, attach the following
-      boilerplate notice, with the fields enclosed by brackets "[]"
-      replaced with your own identifying information. (Don't include
-      the brackets!)  The text should be enclosed in the appropriate
-      comment syntax for the file format. We also recommend that a
-      file or class name and description of purpose be included on the
-      same "printed page" as the copyright notice for easier
-      identification within third-party archives.
-
-Copyright 2023 Replicate, Inc.
-
-Licensed under the Apache License, Version 2.0 (the "License");
-you may not use this file except in compliance with the License.
-You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-Unless required by applicable law or agreed to in writing, software
-distributed under the License is distributed on an "AS IS" BASIS,
-WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-See the License for the specific language governing permissions and
-limitations under the License.
@@ -1,8 +0,0 @@
-export async function getImageEmbedModel() {
-  if (globalThis.navigator?.userAgent === "Cloudflare-Workers") {
-    return (await import("../../embeddings/CloudflareWorkerEmbedding.js"))
-      .CloudflareWorkerMultiModalEmbedding;
-  } else {
-    return (await import("../../embeddings/ClipEmbedding.js")).ClipEmbedding;
-  }
-}
@@ -1,462 +1 @@
-import type { ClientOptions } from "@anthropic-ai/sdk";
-import { Anthropic as SDKAnthropic } from "@anthropic-ai/sdk";
-import type {
-  TextBlock,
-  TextBlockParam,
-} from "@anthropic-ai/sdk/resources/index";
-import type {
-  ImageBlockParam,
-  MessageCreateParamsNonStreaming,
-  MessageParam,
-  Tool,
-  ToolResultBlockParam,
-  ToolUseBlock,
-  ToolUseBlockParam,
-} from "@anthropic-ai/sdk/resources/messages";
-import { wrapLLMEvent } from "@llamaindex/core/decorator";
-import type {
-  BaseTool,
-  ChatMessage,
-  ChatResponse,
-  ChatResponseChunk,
-  LLMChatParamsNonStreaming,
-  LLMChatParamsStreaming,
-  ToolCallLLMMessageOptions,
-} from "@llamaindex/core/llms";
-import { ToolCallLLM } from "@llamaindex/core/llms";
-import { extractText } from "@llamaindex/core/utils";
-import { getEnv } from "@llamaindex/env";
-import _ from "lodash";
-
-export class AnthropicSession {
-  anthropic: SDKAnthropic;
-
-  constructor(options: ClientOptions = {}) {
-    if (!options.apiKey) {
-      options.apiKey = getEnv("ANTHROPIC_API_KEY");
-    }
-
-    if (!options.apiKey) {
-      throw new Error("Set Anthropic Key in ANTHROPIC_API_KEY env variable");
-    }
-
-    this.anthropic = new SDKAnthropic(options);
-  }
-}
-
-// I'm not 100% sure this is necessary vs. just starting a new session
-// every time we make a call. They say they try to reuse connections
-// so in theory this is more efficient, but we should test it in the future.
-const defaultAnthropicSession: {
-  session: AnthropicSession;
-  options: ClientOptions;
-}[] = [];
-
-/**
- * Get a session for the Anthropic API. If one already exists with the same options,
- * it will be returned. Otherwise, a new session will be created.
- * @param options
- * @returns
- */
-export function getAnthropicSession(options: ClientOptions = {}) {
-  let session = defaultAnthropicSession.find((session) => {
-    return _.isEqual(session.options, options);
-  })?.session;
-
-  if (!session) {
-    session = new AnthropicSession(options);
-    defaultAnthropicSession.push({ session, options });
-  }
-
-  return session;
-}
-
-export const ALL_AVAILABLE_ANTHROPIC_LEGACY_MODELS = {
-  "claude-2.1": {
-    contextWindow: 200000,
-  },
-  "claude-instant-1.2": {
-    contextWindow: 100000,
-  },
-};
-
-export const ALL_AVAILABLE_V3_MODELS = {
-  "claude-3-opus": { contextWindow: 200000 },
-  "claude-3-sonnet": { contextWindow: 200000 },
-  "claude-3-haiku": { contextWindow: 200000 },
-};
-
-export const ALL_AVAILABLE_V3_5_MODELS = {
-  "claude-3-5-sonnet": { contextWindow: 200000 },
-};
-
-export const ALL_AVAILABLE_ANTHROPIC_MODELS = {
-  ...ALL_AVAILABLE_ANTHROPIC_LEGACY_MODELS,
-  ...ALL_AVAILABLE_V3_MODELS,
-  ...ALL_AVAILABLE_V3_5_MODELS,
-};
-
-const AVAILABLE_ANTHROPIC_MODELS_WITHOUT_DATE: { [key: string]: string } = {
-  "claude-3-opus": "claude-3-opus-20240229",
-  "claude-3-sonnet": "claude-3-sonnet-20240229",
-  "claude-3-haiku": "claude-3-haiku-20240307",
-  "claude-3-5-sonnet": "claude-3-5-sonnet-20240620",
-} as { [key in keyof typeof ALL_AVAILABLE_ANTHROPIC_MODELS]: string };
-
-export type AnthropicAdditionalChatOptions = {};
-
-export class Anthropic extends ToolCallLLM<AnthropicAdditionalChatOptions> {
-  // Per completion Anthropic params
-  model: keyof typeof ALL_AVAILABLE_ANTHROPIC_MODELS;
-  temperature: number;
-  topP: number;
-  maxTokens?: number | undefined;
-
-  // Anthropic session params
-  apiKey?: string | undefined;
-  maxRetries: number;
-  timeout?: number;
-  session: AnthropicSession;
-
-  constructor(init?: Partial<Anthropic>) {
-    super();
-    this.model = init?.model ?? "claude-3-opus";
-    this.temperature = init?.temperature ?? 0.1;
-    this.topP = init?.topP ?? 0.999; // Per Ben Mann
-    this.maxTokens = init?.maxTokens ?? undefined;
-
-    this.apiKey = init?.apiKey ?? undefined;
-    this.maxRetries = init?.maxRetries ?? 10;
-    this.timeout = init?.timeout ?? 60 * 1000; // Default is 60 seconds
-    this.session =
-      init?.session ??
-      getAnthropicSession({
-        apiKey: this.apiKey,
-        maxRetries: this.maxRetries,
-        timeout: this.timeout,
-      });
-  }
-
-  get supportToolCall() {
-    return this.model.startsWith("claude-3");
-  }
-
-  get metadata() {
-    return {
-      model: this.model,
-      temperature: this.temperature,
-      topP: this.topP,
-      maxTokens: this.maxTokens,
-      contextWindow: ALL_AVAILABLE_ANTHROPIC_MODELS[this.model].contextWindow,
-      tokenizer: undefined,
-    };
-  }
-
-  getModelName = (model: string): string => {
-    if (Object.keys(AVAILABLE_ANTHROPIC_MODELS_WITHOUT_DATE).includes(model)) {
-      return AVAILABLE_ANTHROPIC_MODELS_WITHOUT_DATE[model]!;
-    }
-    return model;
-  };
-
-  formatMessages(
-    messages: ChatMessage<ToolCallLLMMessageOptions>[],
-  ): MessageParam[] {
-    const result: MessageParam[] = messages
-      .filter(
-        (message) => message.role === "user" || message.role === "assistant",
-      )
-      .map((message) => {
-        const options = message.options ?? {};
-        if ("toolResult" in options) {
-          const { id, isError } = options.toolResult;
-          return {
-            role: "user",
-            content: [
-              {
-                type: "tool_result",
-                is_error: isError,
-                content: [
-                  {
-                    type: "text",
-                    text: extractText(message.content),
-                  },
-                ],
-                tool_use_id: id,
-              },
-            ] satisfies ToolResultBlockParam[],
-          } satisfies MessageParam;
-        } else if ("toolCall" in options) {
-          const aiThinkingText = extractText(message.content);
-          return {
-            role: "assistant",
-            content: [
-              // this could be empty when you call two tools in one query
-              ...(aiThinkingText.trim()
-                ? [
-                    {
-                      type: "text",
-                      text: aiThinkingText,
-                    } satisfies TextBlockParam,
-                  ]
-                : []),
-              ...options.toolCall.map(
-                (toolCall) =>
-                  ({
-                    type: "tool_use",
-                    id: toolCall.id,
-                    name: toolCall.name,
-                    input: toolCall.input,
-                  }) satisfies ToolUseBlockParam,
-              ),
-            ],
-          } satisfies MessageParam;
-        }
-
-        return {
-          content:
-            typeof message.content === "string"
-              ? message.content
-              : message.content.map(
-                  (content): TextBlockParam | ImageBlockParam =>
-                    content.type === "text"
-                      ? {
-                          type: "text",
-                          text: content.text,
-                        }
-                      : {
-                          type: "image",
-                          source: {
-                            data: content.image_url.url.substring(
-                              content.image_url.url.indexOf(",") + 1,
-                            ),
-                            media_type:
-                              `image/${content.image_url.url.substring("data:image/".length, content.image_url.url.indexOf(";base64"))}` as
-                                | "image/jpeg"
-                                | "image/png"
-                                | "image/gif"
-                                | "image/webp",
-                            type: "base64",
-                          },
-                        },
-                ),
-          role: message.role as "user" | "assistant",
-        } satisfies MessageParam;
-      });
-    // merge messages with the same role
-    // in case of 'messages: roles must alternate between "user" and "assistant", but found multiple "user" roles in a row'
-    const realResult: MessageParam[] = [];
-    for (let i = 0; i < result.length; i++) {
-      if (i === 0) {
-        realResult.push(result[i]!);
-        continue;
-      }
-      const current = result[i]!;
-      const previous = result[i - 1]!;
-      if (current.role === previous.role) {
-        // merge two messages with the same role
-        if (Array.isArray(previous.content)) {
-          if (Array.isArray(current.content)) {
-            previous.content.push(...current.content);
-          } else {
-            previous.content.push({
-              type: "text",
-              text: current.content,
-            });
-          }
-        } else {
-          if (Array.isArray(current.content)) {
-            previous.content = [
-              {
-                type: "text",
-                text: previous.content,
-              },
-              ...current.content,
-            ];
-          } else {
-            previous.content += `\n${current.content}`;
-          }
-        }
-        // no need to push the message
-      }
-      // if the roles are different, just push the message
-      else {
-        realResult.push(current);
-      }
-    }
-
-    return realResult;
-  }
-
-  chat(
-    params: LLMChatParamsStreaming<
-      AnthropicAdditionalChatOptions,
-      ToolCallLLMMessageOptions
-    >,
-  ): Promise<AsyncIterable<ChatResponseChunk<ToolCallLLMMessageOptions>>>;
-  chat(
-    params: LLMChatParamsNonStreaming<
-      AnthropicAdditionalChatOptions,
-      ToolCallLLMMessageOptions
-    >,
-  ): Promise<ChatResponse<ToolCallLLMMessageOptions>>;
-  @wrapLLMEvent
-  async chat(
-    params:
-      | LLMChatParamsNonStreaming<
-          AnthropicAdditionalChatOptions,
-          ToolCallLLMMessageOptions
-        >
-      | LLMChatParamsStreaming<
-          AnthropicAdditionalChatOptions,
-          ToolCallLLMMessageOptions
-        >,
-  ): Promise<
-    | ChatResponse<ToolCallLLMMessageOptions>
-    | AsyncIterable<ChatResponseChunk<ToolCallLLMMessageOptions>>
-  > {
-    let { messages } = params;
-
-    const { stream, tools } = params;
-
-    let systemPrompt: string | null = null;
-
-    const systemMessages = messages.filter(
-      (message) => message.role === "system",
-    );
-
-    if (systemMessages.length > 0) {
-      systemPrompt = systemMessages
-        .map((message) => message.content)
-        .join("\n");
-      messages = messages.filter((message) => message.role !== "system");
-    }
-
-    // case: Streaming
-    if (stream) {
-      if (tools) {
-        console.error("Tools are not supported in streaming mode");
-      }
-      return this.streamChat(messages, systemPrompt);
-    }
-    // case: Non-streaming
-    const anthropic = this.session.anthropic;
-
-    if (tools) {
-      const params: MessageCreateParamsNonStreaming = {
-        messages: this.formatMessages(messages),
-        tools: tools.map(Anthropic.toTool),
-        model: this.getModelName(this.model),
-        temperature: this.temperature,
-        max_tokens: this.maxTokens ?? 4096,
-        top_p: this.topP,
-        ...(systemPrompt && { system: systemPrompt }),
-      };
-      // Remove tools if there are none, as it will cause an error
-      if (tools.length === 0) {
-        delete params.tools;
-      }
-      const response = await anthropic.messages.create(params);
-
-      const toolUseBlock = response.content.filter(
-        (content): content is ToolUseBlock => content.type === "tool_use",
-      );
-
-      return {
-        raw: response,
-        message: {
-          content: response.content
-            .filter((content): content is TextBlock => content.type === "text")
-            .map((content) => ({
-              type: "text",
-              text: content.text,
-            })),
-          role: "assistant",
-          options:
-            toolUseBlock.length > 0
-              ? {
-                  toolCall: toolUseBlock.map((block) => ({
-                    id: block.id,
-                    name: block.name,
-                    input: block.input,
-                  })),
-                }
-              : {},
-        },
-      };
-    } else {
-      const response = await anthropic.messages.create({
-        model: this.getModelName(this.model),
-        messages: this.formatMessages(messages),
-        max_tokens: this.maxTokens ?? 4096,
-        temperature: this.temperature,
-        top_p: this.topP,
-        ...(systemPrompt && { system: systemPrompt }),
-      });
-
-      return {
-        raw: response,
-        message: {
-          content: response.content
-            .filter((content): content is TextBlock => content.type === "text")
-            .map((content) => ({
-              type: "text",
-              text: content.text,
-            })),
-          role: "assistant",
-          options: {},
-        },
-      };
-    }
-  }
-
-  protected async *streamChat(
-    messages: ChatMessage<ToolCallLLMMessageOptions>[],
-    systemPrompt?: string | null,
-  ): AsyncIterable<ChatResponseChunk<ToolCallLLMMessageOptions>> {
-    const stream = await this.session.anthropic.messages.create({
-      model: this.getModelName(this.model),
-      messages: this.formatMessages(messages),
-      max_tokens: this.maxTokens ?? 4096,
-      temperature: this.temperature,
-      top_p: this.topP,
-      stream: true,
-      ...(systemPrompt && { system: systemPrompt }),
-    });
-
-    let idx_counter: number = 0;
-    for await (const part of stream) {
-      const content =
-        part.type === "content_block_delta"
-          ? part.delta.type === "text_delta"
-            ? part.delta.text
-            : part.delta
-          : undefined;
-
-      if (typeof content !== "string") continue;
-
-      idx_counter++;
-      yield {
-        raw: part,
-        delta: content,
-        options: {},
-      };
-    }
-    return;
-  }
-
-  static toTool(tool: BaseTool): Tool {
-    if (tool.metadata.parameters?.type !== "object") {
-      throw new TypeError("Tool parameters must be an object");
-    }
-    return {
-      input_schema: {
-        type: "object",
-        properties: tool.metadata.parameters.properties,
-        required: tool.metadata.parameters.required,
-      },
-      name: tool.metadata.name,
-      description: tool.metadata.description,
-    };
-  }
-}
+export * from "@llamaindex/anthropic";
@@ -1,33 +1 @@
-import { getEnv } from "@llamaindex/env";
-import { OpenAI } from "@llamaindex/openai";
-
-const ENV_VARIABLE_NAME = "DEEPINFRA_API_TOKEN";
-const DEFAULT_MODEL = "mistralai/Mixtral-8x22B-Instruct-v0.1";
-const BASE_URL = "https://api.deepinfra.com/v1/openai";
-
-export class DeepInfra extends OpenAI {
-  constructor(init?: Omit<Partial<OpenAI>, "session">) {
-    const {
-      apiKey = getEnv(ENV_VARIABLE_NAME),
-      additionalSessionOptions = {},
-      model = DEFAULT_MODEL,
-      ...rest
-    } = init ?? {};
-
-    if (!apiKey) {
-      throw new Error(
-        `Set DeepInfra API key in ${ENV_VARIABLE_NAME} env variable`,
-      );
-    }
-
-    additionalSessionOptions.baseURL =
-      additionalSessionOptions.baseURL ?? BASE_URL;
-
-    super({
-      apiKey,
-      additionalSessionOptions,
-      model,
-      ...rest,
-    });
-  }
-}
+export * from "@llamaindex/deepinfra";
@@ -44,12 +44,15 @@ import {
 export const GEMINI_MODEL_INFO_MAP: Record<GEMINI_MODEL, GeminiModelInfo> = {
  [GEMINI_MODEL.GEMINI_PRO]: { contextWindow: 30720 },
  [GEMINI_MODEL.GEMINI_PRO_VISION]: { contextWindow: 12288 },
-  [GEMINI_MODEL.GEMINI_PRO_LATEST]: { contextWindow: 10 ** 6 },
  // multi-modal/multi turn
+  [GEMINI_MODEL.GEMINI_PRO_LATEST]: { contextWindow: 10 ** 6 },
+  [GEMINI_MODEL.GEMINI_PRO_FLASH_LATEST]: { contextWindow: 10 ** 6 },
  [GEMINI_MODEL.GEMINI_PRO_1_5_PRO_PREVIEW]: { contextWindow: 10 ** 6 },
  [GEMINI_MODEL.GEMINI_PRO_1_5_FLASH_PREVIEW]: { contextWindow: 10 ** 6 },
  [GEMINI_MODEL.GEMINI_PRO_1_5]: { contextWindow: 2 * 10 ** 6 },
  [GEMINI_MODEL.GEMINI_PRO_1_5_FLASH]: { contextWindow: 10 ** 6 },
+  [GEMINI_MODEL.GEMINI_PRO_1_5_LATEST]: { contextWindow: 2 * 10 ** 6 },
+  [GEMINI_MODEL.GEMINI_PRO_1_5_FLASH_LATEST]: { contextWindow: 10 ** 6 },
 };

 const SUPPORT_TOOL_CALL_MODELS: GEMINI_MODEL[] = [
@@ -59,6 +62,10 @@ const SUPPORT_TOOL_CALL_MODELS: GEMINI_MODEL[] = [
  GEMINI_MODEL.GEMINI_PRO_1_5_FLASH_PREVIEW,
  GEMINI_MODEL.GEMINI_PRO_1_5,
  GEMINI_MODEL.GEMINI_PRO_1_5_FLASH,
+  GEMINI_MODEL.GEMINI_PRO_LATEST,
+  GEMINI_MODEL.GEMINI_PRO_FLASH_LATEST,
+  GEMINI_MODEL.GEMINI_PRO_1_5_LATEST,
+  GEMINI_MODEL.GEMINI_PRO_1_5_FLASH_LATEST,
 ];

 const DEFAULT_GEMINI_PARAMS = {
@@ -56,10 +56,14 @@ export enum GEMINI_MODEL {
  GEMINI_PRO = "gemini-pro",
  GEMINI_PRO_VISION = "gemini-pro-vision",
  GEMINI_PRO_LATEST = "gemini-1.5-pro-latest",
+  GEMINI_PRO_FLASH_LATEST = "gemini-1.5-flash-latest",
  GEMINI_PRO_1_5_PRO_PREVIEW = "gemini-1.5-pro-preview-0514",
  GEMINI_PRO_1_5_FLASH_PREVIEW = "gemini-1.5-flash-preview-0514",
  GEMINI_PRO_1_5 = "gemini-1.5-pro-001",
  GEMINI_PRO_1_5_FLASH = "gemini-1.5-flash-001",
+  // Note: should be switched to -latest suffix when google supports it
+  GEMINI_PRO_1_5_LATEST = "gemini-1.5-pro-002",
+  GEMINI_PRO_1_5_FLASH_LATEST = "gemini-1.5-flash-002",
 }

 export interface GeminiModelInfo {
@@ -1,313 +1 @@
-import { HfInference } from "@huggingface/inference";
-import { wrapLLMEvent } from "@llamaindex/core/decorator";
-import "@llamaindex/core/llms";
-import {
-  BaseLLM,
-  type ChatMessage,
-  type ChatResponse,
-  type ChatResponseChunk,
-  type LLMChatParamsNonStreaming,
-  type LLMChatParamsStreaming,
-  type LLMMetadata,
-  type ToolCallLLMMessageOptions,
-} from "@llamaindex/core/llms";
-import { streamConverter } from "@llamaindex/core/utils";
-import { loadTransformers } from "@llamaindex/env";
-import type {
-  PreTrainedModel,
-  PreTrainedTokenizer,
-  Tensor,
-} from "@xenova/transformers";
-import { Settings } from "../Settings.js";
-
-// TODO workaround issue with @huggingface/inference@2.7.0
-interface HfInferenceOptions {
-  /**
-   * (Default: true) Boolean. If a request 503s and wait_for_model is set to false, the request will be retried with the same parameters but with wait_for_model set to true.
-   */
-  retry_on_error?: boolean;
-  /**
-   * (Default: true). Boolean. There is a cache layer on Inference API (serverless) to speedup requests we have already seen. Most models can use those results as is as models are deterministic (meaning the results will be the same anyway). However if you use a non deterministic model, you can set this parameter to prevent the caching mechanism from being used resulting in a real new query.
-   */
-  use_cache?: boolean;
-  /**
-   * (Default: false). Boolean. Do not load the model if it's not already available.
-   */
-  dont_load_model?: boolean;
-  /**
-   * (Default: false). Boolean to use GPU instead of CPU for inference (requires Startup plan at least).
-   */
-  use_gpu?: boolean;
-  /**
-   * (Default: false) Boolean. If the model is not ready, wait for it instead of receiving 503. It limits the number of requests required to get your inference done. It is advised to only set this flag to true after receiving a 503 error as it will limit hanging in your application to known places.
-   */
-  wait_for_model?: boolean;
-  /**
-   * Custom fetch function to use instead of the default one, for example to use a proxy or edit headers.
-   */
-  fetch?: typeof fetch;
-  /**
-   * Abort Controller signal to use for request interruption.
-   */
-  signal?: AbortSignal;
-  /**
-   * (Default: "same-origin"). String | Boolean. Credentials to use for the request. If this is a string, it will be passed straight on. If it's a boolean, true will be "include" and false will not send credentials at all.
-   */
-  includeCredentials?: string | boolean;
-}
-
-const DEFAULT_PARAMS = {
-  temperature: 0.1,
-  topP: 1,
-  maxTokens: undefined,
-  contextWindow: 3900,
-};
-
-export type HFConfig = Partial<typeof DEFAULT_PARAMS> &
-  HfInferenceOptions & {
-    model: string;
-    accessToken: string;
-    endpoint?: string;
-  };
-
-/**
-    Wrapper on the Hugging Face's Inference API.
-    API Docs: https://huggingface.co/docs/huggingface.js/inference/README
-    List of tasks with models: huggingface.co/api/tasks 
-    
-    Note that Conversational API is not yet supported by the Inference API.
-    They recommend using the text generation API instead.
-    See: https://github.com/huggingface/huggingface.js/issues/586#issuecomment-2024059308
- */
-export class HuggingFaceInferenceAPI extends BaseLLM {
-  model: string;
-  temperature: number;
-  topP: number;
-  maxTokens?: number | undefined;
-  contextWindow: number;
-  hf: HfInference;
-
-  constructor(init: HFConfig) {
-    super();
-    const {
-      model,
-      temperature,
-      topP,
-      maxTokens,
-      contextWindow,
-      accessToken,
-      endpoint,
-      ...hfInferenceOpts
-    } = init;
-    this.hf = new HfInference(accessToken, hfInferenceOpts);
-    this.model = model;
-    this.temperature = temperature ?? DEFAULT_PARAMS.temperature;
-    this.topP = topP ?? DEFAULT_PARAMS.topP;
-    this.maxTokens = maxTokens ?? DEFAULT_PARAMS.maxTokens;
-    this.contextWindow = contextWindow ?? DEFAULT_PARAMS.contextWindow;
-    if (endpoint) this.hf.endpoint(endpoint);
-  }
-
-  get metadata(): LLMMetadata {
-    return {
-      model: this.model,
-      temperature: this.temperature,
-      topP: this.topP,
-      maxTokens: this.maxTokens,
-      contextWindow: this.contextWindow,
-      tokenizer: undefined,
-    };
-  }
-
-  chat(
-    params: LLMChatParamsStreaming,
-  ): Promise<AsyncIterable<ChatResponseChunk>>;
-  chat(params: LLMChatParamsNonStreaming): Promise<ChatResponse>;
-  @wrapLLMEvent
-  async chat(
-    params: LLMChatParamsStreaming | LLMChatParamsNonStreaming,
-  ): Promise<AsyncIterable<ChatResponseChunk> | ChatResponse<object>> {
-    if (params.stream) return this.streamChat(params);
-    return this.nonStreamChat(params);
-  }
-
-  private messagesToPrompt(messages: ChatMessage<ToolCallLLMMessageOptions>[]) {
-    let prompt = "";
-    for (const message of messages) {
-      if (message.role === "system") {
-        prompt += `<|system|>\n${message.content}</s>\n`;
-      } else if (message.role === "user") {
-        prompt += `<|user|>\n${message.content}</s>\n`;
-      } else if (message.role === "assistant") {
-        prompt += `<|assistant|>\n${message.content}</s>\n`;
-      }
-    }
-    // ensure we start with a system prompt, insert blank if needed
-    if (!prompt.startsWith("<|system|>\n")) {
-      prompt = "<|system|>\n</s>\n" + prompt;
-    }
-    // add final assistant prompt
-    prompt = prompt + "<|assistant|>\n";
-    return prompt;
-  }
-
-  protected async nonStreamChat(
-    params: LLMChatParamsNonStreaming,
-  ): Promise<ChatResponse> {
-    const res = await this.hf.textGeneration({
-      model: this.model,
-      inputs: this.messagesToPrompt(params.messages),
-      parameters: this.metadata,
-    });
-    return {
-      raw: res,
-      message: {
-        content: res.generated_text,
-        role: "assistant",
-      },
-    };
-  }
-
-  protected async *streamChat(
-    params: LLMChatParamsStreaming,
-  ): AsyncIterable<ChatResponseChunk> {
-    const stream = this.hf.textGenerationStream({
-      model: this.model,
-      inputs: this.messagesToPrompt(params.messages),
-      parameters: this.metadata,
-    });
-    yield* streamConverter(stream, (chunk: any) => ({
-      delta: chunk.token.text,
-      raw: chunk,
-    }));
-  }
-}
-
-const DEFAULT_HUGGINGFACE_MODEL = "stabilityai/stablelm-tuned-alpha-3b";
-
-export interface HFLLMConfig {
-  modelName?: string;
-  tokenizerName?: string;
-  temperature?: number;
-  topP?: number;
-  maxTokens?: number;
-  contextWindow?: number;
-}
-
-export class HuggingFaceLLM extends BaseLLM {
-  modelName: string;
-  tokenizerName: string;
-  temperature: number;
-  topP: number;
-  maxTokens?: number | undefined;
-  contextWindow: number;
-
-  private tokenizer: PreTrainedTokenizer | null = null;
-  private model: PreTrainedModel | null = null;
-
-  constructor(init?: HFLLMConfig) {
-    super();
-    this.modelName = init?.modelName ?? DEFAULT_HUGGINGFACE_MODEL;
-    this.tokenizerName = init?.tokenizerName ?? DEFAULT_HUGGINGFACE_MODEL;
-    this.temperature = init?.temperature ?? DEFAULT_PARAMS.temperature;
-    this.topP = init?.topP ?? DEFAULT_PARAMS.topP;
-    this.maxTokens = init?.maxTokens ?? DEFAULT_PARAMS.maxTokens;
-    this.contextWindow = init?.contextWindow ?? DEFAULT_PARAMS.contextWindow;
-  }
-
-  get metadata(): LLMMetadata {
-    return {
-      model: this.modelName,
-      temperature: this.temperature,
-      topP: this.topP,
-      maxTokens: this.maxTokens,
-      contextWindow: this.contextWindow,
-      tokenizer: undefined,
-    };
-  }
-
-  async getTokenizer() {
-    const { AutoTokenizer } = await loadTransformers((transformer) => {
-      Settings.callbackManager.dispatchEvent(
-        "load-transformers",
-        {
-          transformer,
-        },
-        true,
-      );
-    });
-    if (!this.tokenizer) {
-      this.tokenizer = await AutoTokenizer.from_pretrained(this.tokenizerName);
-    }
-    return this.tokenizer;
-  }
-
-  async getModel() {
-    const { AutoModelForCausalLM } = await loadTransformers((transformer) => {
-      Settings.callbackManager.dispatchEvent(
-        "load-transformers",
-        {
-          transformer,
-        },
-        true,
-      );
-    });
-    if (!this.model) {
-      this.model = await AutoModelForCausalLM.from_pretrained(this.modelName);
-    }
-    return this.model;
-  }
-
-  chat(
-    params: LLMChatParamsStreaming,
-  ): Promise<AsyncIterable<ChatResponseChunk>>;
-  chat(params: LLMChatParamsNonStreaming): Promise<ChatResponse>;
-  @wrapLLMEvent
-  async chat(
-    params: LLMChatParamsStreaming | LLMChatParamsNonStreaming,
-  ): Promise<AsyncIterable<ChatResponseChunk> | ChatResponse<object>> {
-    if (params.stream) return this.streamChat(params);
-    return this.nonStreamChat(params);
-  }
-
-  protected async nonStreamChat(
-    params: LLMChatParamsNonStreaming,
-  ): Promise<ChatResponse> {
-    const tokenizer = await this.getTokenizer();
-    const model = await this.getModel();
-
-    const messageInputs = params.messages.map((msg) => ({
-      role: msg.role,
-      content: msg.content as string,
-    }));
-    const inputs = tokenizer.apply_chat_template(messageInputs, {
-      add_generation_prompt: true,
-      ...this.metadata,
-    }) as Tensor;
-
-    // TODO: the input for model.generate should be updated when using @xenova/transformers v3
-    // We should add `stopping_criteria` also when it's supported in v3
-    // See: https://github.com/xenova/transformers.js/blob/3260640b192b3e06a10a1f4dc004b1254fdf1b80/src/models.js#L1248C9-L1248C27
-    const outputs = await model.generate(inputs, this.metadata);
-    const outputText = tokenizer.batch_decode(outputs, {
-      skip_special_tokens: false,
-    });
-
-    return {
-      raw: outputs,
-      message: {
-        content: outputText.join(""),
-        role: "assistant",
-      },
-    };
-  }
-
-  protected async *streamChat(
-    params: LLMChatParamsStreaming,
-  ): AsyncIterable<ChatResponseChunk> {
-    // @xenova/transformers v2 doesn't support streaming generation yet
-    // they are working on it in v3
-    // See: https://github.com/xenova/transformers.js/blob/3260640b192b3e06a10a1f4dc004b1254fdf1b80/src/models.js#L1249
-    throw new Error("Method not implemented.");
-  }
-}
+export * from "@llamaindex/huggingface";
@@ -1,135 +1 @@
-import { wrapLLMEvent } from "@llamaindex/core/decorator";
-import {
-  BaseLLM,
-  type ChatMessage,
-  type ChatResponse,
-  type ChatResponseChunk,
-  type LLMChatParamsNonStreaming,
-  type LLMChatParamsStreaming,
-  type LLMMetadata,
-  type MessageType,
-} from "@llamaindex/core/llms";
-import { extractText } from "@llamaindex/core/utils";
-import { getEnv } from "@llamaindex/env";
-import _ from "lodash";
-import { Portkey as OrigPortKey } from "portkey-ai";
-
-type PortkeyOptions = ConstructorParameters<typeof OrigPortKey>[0];
-
-export class PortkeySession {
-  portkey: OrigPortKey;
-
-  constructor(options: PortkeyOptions = {}) {
-    if (!options.apiKey) {
-      options.apiKey = getEnv("PORTKEY_API_KEY")!;
-    }
-
-    if (!options.baseURL) {
-      options.baseURL = getEnv("PORTKEY_BASE_URL") ?? "https://api.portkey.ai";
-    }
-
-    this.portkey = new OrigPortKey({});
-    if (!options.apiKey) {
-      throw new Error("Set Portkey ApiKey in PORTKEY_API_KEY env variable");
-    }
-
-    this.portkey = new OrigPortKey(options);
-  }
-}
-
-const defaultPortkeySession: {
-  session: PortkeySession;
-  options: PortkeyOptions;
-}[] = [];
-
-/**
- * Get a session for the Portkey API. If one already exists with the same options,
- * it will be returned. Otherwise, a new session will be created.
- * @param options
- * @returns
- */
-export function getPortkeySession(options: PortkeyOptions = {}) {
-  let session = defaultPortkeySession.find((session) => {
-    return _.isEqual(session.options, options);
-  })?.session;
-
-  if (!session) {
-    session = new PortkeySession(options);
-    defaultPortkeySession.push({ session, options });
-  }
-  return session;
-}
-
-export class Portkey extends BaseLLM {
-  apiKey?: string | undefined = undefined;
-  baseURL?: string | undefined = undefined;
-  session: PortkeySession;
-
-  constructor(init?: Partial<Portkey> & PortkeyOptions) {
-    super();
-    const { apiKey, baseURL, ...rest } = init || {};
-    this.apiKey = apiKey;
-    this.baseURL = baseURL;
-    this.session = getPortkeySession({
-      ...rest,
-      apiKey: this.apiKey ?? null,
-      baseURL: this.baseURL ?? null,
-    });
-  }
-
-  get metadata(): LLMMetadata {
-    throw new Error("metadata not implemented for Portkey");
-  }
-
-  chat(
-    params: LLMChatParamsStreaming,
-  ): Promise<AsyncIterable<ChatResponseChunk>>;
-  chat(params: LLMChatParamsNonStreaming): Promise<ChatResponse>;
-  @wrapLLMEvent
-  async chat(
-    params: LLMChatParamsNonStreaming | LLMChatParamsStreaming,
-  ): Promise<ChatResponse | AsyncIterable<ChatResponseChunk>> {
-    const { messages, stream, additionalChatOptions } = params;
-    if (stream) {
-      return this.streamChat(messages, additionalChatOptions);
-    } else {
-      const bodyParams = additionalChatOptions || {};
-      const response = await this.session.portkey.chatCompletions.create({
-        messages: messages.map((message) => ({
-          content: extractText(message.content),
-          role: message.role,
-        })),
-        ...bodyParams,
-      });
-
-      const content = response.choices[0]!.message?.content ?? "";
-      const role = response.choices[0]!.message?.role || "assistant";
-      return { raw: response, message: { content, role: role as MessageType } };
-    }
-  }
-
-  async *streamChat(
-    messages: ChatMessage[],
-    params?: Record<string, any>,
-  ): AsyncIterable<ChatResponseChunk> {
-    const chunkStream = await this.session.portkey.chatCompletions.create({
-      messages: messages.map((message) => ({
-        content: extractText(message.content),
-        role: message.role,
-      })),
-      ...params,
-      stream: true,
-    });
-
-    //Indices
-    let idx_counter: number = 0;
-    for await (const part of chunkStream) {
-      part.choices[0]!.index = idx_counter;
-
-      idx_counter++;
-
-      yield { raw: part, delta: part.choices[0]!.delta?.content ?? "" };
-    }
-    return;
-  }
-}
+export * from "@llamaindex/portkey-ai";
@@ -1,379 +1 @@
-import { wrapLLMEvent } from "@llamaindex/core/decorator";
-import {
-  BaseLLM,
-  type ChatMessage,
-  type ChatResponse,
-  type ChatResponseChunk,
-  type LLMChatParamsNonStreaming,
-  type LLMChatParamsStreaming,
-  type MessageType,
-} from "@llamaindex/core/llms";
-import {
-  extractText,
-  streamCallbacks,
-  streamConverter,
-} from "@llamaindex/core/utils";
-import { getEnv } from "@llamaindex/env";
-import Replicate from "../internal/deps/replicate.js";
-
-export class ReplicateSession {
-  replicateKey: string | null = null;
-  replicate: Replicate;
-
-  constructor(replicateKey: string | null = null) {
-    if (replicateKey) {
-      this.replicateKey = replicateKey;
-    } else if (getEnv("REPLICATE_API_TOKEN")) {
-      this.replicateKey = getEnv("REPLICATE_API_TOKEN") as string;
-    } else {
-      throw new Error(
-        "Set Replicate token in REPLICATE_API_TOKEN env variable",
-      );
-    }
-
-    this.replicate = new Replicate({ auth: this.replicateKey });
-  }
-}
-
-export const ALL_AVAILABLE_REPLICATE_MODELS = {
-  // TODO: add more models from replicate
-  "Llama-2-70b-chat-old": {
-    contextWindow: 4096,
-    replicateApi:
-      "replicate/llama70b-v2-chat:e951f18578850b652510200860fc4ea62b3b16fac280f83ff32282f87bbd2e48",
-    //^ Previous 70b model. This is also actually 4 bit, although not exllama.
-  },
-  "Llama-2-70b-chat-4bit": {
-    contextWindow: 4096,
-    replicateApi:
-      "meta/llama-2-70b-chat:02e509c789964a7ea8736978a43525956ef40397be9033abf9fd2badfe68c9e3",
-    //^ Model is based off of exllama 4bit.
-  },
-  "Llama-2-13b-chat-old": {
-    contextWindow: 4096,
-    replicateApi:
-      "a16z-infra/llama13b-v2-chat:df7690f1994d94e96ad9d568eac121aecf50684a0b0963b25a41cc40061269e5",
-  },
-  //^ Last known good 13b non-quantized model. In future versions they add the SYS and INST tags themselves
-  "Llama-2-13b-chat-4bit": {
-    contextWindow: 4096,
-    replicateApi:
-      "meta/llama-2-13b-chat:f4e2de70d66816a838a89eeeb621910adffb0dd0baba3976c96980970978018d",
-  },
-  "Llama-2-7b-chat-old": {
-    contextWindow: 4096,
-    replicateApi:
-      "a16z-infra/llama7b-v2-chat:4f0a4744c7295c024a1de15e1a63c880d3da035fa1f49bfd344fe076074c8eea",
-    //^ Last (somewhat) known good 7b non-quantized model. In future versions they add the SYS and INST
-    // tags themselves
-    // https://github.com/replicate/cog-llama-template/commit/fa5ce83912cf82fc2b9c01a4e9dc9bff6f2ef137
-    // Problem is that they fix the max_new_tokens issue in the same commit. :-(
-  },
-  "Llama-2-7b-chat-4bit": {
-    contextWindow: 4096,
-    replicateApi:
-      "meta/llama-2-7b-chat:13c3cdee13ee059ab779f0291d29054dab00a47dad8261375654de5540165fb0",
-  },
-
-  "llama-3-70b-instruct": {
-    contextWindow: 8192,
-    replicateApi: "meta/meta-llama-3-70b-instruct",
-  },
-
-  "llama-3-8b-instruct": {
-    contextWindow: 8192,
-    replicateApi: "meta/meta-llama-3-8b-instruct",
-  },
-};
-
-export enum ReplicateChatStrategy {
-  A16Z = "a16z",
-  META = "meta",
-  METAWBOS = "metawbos",
-  //^ This is not exactly right because SentencePiece puts the BOS and EOS token IDs in after tokenization
-  // Unfortunately any string only API won't support these properly.
-  REPLICATE4BIT = "replicate4bit",
-  //^ To satisfy Replicate's 4 bit models' requirements where they also insert some INST tags
-  REPLICATE4BITWNEWLINES = "replicate4bitwnewlines",
-  //^ Replicate's documentation recommends using newlines: https://replicate.com/blog/how-to-prompt-llama
-  LLAMA3 = "llama3",
-}
-
-export const DeuceChatStrategy = ReplicateChatStrategy;
-
-/**
- * Replicate LLM implementation used
- */
-export class ReplicateLLM extends BaseLLM {
-  model: keyof typeof ALL_AVAILABLE_REPLICATE_MODELS;
-  chatStrategy: ReplicateChatStrategy;
-  temperature: number;
-  topP: number;
-  maxTokens?: number;
-  replicateSession: ReplicateSession;
-
-  constructor(init?: Partial<ReplicateLLM> & { noWarn?: boolean }) {
-    super();
-
-    if (!init?.model && !init?.noWarn) {
-      console.warn(
-        "The default model has been changed to llama-3-70b-instruct. Set noWarn to true to suppress this warning.",
-      );
-    }
-
-    this.model = init?.model ?? "llama-3-70b-instruct";
-    this.chatStrategy =
-      init?.chatStrategy ??
-      (this.model.startsWith("llama-3")
-        ? ReplicateChatStrategy.LLAMA3
-        : this.model.endsWith("4bit")
-          ? ReplicateChatStrategy.REPLICATE4BITWNEWLINES // With the newer Replicate models they do the system message themselves.
-          : ReplicateChatStrategy.METAWBOS); // With BOS and EOS seems to work best, although they all have problems past a certain point
-    this.temperature = init?.temperature ?? 0.1; // minimum temperature is 0.01 for Replicate endpoint
-    this.topP = init?.topP ?? (this.model.startsWith("llama-3") ? 0.9 : 1); // llama-3 defaults to 0.9 top P
-    this.maxTokens =
-      init?.maxTokens ??
-      ALL_AVAILABLE_REPLICATE_MODELS[this.model].contextWindow; // For Replicate, the default is 500 tokens which is too low.
-    this.replicateSession = init?.replicateSession ?? new ReplicateSession();
-  }
-
-  get metadata() {
-    return {
-      model: this.model,
-      temperature: this.temperature,
-      topP: this.topP,
-      maxTokens: this.maxTokens,
-      contextWindow: ALL_AVAILABLE_REPLICATE_MODELS[this.model].contextWindow,
-      tokenizer: undefined,
-    };
-  }
-
-  mapMessagesToPrompt(messages: ChatMessage[]) {
-    if (this.chatStrategy === ReplicateChatStrategy.LLAMA3) {
-      return this.mapMessagesToPromptLlama3(messages);
-    } else if (this.chatStrategy === ReplicateChatStrategy.A16Z) {
-      return this.mapMessagesToPromptA16Z(messages);
-    } else if (this.chatStrategy === ReplicateChatStrategy.META) {
-      return this.mapMessagesToPromptMeta(messages);
-    } else if (this.chatStrategy === ReplicateChatStrategy.METAWBOS) {
-      return this.mapMessagesToPromptMeta(messages, { withBos: true });
-    } else if (this.chatStrategy === ReplicateChatStrategy.REPLICATE4BIT) {
-      return this.mapMessagesToPromptMeta(messages, {
-        replicate4Bit: true,
-        withNewlines: true,
-      });
-    } else if (
-      this.chatStrategy === ReplicateChatStrategy.REPLICATE4BITWNEWLINES
-    ) {
-      return this.mapMessagesToPromptMeta(messages, {
-        replicate4Bit: true,
-        withNewlines: true,
-      });
-    } else {
-      return this.mapMessagesToPromptMeta(messages);
-    }
-  }
-
-  mapMessagesToPromptLlama3(messages: ChatMessage[]) {
-    return {
-      prompt:
-        "<|begin_of_text|>" +
-        messages.reduce((acc, message) => {
-          let content = "";
-          if (typeof message.content === "string") {
-            content = message.content;
-          } else {
-            if (message.content[0]!.type === "text") {
-              content = message.content[0]!.text;
-            } else {
-              content = "";
-            }
-          }
-
-          return (
-            acc +
-            `<|start_header_id|>${message.role}<|end_header_id|>\n\n${content}<|eot_id|>`
-          );
-        }, "") +
-        "<|start_header_id|>assistant<|end_header_id|>\n\n",
-      systemPrompt: undefined,
-    };
-  }
-
-  mapMessagesToPromptA16Z(messages: ChatMessage[]) {
-    return {
-      prompt:
-        messages.reduce((acc, message) => {
-          return (
-            (acc && `${acc}\n\n`) +
-            `${this.mapMessageTypeA16Z(message.role)}${message.content}`
-          );
-        }, "") + "\n\nAssistant:",
-      //^ Here we're differing from A16Z by omitting the space. Generally spaces at the end of prompts decrease performance due to tokenization
-      systemPrompt: undefined,
-    };
-  }
-
-  mapMessageTypeA16Z(messageType: MessageType): string {
-    switch (messageType) {
-      case "user":
-        return "User: ";
-      case "assistant":
-        return "Assistant: ";
-      case "system":
-        return "";
-      default:
-        throw new Error("Unsupported ReplicateLLM message type");
-    }
-  }
-
-  mapMessagesToPromptMeta(
-    messages: ChatMessage[],
-    opts?: {
-      withBos?: boolean;
-      replicate4Bit?: boolean;
-      withNewlines?: boolean;
-    },
-  ) {
-    const {
-      withBos = false,
-      replicate4Bit = false,
-      withNewlines = false,
-    } = opts ?? {};
-    const DEFAULT_SYSTEM_PROMPT = `You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.
-
-If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.`;
-
-    const B_SYS = "<<SYS>>\n";
-    const E_SYS = "\n<</SYS>>\n\n";
-    const B_INST = "[INST]";
-    const E_INST = "[/INST]";
-    const BOS = "<s>";
-    const EOS = "</s>";
-
-    if (messages.length === 0) {
-      return { prompt: "", systemPrompt: undefined };
-    }
-
-    messages = [...messages]; // so we can use shift without mutating the original array
-
-    let systemPrompt = undefined;
-    if (messages[0]!.role === "system") {
-      const systemMessage = messages.shift()!;
-
-      if (replicate4Bit) {
-        systemPrompt = systemMessage.content;
-      } else {
-        const systemStr = `${B_SYS}${systemMessage.content}${E_SYS}`;
-
-        // TS Bug: https://github.com/microsoft/TypeScript/issues/9998
-        // @ts-ignore
-        if (messages[0].role !== "user") {
-          throw new Error(
-            "ReplicateLLM: if there is a system message, the second message must be a user message.",
-          );
-        }
-
-        const userContent = messages[0]!.content;
-
-        messages[0]!.content = `${systemStr}${userContent}`;
-      }
-    } else {
-      if (!replicate4Bit) {
-        messages[0]!.content = `${B_SYS}${DEFAULT_SYSTEM_PROMPT}${E_SYS}${messages[0]!.content}`;
-      }
-    }
-
-    return {
-      prompt: messages.reduce((acc, message, index) => {
-        const content = extractText(message.content);
-        if (index % 2 === 0) {
-          return (
-            `${acc}${withBos ? BOS : ""}${B_INST} ${content.trim()} ${E_INST}` +
-            (withNewlines ? "\n" : "")
-          );
-        } else {
-          return (
-            `${acc} ${content.trim()}` +
-            (withNewlines ? "\n" : " ") +
-            (withBos ? EOS : "")
-          ); // Yes, the EOS comes after the space. This is not a mistake.
-        }
-      }, ""),
-      systemPrompt,
-    };
-  }
-
-  chat(
-    params: LLMChatParamsStreaming,
-  ): Promise<AsyncIterable<ChatResponseChunk>>;
-  chat(params: LLMChatParamsNonStreaming): Promise<ChatResponse>;
-  @wrapLLMEvent
-  async chat(
-    params: LLMChatParamsNonStreaming | LLMChatParamsStreaming,
-  ): Promise<ChatResponse | AsyncIterable<ChatResponseChunk>> {
-    const { messages, stream } = params;
-    const api = ALL_AVAILABLE_REPLICATE_MODELS[this.model]
-      .replicateApi as `${string}/${string}:${string}`;
-
-    const { prompt, systemPrompt } = this.mapMessagesToPrompt(messages);
-
-    const replicateOptions: any = {
-      input: {
-        prompt,
-        system_prompt: systemPrompt,
-        temperature: this.temperature,
-        max_tokens: this.maxTokens,
-        top_p: this.topP,
-      },
-    };
-
-    if (this.model.endsWith("4bit")) {
-      replicateOptions.input.max_new_tokens = this.maxTokens;
-    } else {
-      replicateOptions.input.max_length = this.maxTokens;
-    }
-
-    if (this.model.startsWith("llama-3")) {
-      replicateOptions.input.prompt_template = "{prompt}";
-    }
-
-    if (stream) {
-      const controller = new AbortController();
-      const stream = this.replicateSession.replicate.stream(api, {
-        ...replicateOptions,
-        signal: controller.signal,
-      });
-      // replicate.stream is not closing if used as AsyncIterable, force closing after consumption with the AbortController
-      return streamCallbacks(
-        streamConverter(stream, (chunk) => {
-          if (chunk.event === "done") {
-            return null;
-          }
-          return {
-            raw: chunk,
-            delta: chunk.data,
-          };
-        }),
-        { finished: () => controller.abort() },
-      );
-    }
-
-    //Non-streaming
-    const response = await this.replicateSession.replicate.run(
-      api,
-      replicateOptions,
-    );
-
-    return {
-      raw: response,
-      message: {
-        content: (response as Array<string>).join("").trimStart(),
-        //^ We need to do this because Replicate returns a list of strings (for streaming functionality which is not exposed by the run function)
-        role: "assistant",
-      },
-    };
-  }
-}
-
-export const LlamaDeuce = ReplicateLLM;
+export * from "@llamaindex/replicate";
@@ -17,12 +17,6 @@
 */
 export default function withLlamaIndex(config: any) {
  config.experimental = config.experimental ?? {};
-  // copy tiktoken WASM files to the NextJS build
-  config.experimental.outputFileTracingIncludes =
-    config.experimental.outputFileTracingIncludes ?? {};
-  config.experimental.outputFileTracingIncludes["/**/*"] = [
-    "./node_modules/tiktoken/*.wasm",
-  ];
  // needed for transformers, see https://huggingface.co/docs/transformers.js/en/tutorials/next#step-2-install-and-configure-transformersjs
  config.experimental.serverComponentsExternalPackages =
    config.experimental.serverComponentsExternalPackages ?? [];
@@ -44,6 +38,7 @@ export default function withLlamaIndex(config: any) {
    webpackConfig.externals.push({
      "onnxruntime-node": "commonjs onnxruntime-node",
      sharp: "commonjs sharp",
+      chromadb: "commonjs chromadb",
    });
    return webpackConfig;
  };
--- a/Show More
+++ b/Show More
Author	SHA1	Message	Date
github-actions[bot]	76b925e62a	Release 0.7.3 (#1357 ) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: himself65 <himself65@users.noreply.github.com>	2024-10-20 20:15:51 -07:00
Alex Yang	0493f679a4	fix(core): inline `python-format-js` (#1356 )	2024-10-20 20:07:48 -07:00
github-actions[bot]	0e0a627c9a	Release 0.7.2 (#1355 ) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: himself65 <himself65@users.noreply.github.com>	2024-10-20 19:22:59 -07:00
Alex Yang	4ba2cfe7ab	fix(env): align export APIs (#1354 )	2024-10-20 17:11:09 -07:00
github-actions[bot]	c1578a19d9	Release 0.7.1 (#1342 ) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: himself65 <himself65@users.noreply.github.com>	2024-10-20 15:29:19 -07:00
Alex Yang	ae49ff4e15	feat: use `gpt-tokenizer` (#1352 )	2024-10-20 15:18:30 -07:00
Alex Yang	a75af835a5	chore: fix misc before release (#1351 )	2024-10-20 14:34:21 -07:00
Alex Yang	7c7cd34908	fix(pg): allow passing perform setup (#1350 )	2024-10-20 14:01:24 -07:00
Alex Yang	f651891196	fix: remove internal `getImageEmbedModel`	2024-10-20 13:21:15 -07:00
Alex Yang	04714c886f	chore: move under providers directory (#1349 )	2024-10-19 20:19:12 -07:00
Alex Yang	cf28574f51	refactor: move clip&huggingface embedding into single package (#1346 )	2024-10-19 18:39:52 -07:00
Jason Musgrave	24d065f054	feat: log api response from failed parse jobs (#1348 )	2024-10-19 18:39:28 -07:00
Alex Yang	b8719586e3	ci: pack all module under packages (#1345 )	2024-10-18 17:26:40 -07:00
Alex Yang	07a40aca49	refactor: move llm into single packages (#1344 )	2024-10-18 16:12:52 -07:00
Alex Yang	33b562938d	refactor: move `data-structs` module (#1343 )	2024-10-18 14:52:39 -07:00
Alex Yang	723b41c23c	refactor: move tools into core module (#1316 )	2024-10-18 09:45:01 -07:00
Alex Yang	4c38c1be0b	fix: do not detect file type in sdk (#1340 )	2024-10-18 09:36:01 -07:00
Alex Yang	0dde0ca27f	ci: fix pre-release (#1341 )	2024-10-17 23:28:58 -07:00
github-actions[bot]	f3e0d07f48	Release 0.7.0 (#1337 ) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: himself65 <himself65@users.noreply.github.com>	2024-10-17 11:18:29 -07:00
Bruno Bornsztein	1364e8eeed	feat: update metadata extractor to use prompt template (#1338 )	2024-10-17 11:10:41 -07:00
Bruno Bornsztein	96fc69cc61	feat: use promptTemplate arg correctly. (#1335 )	2024-10-16 16:16:03 -07:00
Parham Saidi	3b7736f763	feat: added gemini 002 support (#1336 )	2024-10-16 15:52:36 -07:00
Alex Yang	a7a7afe66e	fix: vector store type (#1334 )	2024-10-15 11:53:35 -07:00
github-actions[bot]	c646ee2eca	Release 0.6.22 (#1333 ) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>	2024-10-15 11:27:21 +07:00
Marcus Schiesser	5729bd92fd	fix: LlamaCloud API calls for ensuring and index and for file uploads (#1332 )	2024-10-15 11:21:35 +07:00
github-actions[bot]	e0e52cf879	Release 0.6.21 (#1329 ) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>	2024-10-14 15:36:53 +07:00
Thuc Pham	6f75306c17	feat: support metadata filters for Astra (#1330 ) Co-authored-by: Marcus Schiesser <mail@marcusschiesser.de>	2024-10-14 15:31:00 +07:00
Thuc Pham	94cb4ad810	feat: ChromaDb metadata filters (#1323 ) Co-authored-by: Marcus Schiesser <mail@marcusschiesser.de>	2024-10-14 10:21:52 +07:00
github-actions[bot]	1ea4014746	Release 0.6.20 (#1325 ) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>	2024-10-11 12:55:16 -07:00
Parham Saidi	6a9a7b1458	fix: use init api key for openai embeddings (#1324 )	2024-10-11 12:20:20 -07:00
				`@@ -0,0 +1 @@`
				`export { FunctionTool } from "./function-tool";`