Release 0.2.8 (#685)

Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
feat: support human in the loop for TS (#686)
2026-07-04 00:16:55 -04:00 · 2025-06-12 18:09:12 +07:00 · 2025-06-12 18:00:10 +07:00 · 2025-06-09 16:53:49 +07:00 · 2025-06-06 17:19:25 +07:00 · 2025-06-06 16:43:45 +07:00
721 changed files with 45439 additions and 11219 deletions
@@ -1,12 +0,0 @@
-{
-  "extends": [
-    "prettier"
-  ],
-  "rules": {
-    "max-params": [
-      "error",
-      4
-    ],
-    "prefer-const": "error",
-  },
-}
@@ -1,12 +1,15 @@
-name: E2E Tests
+name: E2E Tests for create-llama package
 on:
  push:
    branches: [main]
+    paths-ignore:
+      - "python/llama-index-server/**"
+      - ".github/workflows/*llama_index_server.yml"
  pull_request:
    branches: [main]
-
-env:
-  POETRY_VERSION: "1.6.1"
+    paths-ignore:
+      - "python/llama-index-server/**"
+      - ".github/workflows/*llama_index_server.yml"

 jobs:
  e2e-python:
@@ -20,6 +23,7 @@ jobs:
        os: [macos-latest, windows-latest, ubuntu-22.04]
        frameworks: ["fastapi"]
        datasources: ["--no-files", "--example-file", "--llamacloud"]
+        template-types: ["streaming", "llamaindexserver"]
    defaults:
      run:
        shell: bash
@@ -32,10 +36,10 @@ jobs:
        with:
          python-version: ${{ matrix.python-version }}

-      - name: Install Poetry
-        uses: snok/install-poetry@v1
-        with:
-          version: ${{ env.POETRY_VERSION }}
+      - name: Install uv
+        run: curl -LsSf https://astral.sh/uv/install.sh | sh
+      - name: Add uv to PATH # Ensure uv is available in subsequent steps
+        run: echo "$HOME/.cargo/bin" >> $GITHUB_PATH

      - uses: pnpm/action-setup@v3

@@ -50,15 +54,24 @@ jobs:

      - name: Install Playwright Browsers
        run: pnpm exec playwright install --with-deps
-        working-directory: .
+        working-directory: packages/create-llama

      - name: Build create-llama
        run: pnpm run build
-        working-directory: .
+        working-directory: packages/create-llama

      - name: Install
        run: pnpm run pack-install
-        working-directory: .
+        working-directory: packages/create-llama
+
+      - name: Build and store server package
+        run: |
+          pnpm run build
+          wheel_file=$(ls dist/*.whl | head -n 1)
+          mkdir -p "${{ runner.temp }}"
+          cp "$wheel_file" "${{ runner.temp }}/"
+          echo "SERVER_PACKAGE_PATH=${{ runner.temp }}/$(basename "$wheel_file")" >> $GITHUB_ENV
+        working-directory: python/llama-index-server

      - name: Run Playwright tests for Python
        run: pnpm run e2e:python
@@ -67,15 +80,17 @@ jobs:
          LLAMA_CLOUD_API_KEY: ${{ secrets.LLAMA_CLOUD_API_KEY }}
          FRAMEWORK: ${{ matrix.frameworks }}
          DATASOURCE: ${{ matrix.datasources }}
+          TEMPLATE_TYPE: ${{ matrix.template-types }}
          PYTHONIOENCODING: utf-8
          PYTHONLEGACYWINDOWSSTDIO: utf-8
-        working-directory: .
+          SERVER_PACKAGE_PATH: ${{ env.SERVER_PACKAGE_PATH }}
+        working-directory: packages/create-llama

      - uses: actions/upload-artifact@v4
        if: always()
        with:
-          name: playwright-report-python-${{ matrix.os }}-${{ matrix.frameworks }}-${{ matrix.datasources }}
-          path: ./playwright-report/
+          name: playwright-report-python-${{ matrix.os }}-${{ matrix.frameworks }}-${{ matrix.datasources }}-${{ matrix.template-types }}
+          path: packages/create-llama/playwright-report/
          overwrite: true
          retention-days: 30

@@ -85,11 +100,12 @@ jobs:
    strategy:
      fail-fast: true
      matrix:
-        node-version: [18, 20]
+        node-version: [20, 22]
        python-version: ["3.11"]
        os: [macos-latest, windows-latest, ubuntu-22.04]
        frameworks: ["nextjs"]
        datasources: ["--no-files", "--example-file", "--llamacloud"]
+        template-types: ["streaming", "llamaindexserver"]
    defaults:
      run:
        shell: bash
@@ -102,10 +118,10 @@ jobs:
        with:
          python-version: ${{ matrix.python-version }}

-      - name: Install Poetry
-        uses: snok/install-poetry@v1
-        with:
-          version: ${{ env.POETRY_VERSION }}
+      - name: Install uv
+        run: curl -LsSf https://astral.sh/uv/install.sh | sh
+      - name: Add uv to PATH # Ensure uv is available in subsequent steps
+        run: echo "$HOME/.cargo/bin" >> $GITHUB_PATH

      - uses: pnpm/action-setup@v3

@@ -120,15 +136,30 @@ jobs:

      - name: Install Playwright Browsers
        run: pnpm exec playwright install --with-deps
-        working-directory: .
+        working-directory: packages/create-llama

      - name: Build create-llama
        run: pnpm run build
-        working-directory: .
+        working-directory: packages/create-llama

      - name: Install
        run: pnpm run pack-install
-        working-directory: .
+        working-directory: packages/create-llama
+
+      - name: Build server
+        run: pnpm run build
+        working-directory: packages/server
+
+      - name: Pack @llamaindex/server package
+        run: |
+          pnpm pack --pack-destination "${{ runner.temp }}"
+          if [ "${{ runner.os }}" == "Windows" ]; then
+            file=$(find "${{ runner.temp }}" -name "llamaindex-server-*.tgz" | head -n 1)
+            mv "$file" "${{ runner.temp }}/llamaindex-server.tgz"
+          else
+            mv ${{ runner.temp }}/llamaindex-server-*.tgz ${{ runner.temp }}/llamaindex-server.tgz
+          fi
+        working-directory: packages/server

      - name: Run Playwright tests for TypeScript
        run: pnpm run e2e:typescript
@@ -137,12 +168,14 @@ jobs:
          LLAMA_CLOUD_API_KEY: ${{ secrets.LLAMA_CLOUD_API_KEY }}
          FRAMEWORK: ${{ matrix.frameworks }}
          DATASOURCE: ${{ matrix.datasources }}
-        working-directory: .
+          TEMPLATE_TYPE: ${{ matrix.template-types }}
+          SERVER_PACKAGE_PATH: ${{ runner.temp }}/llamaindex-server.tgz
+        working-directory: packages/create-llama

      - uses: actions/upload-artifact@v4
        if: always()
        with:
-          name: playwright-report-typescript-${{ matrix.os }}-${{ matrix.frameworks }}-${{ matrix.datasources }}-node${{ matrix.node-version }}
-          path: ./playwright-report/
+          name: playwright-report-typescript-${{ matrix.os }}-${{ matrix.frameworks }}-${{ matrix.datasources }}-node${{ matrix.node-version }}-${{ matrix.template-types }}
+          path: packages/create-llama/playwright-report/
          overwrite: true
          retention-days: 30
@@ -16,6 +16,16 @@ jobs:

      - uses: pnpm/action-setup@v3

+      - name: Setup Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
+        with:
+          enable-cache: true
+
      - name: Setup Node.js
        uses: actions/setup-node@v4
        with:
@@ -31,12 +41,21 @@ jobs:
      - name: Run Prettier
        run: pnpm run format

+      - name: Run build
+        run: pnpm run build
+
+      - name: Run Typecheck for examples
+        run: pnpm run typecheck
+        working-directory: packages/server/examples
+
      - name: Run Python format check
        uses: chartboost/ruff-action@v1
        with:
          args: "format --check"
+          src: "python/llama-index-server"

      - name: Run Python lint
        uses: chartboost/ruff-action@v1
        with:
          args: "check"
+          src: "python/llama-index-server"
@@ -17,6 +17,11 @@ jobs:

      - uses: pnpm/action-setup@v3

+      - name: Setup Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+
      - name: Install uv
        uses: astral-sh/setup-uv@v3

@@ -51,8 +56,12 @@ jobs:
        with:
          commit: Release ${{ steps.get-changeset-status.outputs.new-version }}
          title: Release ${{ steps.get-changeset-status.outputs.new-version }}
+          # bump versions
+          version: pnpm new-version
          # build package and call changeset publish
          publish: pnpm release
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          NPM_TOKEN: ${{ secrets.NPM_TOKEN }}
+          PYPI_TOKEN: ${{ secrets.PYPI_TOKEN }}
+          UV_PUBLISH_TOKEN: ${{ secrets.PYPI_TOKEN }}
@@ -1,130 +0,0 @@
-name: Release llama-index-server
-
-on:
-  push:
-    branches:
-      - main
-    paths:
-      - "llama-index-server/**"
-      - ".github/workflows/release_llama_index_server.yml"
-  pull_request:
-    types:
-      - closed
-
-concurrency: ${{ github.workflow }}-${{ github.ref }}
-
-jobs:
-  release:
-    name: Create Release PR
-    runs-on: ubuntu-latest
-    defaults:
-      run:
-        working-directory: ./llama-index-server
-    if: |
-      github.event_name == 'push' && 
-      !startsWith(github.ref, 'refs/heads/release/llama-index-server-v')
-
-    steps:
-      - name: Checkout Repository
-        uses: actions/checkout@v4
-        with:
-          fetch-depth: 0
-
-      - name: Set up Python
-        uses: actions/setup-python@v5
-        with:
-          python-version: "3.11"
-
-      - name: Install Poetry
-        run: |
-          curl -sSL https://install.python-poetry.org | python3 -
-
-      - name: Install dependencies
-        run: poetry install
-
-      - name: Setup Git
-        run: |
-          git config --global user.email "github-actions[bot]@users.noreply.github.com"
-          git config --global user.name "github-actions[bot]"
-
-      - name: Bump patch version
-        run: |
-          poetry version patch
-          git add pyproject.toml
-          git commit -m "chore(release): bump version to $(poetry version -s)"
-
-      - name: Get current version
-        id: get_version
-        run: |
-          version=$(poetry version -s)
-          echo "current_version=${version}" >> "$GITHUB_OUTPUT"
-
-      - name: Create Release PR
-        uses: peter-evans/create-pull-request@v6
-        with:
-          token: ${{ secrets.GITHUB_TOKEN }}
-          commit-message: "Release: llama-index-server v${{ steps.get_version.outputs.current_version }}"
-          title: "Release: llama-index-server v${{ steps.get_version.outputs.current_version }}"
-          body: |
-            This PR was automatically created to release a new version of the llama-index-server package.
-
-            Version: ${{ steps.get_version.outputs.current_version }}
-
-            Please review the changes and merge to trigger the release.
-          branch: release/llama-index-server-v${{ steps.get_version.outputs.current_version }}
-          base: main
-          labels: release, llama-index-server
-
-  publish:
-    name: Publish to PyPI
-    runs-on: ubuntu-latest
-    defaults:
-      run:
-        working-directory: ./llama-index-server
-    if: |
-      github.event_name == 'pull_request' && 
-      github.event.pull_request.merged == true && 
-      startsWith(github.event.pull_request.title, 'Release: llama-index-server') &&
-      startsWith(github.event.pull_request.head.ref, 'release/llama-index-server-v')
-
-    steps:
-      - name: Checkout Repository
-        uses: actions/checkout@v4
-
-      - name: Set up Python
-        uses: actions/setup-python@v5
-        with:
-          python-version: "3.11"
-
-      - name: Install Poetry
-        run: |
-          curl -sSL https://install.python-poetry.org | python3 -
-
-      - name: Install dependencies
-        run: poetry install
-
-      - name: Get current version
-        id: get_version
-        run: |
-          version=$(poetry version -s)
-          echo "current_version=${version}" >> "$GITHUB_OUTPUT"
-
-      - name: Build and publish to PyPI
-        uses: JRubics/poetry-publish@v2.1
-        with:
-          python_version: "3.11"
-          pypi_token: ${{ secrets.PYPI_TOKEN }}
-          package_directory: "llama-index-server"
-          poetry_install_options: "--without dev"
-
-      - name: Create GitHub Release
-        uses: softprops/action-gh-release@v2
-        with:
-          tag_name: llama-index-server-v${{ steps.get_version.outputs.current_version }}
-          name: "llama-index-server v${{ steps.get_version.outputs.current_version }}"
-          body: |
-            Release of llama-index-server v${{ steps.get_version.outputs.current_version }}
-          draft: false
-          prerelease: false
-        env:
-          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
@@ -4,8 +4,8 @@ on:
  pull_request:

 env:
-  POETRY_VERSION: "1.8.3"
  PYTHON_VERSION: "3.9"
+  UI_TEST: "true"

 jobs:
  unit-test:
@@ -13,99 +13,124 @@ jobs:
    runs-on: ${{ matrix.os }}
    defaults:
      run:
-        working-directory: llama-index-server
+        working-directory: python/llama-index-server
    strategy:
      matrix:
        os: [ubuntu-latest, windows-latest]
        python-version: ["3.9"]
    steps:
      - uses: actions/checkout@v4
+      - uses: pnpm/action-setup@v3

-      - name: Install Poetry
-        run: pipx install poetry==${{ env.POETRY_VERSION }}
-
-      - name: Set up python ${{ matrix.python-version }}
+      - name: Setup Python
        uses: actions/setup-python@v5
        with:
          python-version: ${{ matrix.python-version }}
-          cache: "poetry"

-      - name: Configure Poetry
-        run: |
-          poetry config virtualenvs.create true
-          poetry config virtualenvs.in-project true
-          poetry env use python
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
+        with:
+          enable-cache: true
+
+      - name: Setup Node.js
+        uses: actions/setup-node@v4
+        with:
+          node-version-file: ".nvmrc"
+          cache: "pnpm"

      - name: Install dependencies
        shell: bash
-        run: poetry install --with dev
+        run: pnpm install && pnpm build

      - name: Run unit tests
        shell: bash
-        run: |
-          poetry run pytest tests
+        run: uv run pytest tests

  type-check:
    name: Type Check
    runs-on: ubuntu-latest
    defaults:
      run:
-        working-directory: llama-index-server
+        working-directory: python/llama-index-server
    steps:
      - uses: actions/checkout@v4
+      - uses: pnpm/action-setup@v3

-      - name: Install Poetry
-        run: pipx install poetry==${{ env.POETRY_VERSION }}
-
-      - name: Set up Python
+      - name: Setup Python
        uses: actions/setup-python@v5
        with:
          python-version: ${{ env.PYTHON_VERSION }}
-          cache: "poetry"

-      - name: Configure Poetry
-        run: |
-          poetry config virtualenvs.create true
-          poetry config virtualenvs.in-project true
-          poetry env use python
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
+        with:
+          enable-cache: true

      - name: Install dependencies
-        shell: bash
-        run: poetry install --with dev
+        run: pnpm install

      - name: Run mypy
        shell: bash
-        run: poetry run mypy llama_index
+        run: uv run mypy llama_index

  build:
    needs: [unit-test, type-check]
    runs-on: ubuntu-latest
    defaults:
      run:
-        working-directory: llama-index-server
+        working-directory: python/llama-index-server
    steps:
      - uses: actions/checkout@v4
-      - name: Install Poetry
-        run: pipx install poetry==${{ env.POETRY_VERSION }}
+      - uses: pnpm/action-setup@v3
+
      - name: Set up Python
        uses: actions/setup-python@v5
        with:
          python-version: ${{ env.PYTHON_VERSION }}
-      - name: Clear python cache
-        shell: bash
-        run: poetry cache clear --all pypi
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
+        with:
+          enable-cache: true
+
+      - name: Setup Node.js
+        uses: actions/setup-node@v4
+        with:
+          node-version-file: ".nvmrc"
+          cache: "pnpm"
+
+      - name: Install dependencies
+        run: pnpm install && pnpm build
+
      - name: Build package
        shell: bash
-        run: poetry build
-      - name: Test installing built package
+        run: uv build
+
+      - name: Get the absolute wheel file path and save it to the output
        shell: bash
-        run: python -m pip install .
+        id: get_whl_path
+        run: |
+          WHL_FILE=$(readlink -f dist/*.whl)
+          echo "whl_file=$WHL_FILE" >> $GITHUB_OUTPUT
+
      - name: Test import
        shell: bash
-        working-directory: ${{ vars.RUNNER_TEMP }}
-        run: python -c "from llama_index.server import LlamaIndexServer"
+        working-directory: ${{ github.workspace }}
+        env:
+          WHL_FILE: ${{ steps.get_whl_path.outputs.whl_file }}
+        run: |
+          uv run --with $WHL_FILE python -c "from llama_index.server import LlamaIndexServer"
+
+      - name: Check frontend resources is present
+        shell: bash
+        working-directory: ${{ github.workspace }}
+        env:
+          WHL_FILE: ${{ steps.get_whl_path.outputs.whl_file }}
+        run: |
+          uv run --with $WHL_FILE python -c "from llama_index.server.chat_ui import check_ui_resources; check_ui_resources()"
+
      - name: Upload artifact
        uses: actions/upload-artifact@v4
        with:
          name: llama-index-server
-          path: llama-index-server/dist/
+          path: dist/
@@ -6,10 +6,6 @@ node_modules
 .pnpm-store
 .pnp.js

-# testing
-coverage
-.coverage
-
 # next.js
 .next/
 out/
@@ -35,31 +31,9 @@ yarn-error.log*
 dist/
 lib/

-# e2e
-.cache
-test-results/
-playwright-report/
-blob-report/
-playwright/.cache/
-.tsbuildinfo
-e2e/cache
-
 # intellij
 **/.idea

-# Python
-.mypy_cache/
-venv/
-.venv/
-dist/
-.__pycache__
-__pycache__
-.python-version
-.ui
-
-# build artifacts
-create-llama-*.tgz
-
 # vscode
 .vscode
 !.vscode/settings.json
@@ -1,3 +1,4 @@
 pnpm format
 pnpm lint
-uvx ruff format --check templates/
+uvx ruff check .
+uvx ruff format . --check 
@@ -1,6 +1,18 @@
-apps/docs/i18n
-apps/docs/docs/api
+node_modules/
 pnpm-lock.yaml
 lib/
 dist/
-.docusaurus/
+cache/
+build/
+.next/
+out/
+packages/server/server/
+packages/server/project/
+**/playwright-report/
+**/test-results/
+
+# Python
+python/
+**/*.mypy_cache/**
+**/*.venv/**
+**/*.ruff_cache/**
@@ -0,0 +1,201 @@
+# CLAUDE.md
+
+This file provides guidance to Claude Code (claude.ai/code) when working with code in this repository.
+
+## Repository Overview
+
+Create-llama is a monorepo containing CLI tools and server frameworks for building LlamaIndex-powered applications. The repository combines TypeScript/Node.js and Python components in a unified development environment.
+
+## Architecture
+
+### Monorepo Structure
+
+- **`packages/create-llama/`**: Main CLI tool for scaffolding LlamaIndex applications
+- **`packages/server/`**: TypeScript/Next.js server framework (`@llamaindex/server`)
+- **`python/llama-index-server/`**: Python/FastAPI server framework
+- **Root**: Workspace configuration and shared development tools
+
+### Key Technologies
+
+- **Package Manager**: pnpm with workspace configuration
+- **Build Tools**: bunchee (TypeScript), Next.js, hatchling (Python)
+- **Testing**: Playwright for e2e, pytest for Python
+- **Version Management**: changesets for TypeScript packages, manual for Python
+
+## Development Commands
+
+### Root Level (Monorepo)
+
+```bash
+pnpm dev          # Start all packages in development mode
+pnpm build        # Build all packages
+pnpm lint         # ESLint across TypeScript packages
+pnpm format       # Prettier formatting
+pnpm e2e          # Run end-to-end tests
+```
+
+### Create-llama Package
+
+```bash
+cd packages/create-llama
+npm run build     # Build CLI using bash script and ncc
+npm run dev       # Watch mode development
+npm run e2e       # Playwright tests for generated projects
+npm run clean     # Clean build artifacts and template caches
+```
+
+### TypeScript Server Package
+
+```bash
+cd packages/server
+pnpm dev          # Watch mode with bunchee
+pnpm build        # Multi-step build: ESM/CJS + Next.js + static assets
+pnpm clean        # Clean all build outputs
+```
+
+### Python Server Package
+
+```bash
+cd python/llama-index-server
+uv run generate   # Index data files
+fastapi dev       # Start development server with hot reload
+pytest            # Run test suite
+```
+
+## Template System
+
+The CLI uses a sophisticated template system in `packages/create-llama/templates/`:
+
+### Organization
+
+- **`types/`**: Base project structures (streaming, reflex, llamaindexserver)
+- **`components/`**: Reusable components across frameworks
+  - `engines/` - Chat and agent engines
+  - `loaders/` - File, web, database loaders
+  - `providers/` - AI model configurations
+  - `vectordbs/` - Vector database integrations
+  - `use-cases/` - Workflow implementations
+
+### Development Workflow
+
+- Templates support multiple frameworks (Next.js, Express, FastAPI)
+- Component system allows mix-and-match functionality
+- E2E tests validate generated projects work correctly
+
+## Server Framework Architecture
+
+### TypeScript Server (`@llamaindex/server`)
+
+- **Core**: `LlamaIndexServer` class wrapping Next.js with workflow support
+- **Frontend**: React-based chat UI with shadcn/ui components
+- **API**: `/api/chat` endpoint with streaming responses
+- **Build Process**: Complex multi-step build including static assets for Python integration
+
+### Python Server (`llama-index-server`)
+
+- **Core**: `LlamaIndexServer` class extending FastAPI
+- **Architecture**: Workflow factory pattern for stateless request handling
+- **UI Generation**: AI-powered React component generation from Pydantic schemas
+- **Development**: Hot reloading support with dev mode
+
+## Common Patterns
+
+### Workflow Integration
+
+Both server frameworks use factory patterns:
+
+```typescript
+// TypeScript
+const server = new LlamaIndexServer({
+  workflow: (context) => createWorkflow(context)
+});
+```
+
+```python
+# Python
+def create_workflow(chat_request: ChatRequest) -> Workflow:
+    return MyWorkflow(chat_request.messages)
+```
+
+### Event System
+
+Structured events for UI communication:
+
+- **UIEvent**: Custom components with Pydantic/Zod schemas
+- **ArtifactEvent**: Code/documents for Canvas panel
+- **SourceNodesEvent**: Document sources with metadata
+- **AgentRunEvent**: Tool usage and progress tracking
+
+### File Handling
+
+- Both servers auto-mount `data/` and `output/` directories
+- LlamaCloud integration for remote file access
+- Static file serving through framework-specific methods
+
+## Testing Strategy
+
+### E2E Testing
+
+- Playwright tests in `packages/create-llama/e2e/`
+- Tests both Python and TypeScript generated projects
+- Validates CLI generation and application functionality
+
+### Unit Testing
+
+- Python: pytest with comprehensive API and service tests
+- TypeScript: Integrated testing through build process
+
+## Build Process
+
+### Create-llama CLI
+
+1. TypeScript compilation with bash script
+2. ncc bundling for standalone executable
+3. Template validation and caching
+
+### Server Package Build
+
+1. **prebuild**: Clean directories
+2. **build**: bunchee compilation to ESM/CJS
+3. **postbuild**: Next.js preparation and static asset generation
+4. **prepare:py-static**: Python integration assets
+
+### Release Process
+
+```bash
+pnpm release     # Build all + publish npm packages + Python release
+```
+
+## Development Environment Setup
+
+### Prerequisites
+
+- Node.js >=16.14.0
+- Python with uv package manager
+- pnpm for package management
+
+### Common Workflow
+
+1. Clone repository and run `pnpm install`
+2. For CLI development: work in `packages/create-llama/`
+3. For server development: choose TypeScript or Python package
+4. Use `pnpm dev` for concurrent development across packages
+5. Run `pnpm e2e` to validate changes with generated projects
+
+## Special Considerations
+
+### Template Development
+
+- Changes to templates require rebuilding CLI
+- E2E tests validate template functionality across frameworks
+- Template caching system speeds up repeated builds
+
+### Cross-package Dependencies
+
+- Server package builds static assets for Python integration
+- Version synchronization between TypeScript and Python packages
+- Shared UI components and styling across implementations
+
+### Performance
+
+- CLI uses caching for template operations
+- Server frameworks support streaming responses
+- Background processing for file operations and LlamaCloud integration
@@ -55,7 +55,7 @@ Then re-start your app. Remember you'll need to re-run `generate` if you add new
 If you're using the Python backend, you can trigger indexing of your data by calling:

 ```bash
-poetry run generate
+uv run generate
 ```

 ## Customizing the AI models
@@ -106,28 +106,16 @@ Ok to proceed? (y) y
 You can also pass command line arguments to set up a new project
 non-interactively. For a list of the latest options, call `create-llama --help`.

-### Running in pro mode
-
-If you prefer more advanced customization options, you can run `create-llama` in pro mode using the `--pro` flag.
-
-In pro mode, instead of selecting a predefined use case, you'll be prompted to select each technical component of your project. This allows for greater flexibility in customizing your project, including:
-
- **Vector Store**: Choose from a variety of vector stores for keeping your documents, including MongoDB, Pinecone, Weaviate, Qdrant and Chroma.
- **Tools**: Choose from a variety of agent tools (functions called by the LLM), such as:
-  - Code Interpreter: Executes Python code in a secure Jupyter notebook environment
-  - Artifact Code Generator: Generates code artifacts that can be run in a sandbox
-  - OpenAPI Action: Facilitates requests to a provided OpenAPI schema
-  - Image Generator: Creates images based on text descriptions
-  - Web Search: Performs web searches to retrieve up-to-date information
- **Data Sources**: Integrate various data sources into your chat application, including local files, websites, or database-retrieved data.
- **Backend Options**: Besides using Next.js or FastAPI, you can also select to use Express for a more traditional Node.js application.
- **Observability**: Choose from a variety of LLM observability tools, including LlamaTrace and Traceloop.
-
-Pro mode is ideal for developers who want fine-grained control over their project's configuration and are comfortable with more technical setup options.
-
 ## LlamaIndex Documentation

 - [TS/JS docs](https://ts.llamaindex.ai/)
 - [Python docs](https://docs.llamaindex.ai/en/stable/)

+## LlamaIndex Server
+
+The generated code uses the LlamaIndex Server, which serves LlamaIndex Workflows and Agent Workflows via an API server. See the following docs for more information:
+
+- [LlamaIndex Server For TypeScript](./packages/server/README.md)
+- [LlamaIndex Server For Python](./python/llama-index-server/README.md)
+
 Inspired by and adapted from [create-next-app](https://github.com/vercel/next.js/tree/canary/packages/create-next-app)
@@ -1,233 +0,0 @@
-import { expect, test } from "@playwright/test";
-import { exec } from "child_process";
-import fs from "fs";
-import path from "path";
-import util from "util";
-import { TemplateFramework, TemplateVectorDB } from "../../helpers/types";
-import { RunCreateLlamaOptions, createTestDir, runCreateLlama } from "../utils";
-
-const execAsync = util.promisify(exec);
-
-const templateFramework: TemplateFramework = process.env.FRAMEWORK
-  ? (process.env.FRAMEWORK as TemplateFramework)
-  : "fastapi";
-const dataSource: string = process.env.DATASOURCE
-  ? process.env.DATASOURCE
-  : "--example-file";
-
-// TODO: add support for other templates
-
-if (
-  dataSource === "--example-file" // XXX: this test provides its own data source - only trigger it on one data source (usually the CI matrix will trigger multiple data sources)
-) {
-  // vectorDBs, tools, and data source combinations to test
-  const vectorDbs: TemplateVectorDB[] = [
-    "mongo",
-    "pg",
-    "pinecone",
-    "milvus",
-    "astra",
-    "qdrant",
-    "chroma",
-    "weaviate",
-  ];
-
-  const toolOptions = [
-    "wikipedia.WikipediaToolSpec",
-    "google.GoogleSearchToolSpec",
-    "document_generator",
-    "artifact",
-  ];
-
-  const dataSources = [
-    "--example-file",
-    "--web-source https://www.example.com",
-    "--db-source mysql+pymysql://user:pass@localhost:3306/mydb",
-  ];
-
-  const observabilityOptions = ["llamatrace", "traceloop"];
-
-  test.describe("Mypy check", () => {
-    test.describe.configure({ retries: 0 });
-
-    // Test vector databases
-    for (const vectorDb of vectorDbs) {
-      test(`Mypy check for vectorDB: ${vectorDb}`, async () => {
-        const cwd = await createTestDir();
-        const { pyprojectPath } = await createAndCheckLlamaProject({
-          options: {
-            cwd,
-            templateType: "streaming",
-            templateFramework,
-            dataSource: "--example-file",
-            vectorDb,
-            tools: "none",
-            port: 3000,
-            postInstallAction: "none",
-            templateUI: undefined,
-            appType: "--no-frontend",
-            llamaCloudProjectName: undefined,
-            llamaCloudIndexName: undefined,
-            observability: undefined,
-          },
-        });
-
-        const pyprojectContent = fs.readFileSync(pyprojectPath, "utf-8");
-        if (vectorDb !== "none") {
-          if (vectorDb === "pg") {
-            expect(pyprojectContent).toContain(
-              "llama-index-vector-stores-postgres",
-            );
-          } else {
-            expect(pyprojectContent).toContain(
-              `llama-index-vector-stores-${vectorDb}`,
-            );
-          }
-        }
-      });
-    }
-
-    // Test tools
-    for (const tool of toolOptions) {
-      test(`Mypy check for tool: ${tool}`, async () => {
-        const cwd = await createTestDir();
-        const { pyprojectPath } = await createAndCheckLlamaProject({
-          options: {
-            cwd,
-            templateType: "streaming",
-            templateFramework,
-            dataSource: "--example-file",
-            vectorDb: "none",
-            tools: tool,
-            port: 3000,
-            postInstallAction: "none",
-            templateUI: undefined,
-            appType: "--no-frontend",
-            llamaCloudProjectName: undefined,
-            llamaCloudIndexName: undefined,
-            observability: undefined,
-          },
-        });
-
-        const pyprojectContent = fs.readFileSync(pyprojectPath, "utf-8");
-        if (tool === "wikipedia.WikipediaToolSpec") {
-          expect(pyprojectContent).toContain("wikipedia");
-        }
-        if (tool === "google.GoogleSearchToolSpec") {
-          expect(pyprojectContent).toContain("google");
-        }
-      });
-    }
-
-    // Test data sources
-    for (const dataSource of dataSources) {
-      const dataSourceType = dataSource.split(" ")[0];
-      test(`Mypy check for data source: ${dataSourceType}`, async () => {
-        const cwd = await createTestDir();
-        const { pyprojectPath } = await createAndCheckLlamaProject({
-          options: {
-            cwd,
-            templateType: "streaming",
-            templateFramework,
-            dataSource,
-            vectorDb: "none",
-            tools: "none",
-            port: 3000,
-            postInstallAction: "none",
-            templateUI: undefined,
-            appType: "--no-frontend",
-            llamaCloudProjectName: undefined,
-            llamaCloudIndexName: undefined,
-            observability: undefined,
-          },
-        });
-
-        const pyprojectContent = fs.readFileSync(pyprojectPath, "utf-8");
-        if (dataSource.includes("--web-source")) {
-          expect(pyprojectContent).toContain("llama-index-readers-web");
-        }
-        if (dataSource.includes("--db-source")) {
-          expect(pyprojectContent).toContain("llama-index-readers-database");
-        }
-      });
-    }
-
-    // Test observability options
-    for (const observability of observabilityOptions) {
-      test(`Mypy check for observability: ${observability}`, async () => {
-        const cwd = await createTestDir();
-
-        const { pyprojectPath } = await createAndCheckLlamaProject({
-          options: {
-            cwd,
-            templateType: "streaming",
-            templateFramework,
-            dataSource: "--example-file",
-            vectorDb: "none",
-            tools: "none",
-            port: 3000,
-            postInstallAction: "none",
-            templateUI: undefined,
-            appType: "--no-frontend",
-            llamaCloudProjectName: undefined,
-            llamaCloudIndexName: undefined,
-            observability,
-          },
-        });
-      });
-    }
-  });
-}
-
-async function createAndCheckLlamaProject({
-  options,
-}: {
-  options: RunCreateLlamaOptions;
-}): Promise<{ pyprojectPath: string; projectPath: string }> {
-  const result = await runCreateLlama(options);
-  const name = result.projectName;
-  const projectPath = path.join(options.cwd, name);
-
-  // Check if the app folder exists
-  expect(fs.existsSync(projectPath)).toBeTruthy();
-
-  // Check if pyproject.toml exists
-  const pyprojectPath = path.join(projectPath, "pyproject.toml");
-  expect(fs.existsSync(pyprojectPath)).toBeTruthy();
-
-  const env = {
-    ...process.env,
-    POETRY_VIRTUALENVS_IN_PROJECT: "true",
-  };
-
-  // Run poetry install
-  try {
-    const { stdout: installStdout, stderr: installStderr } = await execAsync(
-      "poetry install",
-      { cwd: projectPath, env },
-    );
-    console.log("poetry install stdout:", installStdout);
-    console.error("poetry install stderr:", installStderr);
-  } catch (error) {
-    console.error("Error running poetry install:", error);
-    throw error;
-  }
-
-  // Run poetry run mypy
-  try {
-    const { stdout: mypyStdout, stderr: mypyStderr } = await execAsync(
-      "poetry run mypy .",
-      { cwd: projectPath, env },
-    );
-    console.log("poetry run mypy stdout:", mypyStdout);
-    console.error("poetry run mypy stderr:", mypyStderr);
-  } catch (error) {
-    console.error("Error running mypy:", error);
-    throw error;
-  }
-
-  // If we reach this point without throwing an error, the test passes
-  expect(true).toBeTruthy();
-
-  return { pyprojectPath, projectPath };
-}
@@ -1,105 +0,0 @@
-import { expect, test } from "@playwright/test";
-import { exec } from "child_process";
-import fs from "fs";
-import path from "path";
-import util from "util";
-import { TemplateFramework, TemplateVectorDB } from "../../helpers/types";
-import { createTestDir, runCreateLlama } from "../utils";
-
-const execAsync = util.promisify(exec);
-
-const templateFramework: TemplateFramework = process.env.FRAMEWORK
-  ? (process.env.FRAMEWORK as TemplateFramework)
-  : "nextjs";
-const dataSource: string = process.env.DATASOURCE
-  ? process.env.DATASOURCE
-  : "--example-file";
-
-// vectorDBs combinations to test
-const vectorDbs: TemplateVectorDB[] = [
-  "mongo",
-  "pg",
-  "qdrant",
-  "pinecone",
-  "milvus",
-  "astra",
-  "chroma",
-  "llamacloud",
-  "weaviate",
-];
-
-test.describe("Test resolve TS dependencies", () => {
-  // Test vector DBs without LlamaParse
-  for (const vectorDb of vectorDbs) {
-    const optionDescription = `vectorDb: ${vectorDb}, dataSource: ${dataSource}`;
-
-    test(`Vector DB test - ${optionDescription}`, async () => {
-      await runTest(vectorDb, false);
-    });
-  }
-
-  // Test LlamaParse with vectorDB 'none'
-  test(`LlamaParse test - vectorDb: none, dataSource: ${dataSource}, llamaParse: true`, async () => {
-    await runTest("none", true);
-  });
-
-  async function runTest(
-    vectorDb: TemplateVectorDB | "none",
-    useLlamaParse: boolean,
-  ) {
-    const cwd = await createTestDir();
-
-    const result = await runCreateLlama({
-      cwd: cwd,
-      templateType: "streaming",
-      templateFramework: templateFramework,
-      dataSource: dataSource,
-      vectorDb: vectorDb,
-      port: 3000,
-      postInstallAction: "none",
-      templateUI: undefined,
-      appType: templateFramework === "nextjs" ? "" : "--no-frontend",
-      llamaCloudProjectName: undefined,
-      llamaCloudIndexName: undefined,
-      tools: undefined,
-      useLlamaParse: useLlamaParse,
-    });
-    const name = result.projectName;
-
-    // Check if the app folder exists
-    const appDir = path.join(cwd, name);
-    const dirExists = fs.existsSync(appDir);
-    expect(dirExists).toBeTruthy();
-
-    // Install dependencies using pnpm
-    try {
-      const { stderr: installStderr } = await execAsync(
-        "pnpm install --prefer-offline",
-        {
-          cwd: appDir,
-        },
-      );
-    } catch (error) {
-      console.error("Error installing dependencies:", error);
-      throw error;
-    }
-
-    // Run tsc type check and capture the output
-    try {
-      const { stdout, stderr } = await execAsync(
-        "pnpm exec tsc -b --diagnostics",
-        {
-          cwd: appDir,
-        },
-      );
-      // Check if there's any error output
-      expect(stderr).toBeFalsy();
-
-      // Log the stdout for debugging purposes
-      console.log("TypeScript type-check output:", stdout);
-    } catch (error) {
-      console.error("Error running tsc:", error);
-      throw error;
-    }
-  }
-});
@@ -0,0 +1,65 @@
+import eslint from "@eslint/js";
+import eslintConfigPrettier from "eslint-config-prettier";
+import globals from "globals";
+import tseslint from "typescript-eslint";
+
+export default tseslint.config(
+  eslint.configs.recommended,
+  ...tseslint.configs.recommended,
+  eslintConfigPrettier,
+  {
+    languageOptions: {
+      ecmaVersion: 2022,
+      sourceType: "module",
+      globals: {
+        ...globals.browser,
+        ...globals.node,
+      },
+    },
+  },
+  {
+    files: ["packages/create-llama/**"],
+    rules: {
+      "max-params": ["error", 4],
+      "prefer-const": "error",
+      "no-empty": "off",
+      "no-extra-boolean-cast": "off",
+      "@typescript-eslint/no-explicit-any": "off",
+      "@typescript-eslint/no-unused-vars": "off",
+      "@typescript-eslint/no-empty-object-type": "off",
+      "@typescript-eslint/no-wrapper-object-types": "off",
+      "@typescript-eslint/ban-ts-comment": "off",
+    },
+  },
+  {
+    files: ["packages/server/**"],
+    rules: {
+      "no-irregular-whitespace": "off",
+      "@typescript-eslint/no-unused-vars": "off",
+      "@typescript-eslint/no-explicit-any": [
+        "error",
+        {
+          ignoreRestArgs: true,
+        },
+      ],
+    },
+  },
+  {
+    ignores: [
+      "python/**",
+      "**/*.mypy_cache/**",
+      "**/*.venv/**",
+      "**/*.ruff_cache/**",
+      "**/dist/**",
+      "**/e2e/cache/**",
+      "**/lib/*",
+      "**/.next/**",
+      "**/out/**",
+      "**/node_modules/**",
+      "**/build/**",
+      "packages/server/server/**",
+      "packages/server/project/**",
+      "packages/server/bin/**",
+    ],
+  },
+);
@@ -1,136 +0,0 @@
-# LlamaIndex Server
-
-LlamaIndexServer is a FastAPI-based application that allows you to quickly launch your [LlamaIndex Workflows](https://docs.llamaindex.ai/en/stable/module_guides/workflow/#workflows) and [Agent Workflows](https://docs.llamaindex.ai/en/stable/understanding/agent/multi_agent/) as an API server with an optional chat UI. It provides a complete environment for running LlamaIndex workflows with both API endpoints and a user interface for interaction.
-
-## Features
-
- Serving a workflow as a chatbot
- Built on FastAPI for high performance and easy API development
- Optional built-in chat UI with extendable UI components
- Prebuilt development code
-
-## Installation
-
-```bash
-pip install llama-index-server
-```
-
-## Quick Start
-
-```python
-# main.py
-from llama_index.core.agent.workflow import AgentWorkflow
-from llama_index.core.workflow import Workflow
-from llama_index.core.tools import FunctionTool
-from llama_index.server import LlamaIndexServer
-
-
-# Define a factory function that returns a Workflow or AgentWorkflow
-def create_workflow() -> Workflow:
-    def fetch_weather(city: str) -> str:
-        return f"The weather in {city} is sunny"
-
-    return AgentWorkflow.from_tools(
-        tools=[
-            FunctionTool.from_defaults(
-                fn=fetch_weather,
-            )
-        ]
-    )
-
-
-# Create an API server for the workflow
-app = LlamaIndexServer(
-    workflow_factory=create_workflow,  # Supports Workflow or AgentWorkflow
-    env="dev",  # Enable development mode
-    include_ui=True,  # Include chat UI
-    starter_questions=["What can you do?", "How do I use this?"],
-    verbose=True
-)
-```
-
-## Running the Server
-
- In the same directory as `main.py`, run the following command to start the server:
-
-  ```bash
-  fastapi dev
-  ```
-
- Making a request to the server:
-
-  ```bash
-  curl -X POST "http://localhost:8000/api/chat" -H "Content-Type: application/json" -d '{"message": "What is the weather in Tokyo?"}'
-  ```
-
- See the API documentation at `http://localhost:8000/docs`
- Access the chat UI at `http://localhost:8000/` (make sure you set `env="dev"` or `include_ui=True` in the server configuration)
-
-## Configuration Options
-
-The LlamaIndexServer accepts the following configuration parameters:
-
- `workflow_factory`: A callable that creates a workflow instance for each request
- `logger`: Optional logger instance (defaults to uvicorn logger)
- `use_default_routers`: Whether to include default routers (chat, static file serving)
- `env`: Environment setting ('dev' enables CORS and UI by default)
- `include_ui`: Whether to include the chat UI
- `component_dir`: The directory for custom UI components rendering events emitted by the workflow. The default is None, which does not render custom UI components.
- `starter_questions`: List of starter questions for the chat UI
- `verbose`: Enable verbose logging
- `api_prefix`: API route prefix (default: "/api")
- `server_url`: The deployment URL of the server (default is None)
- `ui_path`: Path for downloaded UI static files (default: ".ui")
-
-## Default Routers and Features
-
-### Chat Router
-
-The server includes a default chat router at `/api/chat` for handling chat interactions.
-
-### Static File Serving
-
- The server automatically mounts the `data` and `output` folders at `{server_url}{api_prefix}/files/data` (default: `/api/files/data`) and `{server_url}{api_prefix}/files/output` (default: `/api/files/output`) respectively.
- Your workflows can use both folders to store and access files. As a convention, the `data` folder is used for documents that are ingested and the `output` folder is used for documents that are generated by the workflow.
- The example workflows from `create-llama` (see below) follow this pattern.
-
-### Chat UI
-
-When enabled, the server provides a chat interface at the root path (`/`) with:
-
- Configurable starter questions
- Real-time chat interface
- API endpoint integration
-
-### Custom UI Components
-
-You can add custom UI components for your workflow by providing `component_dir` config and adding custom .jsx or .tsx files to the directory.
-See [Custom UI Components](docs/custom_ui_component.md) for more details.
-
-## Development Mode
-
-In development mode (`env="dev"`), the server:
-
- Enables CORS for all origins
- Automatically includes the chat UI
- Provides more verbose logging
-
-## API Endpoints
-
-The server provides the following default endpoints:
-
- `/api/chat`: Chat interaction endpoint
- `/api/files/data/*`: Access to data directory files
- `/api/files/output/*`: Access to output directory files
-
-## Best Practices
-
-1. Always provide a workflow factory that creates fresh workflow instances
-2. Use environment variables for sensitive configuration
-3. Enable verbose logging during development
-4. Configure CORS appropriately for your deployment environment
-5. Use starter questions to guide users in the chat UI
-
-## Getting Started with a New Project
-
-Want to start a new project with LlamaIndexServer? Check out our [create-llama](https://github.com/run-llama/create-llama) tool to quickly generate a new project with LlamaIndexServer.
@@ -1,67 +0,0 @@
-# Custom UI Components
-
-The LlamaIndex server provides support for rendering workflow events using custom UI components, allowing you to extend and customize the chat interface.
-
-## Overview
-
-Custom UI components are a powerful feature that enables you to:
-
- Add custom interface elements to the chat UI using React JSX or TSX files
- Extend the default chat interface functionality
- Create specialized visualizations or interactions
-
-## Configuration
-
-### Workflow events
-
-Your workflow must emit events that fit this structure, allowing the LlamaIndex server to display the right UI components based on the event type.
-
-```json
-{
-    "type": "<event_name>",
-    "data": <data model>
-}
-```
-
-In Pydantic, this is equivalent to:
-
-```python
-from pydantic import BaseModel
-from typing import Literal, Any
-
-class MyCustomEvent(BaseModel):
-    type: Literal["<my_custom_event_name>"]
-    data: dict | Any
-
-    def to_response(self):
-        return self.model_dump()
-```
-
-### Server Setup
-
-1. Initialize the LlamaIndex server with a component directory:
-
-```python
-server = LlamaIndexServer(
-    workflow_factory=your_workflow,
-    component_dir="path/to/components",
-    include_ui=True
-)
-```
-
-2. Add the custom component code to the directory following the naming pattern:
-
-   - File Extension: `.jsx` or `.tsx` for React components
-   - File Name: Should match the event type from your workflow (e.g., `deep_research_event.jsx` for handling `deep_research_event` type that you defined in your workflow). If there are TSX and JSX files with the same name, the TSX file will be used.
-   - Component Name: Export a default React component named `Component` that receives props from the event data
-
-   Example component structure:
-
-   ```jsx
-   function Component({ events }) {
-       // Your component logic here
-       return (
-           // Your UI code here
-       );
-   }
-   ```
@@ -1,3 +0,0 @@
-from .server import LlamaIndexServer
-
-__all__ = ["LlamaIndexServer"]
@@ -1,32 +0,0 @@
-from typing import Any
-
-from llama_index.core.agent.workflow.workflow_events import ToolCallResult
-from llama_index.server.api.callbacks.base import EventCallback
-from llama_index.server.api.models import SourceNodesEvent
-
-
-class SourceNodesFromToolCall(EventCallback):
-    """
-    Extract source nodes from the query tool output.
-
-    Args:
-        query_tool_name: The name of the tool that queries the index.
-                         default is "query_index"
-    """
-
-    def __init__(self, query_tool_name: str = "query_index"):
-        self.query_tool_name = query_tool_name
-
-    def transform_tool_call_result(self, event: ToolCallResult) -> SourceNodesEvent:
-        source_nodes = event.tool_output.raw_output.source_nodes
-        return SourceNodesEvent(nodes=source_nodes)
-
-    async def run(self, event: Any) -> Any:
-        if isinstance(event, ToolCallResult):
-            if event.tool_name == self.query_tool_name:
-                return event, self.transform_tool_call_result(event)
-        return event
-
-    @classmethod
-    def from_default(cls, *args: Any, **kwargs: Any) -> "SourceNodesFromToolCall":
-        return cls()
@@ -1,142 +0,0 @@
-import logging
-import os
-from enum import Enum
-from typing import Any, Dict, List, Optional
-
-from llama_index.core.schema import NodeWithScore
-from llama_index.core.types import ChatMessage, MessageRole
-from llama_index.core.workflow import Event
-from llama_index.server.settings import server_settings
-from pydantic import BaseModel, Field, field_validator
-
-logger = logging.getLogger("uvicorn")
-
-
-class ChatConfig(BaseModel):
-    next_question_suggestions: bool = Field(
-        default=True,
-        description="Whether to suggest next questions",
-    )
-
-
-class ChatAPIMessage(BaseModel):
-    role: MessageRole
-    content: str
-
-    def to_llamaindex_message(self) -> ChatMessage:
-        return ChatMessage(role=self.role, content=self.content)
-
-
-class ChatRequest(BaseModel):
-    messages: List[ChatAPIMessage]
-    data: Optional[Any] = None
-    config: Optional[ChatConfig] = ChatConfig()
-
-    @field_validator("messages")
-    def validate_messages(cls, v: List[ChatAPIMessage]) -> List[ChatAPIMessage]:
-        if v[-1].role != MessageRole.USER:
-            raise ValueError("Last message must be from user")
-        return v
-
-
-class AgentRunEventType(Enum):
-    TEXT = "text"
-    PROGRESS = "progress"
-
-
-class AgentRunEvent(Event):
-    name: str
-    msg: str
-    event_type: AgentRunEventType = AgentRunEventType.TEXT
-    data: Optional[dict] = None
-
-    def to_response(self) -> dict:
-        return {
-            "type": "agent",
-            "data": {
-                "agent": self.name,
-                "type": self.event_type.value,
-                "text": self.msg,
-                "data": self.data,
-            },
-        }
-
-
-class SourceNodesEvent(Event):
-    nodes: List[NodeWithScore]
-
-    def to_response(self) -> dict:
-        return {
-            "type": "sources",
-            "data": {
-                "nodes": [
-                    SourceNodes.from_source_node(node).model_dump()
-                    for node in self.nodes
-                ]
-            },
-        }
-
-
-class SourceNodes(BaseModel):
-    id: str
-    metadata: Dict[str, Any]
-    score: Optional[float]
-    text: str
-    url: Optional[str]
-
-    @classmethod
-    def from_source_node(cls, source_node: NodeWithScore) -> "SourceNodes":
-        metadata = source_node.node.metadata
-        url = cls.get_url_from_metadata(metadata)
-
-        return cls(
-            id=source_node.node.node_id,
-            metadata=metadata,
-            score=source_node.score,
-            text=source_node.node.text,  # type: ignore
-            url=url,
-        )
-
-    @classmethod
-    def get_url_from_metadata(
-        cls,
-        metadata: Dict[str, Any],
-        data_dir: Optional[str] = None,
-    ) -> Optional[str]:
-        url_prefix = server_settings.file_server_url_prefix
-        if data_dir is None:
-            data_dir = "data"
-        file_name = metadata.get("file_name")
-
-        if file_name and url_prefix:
-            # file_name exists and file server is configured
-            pipeline_id = metadata.get("pipeline_id")
-            if pipeline_id:
-                # file is from LlamaCloud
-                file_name = f"{pipeline_id}${file_name}"
-                return f"{url_prefix}/output/llamacloud/{file_name}"
-            is_private = metadata.get("private", "false") == "true"
-            if is_private:
-                # file is a private upload
-                return f"{url_prefix}/output/uploaded/{file_name}"
-            # file is from calling the 'generate' script
-            # Get the relative path of file_path to data_dir
-            file_path = metadata.get("file_path")
-            data_dir = os.path.abspath(data_dir)
-            if file_path and data_dir:
-                relative_path = os.path.relpath(file_path, data_dir)
-                return f"{url_prefix}/data/{relative_path}"
-        # fallback to URL in metadata (e.g. for websites)
-        return metadata.get("URL")
-
-    @classmethod
-    def from_source_nodes(
-        cls, source_nodes: List[NodeWithScore]
-    ) -> List["SourceNodes"]:
-        return [cls.from_source_node(node) for node in source_nodes]
-
-
-class ComponentDefinition(BaseModel):
-    type: str
-    code: str
-    filename: str
@@ -1,4 +0,0 @@
-from llama_index.server.api.routers.chat import chat_router
-from llama_index.server.api.routers.ui import custom_components_router
-
-__all__ = ["chat_router", "custom_components_router"]
@@ -1,20 +0,0 @@
-import logging
-from typing import List
-
-from fastapi import APIRouter
-from llama_index.server.api.models import ComponentDefinition
-from llama_index.server.services.custom_ui import CustomUI
-
-
-def custom_components_router(
-    component_dir: str,
-    logger: logging.Logger,
-) -> APIRouter:
-    router = APIRouter(prefix="/components")
-
-    @router.get("")
-    async def components() -> List[ComponentDefinition]:
-        custom_ui = CustomUI(component_dir=component_dir, logger=logger)
-        return custom_ui.get_components()
-
-    return router
@@ -1,55 +0,0 @@
-import logging
-import shutil
-from pathlib import Path
-from typing import Optional
-
-import requests
-
-CHAT_UI_VERSION = "0.0.9"
-
-
-def download_chat_ui(
-    logger: Optional[logging.Logger] = None, target_path: str = ".ui"
-) -> None:
-    if logger is None:
-        logger = logging.getLogger("uvicorn")
-    path = Path(target_path)
-    temp_dir = _download_package(_get_download_link(CHAT_UI_VERSION))
-    _copy_ui_files(temp_dir, path)
-    logger.info("Chat UI downloaded and copied to static folder")
-
-
-def _get_download_link(version: str) -> str:
-    """Get the download link for the chat UI from the npm registry."""
-    return f"https://registry.npmjs.org/@llamaindex/server/-/server-{version}.tgz"
-
-
-def _download_package(url: str) -> Path:
-    """Download tar.gz file and extract all files into a temporary directory."""
-    import io
-    import tarfile
-    import tempfile
-
-    response = requests.get(url, headers={"User-Agent": "Mozilla/5.0"})
-    content = response.content
-
-    temp_dir = Path(tempfile.mkdtemp())
-
-    with tarfile.open(fileobj=io.BytesIO(content), mode="r:gz") as tar:
-        tar.extractall(path=temp_dir)
-
-    return temp_dir
-
-
-def _copy_ui_files(temp_dir: Path, target_path: Path) -> None:
-    """Copy files from the .next directory to the static directory."""
-    target_path.mkdir(parents=True, exist_ok=True)
-    next_dir = temp_dir / "package/dist/static"
-
-    if next_dir.exists():
-        for item in next_dir.iterdir():
-            dest = target_path / item.name
-            if item.is_dir():
-                shutil.copytree(item, dest, dirs_exist_ok=True)
-            else:
-                shutil.copy2(item, dest)
@@ -1,208 +0,0 @@
-import json
-import logging
-import os
-from typing import Any, Callable, Optional
-
-from fastapi import FastAPI
-from fastapi.middleware.cors import CORSMiddleware
-from fastapi.staticfiles import StaticFiles
-from llama_index.core.workflow import Workflow
-from llama_index.server.api.routers import chat_router, custom_components_router
-from llama_index.server.chat_ui import download_chat_ui
-from llama_index.server.settings import server_settings
-
-
-class LlamaIndexServer(FastAPI):
-    workflow_factory: Callable[..., Workflow]
-    include_ui: Optional[bool]
-    starter_questions: Optional[list[str]]
-    verbose: bool = False
-    ui_path: str = ".ui"
-    component_dir: Optional[str] = None
-
-    def __init__(
-        self,
-        workflow_factory: Callable[..., Workflow],
-        logger: Optional[logging.Logger] = None,
-        use_default_routers: Optional[bool] = True,
-        env: Optional[str] = None,
-        include_ui: Optional[bool] = None,
-        component_dir: Optional[str] = None,
-        starter_questions: Optional[list[str]] = None,
-        server_url: Optional[str] = None,
-        api_prefix: Optional[str] = None,
-        verbose: bool = False,
-        *args: Any,
-        **kwargs: Any,
-    ):
-        """
-        Initialize the LlamaIndexServer.
-
-        Args:
-            workflow_factory: A factory function that creates a workflow instance for each request.
-            logger: The logger to use.
-            use_default_routers: Whether to use the default routers (chat, mount `data` and `output` directories).
-            env: The environment to run the server in.
-            include_ui: Whether to show an chat UI in the root path.
-            component_dir: The directory to custom UI components code.
-            starter_questions: A list of starter questions to display in the chat UI.
-            server_url: The URL of the server.
-            api_prefix: The prefix for the API endpoints.
-            verbose: Whether to show verbose logs.
-        """
-        super().__init__(*args, **kwargs)
-
-        self.workflow_factory = workflow_factory
-        self.logger = logger or logging.getLogger("uvicorn")
-        self.verbose = verbose
-        self.include_ui = include_ui  # Store the explicitly passed value first
-        self.starter_questions = starter_questions
-        self.use_default_routers = use_default_routers or True
-        if component_dir:
-            self.component_dir = component_dir
-
-        # Update the settings
-        if server_url:
-            server_settings.set_url(server_url)
-        if api_prefix:
-            server_settings.set_api_prefix(api_prefix)
-
-        if self.use_default_routers:
-            self.add_default_routers()
-
-        if str(env).lower() == "dev":
-            self.allow_cors("*")
-            if self.include_ui is None:
-                self.include_ui = True
-
-        if self.include_ui is None:
-            self.include_ui = False
-
-        if self.include_ui:
-            self.mount_ui()
-
-    @property
-    def _ui_config(self) -> dict:
-        config = {
-            "CHAT_API": f"{server_settings.api_url}/chat",
-            "STARTER_QUESTIONS": self.starter_questions,
-        }
-        is_llamacloud_configured = os.getenv("LLAMA_CLOUD_API_KEY") is not None
-        if is_llamacloud_configured:
-            config["LLAMA_CLOUD_API"] = (
-                f"{server_settings.api_url}/chat/config/llamacloud"
-            )
-        if self.component_dir:
-            config["COMPONENTS_API"] = f"{server_settings.api_url}/components"
-        return config
-
-    # Default routers
-    def add_default_routers(self) -> None:
-        self.add_chat_router()
-        self.mount_data_dir()
-        self.mount_output_dir()
-
-    def add_chat_router(self) -> None:
-        """
-        Add the chat router.
-        """
-        self.include_router(
-            chat_router(
-                self.workflow_factory,
-                self.logger,
-            ),
-            prefix=server_settings.api_prefix,
-        )
-
-    def add_components_router(self) -> None:
-        """
-        Add the UI router.
-        """
-        if self.component_dir is None:
-            raise ValueError("component_dir must be specified to add components router")
-
-        self.include_router(
-            custom_components_router(self.component_dir, self.logger),
-            prefix=server_settings.api_prefix,
-        )
-
-    def mount_ui(self) -> None:
-        """
-        Mount the UI.
-        """
-        if self.include_ui:
-            if self.component_dir:
-                if not os.path.exists(self.component_dir):
-                    os.makedirs(self.component_dir)
-                self.add_components_router()
-            # Check if the static folder exists
-            if not os.path.exists(self.ui_path):
-                self.logger.warning(
-                    f"UI files not found, downloading UI to {self.ui_path}"
-                )
-                download_chat_ui(logger=self.logger, target_path=self.ui_path)
-            self._mount_static_files(directory=self.ui_path, path="/", html=True)
-            self._override_ui_config()
-
-    def _override_ui_config(self) -> None:
-        """
-        Override the UI config by writing a complete configuration file.
-        """
-        try:
-            config_path = os.path.join(self.ui_path, "config.js")
-            if not os.path.exists(config_path):
-                self.logger.error("Config file not found")
-                return
-            config_content = (
-                f"window.LLAMAINDEX = {json.dumps(self._ui_config, indent=2)};"
-            )
-            with open(config_path, "w") as f:
-                f.write(config_content)
-        except Exception as e:
-            self.logger.error(f"Error overriding UI config: {e}")
-
-    def mount_data_dir(self, data_dir: str = "data") -> None:
-        """
-        Mount the data directory.
-        """
-        self._mount_static_files(
-            directory=data_dir,
-            path=f"{server_settings.api_prefix}/files/data",
-            html=True,
-        )
-
-    def mount_output_dir(self, output_dir: str = "output") -> None:
-        """
-        Mount the output directory.
-        """
-        self._mount_static_files(
-            directory=output_dir,
-            path=f"{server_settings.api_prefix}/files/output",
-            html=True,
-        )
-
-    def _mount_static_files(
-        self, directory: str, path: str, html: bool = False
-    ) -> None:
-        """
-        Mount static files from a directory if it exists.
-        """
-        if os.path.exists(directory):
-            self.logger.info(f"Mounting static files '{directory}' at '{path}'")
-            self.mount(
-                path,
-                StaticFiles(directory=directory, check_dir=False, html=html),
-                name=f"{directory}-static",
-            )
-
-    def allow_cors(self, origin: str = "*") -> None:
-        """
-        Allow CORS for a specific origin.
-        """
-        self.add_middleware(
-            CORSMiddleware,
-            allow_origins=[origin],
-            allow_credentials=True,
-            allow_methods=["*"],
-            allow_headers=["*"],
-        )
@@ -1,117 +0,0 @@
-import logging
-import os
-import re
-import uuid
-from pathlib import Path
-from typing import List, Optional, Union
-
-from llama_index.server.settings import server_settings
-from pydantic import BaseModel, Field
-
-logger = logging.getLogger(__name__)
-
-PRIVATE_STORE_PATH = str(Path("output", "uploaded"))
-TOOL_STORE_PATH = str(Path("output", "tools"))
-LLAMA_CLOUD_STORE_PATH = str(Path("output", "llamacloud"))
-
-
-class DocumentFile(BaseModel):
-    id: str
-    name: str  # Stored file name
-    type: Optional[str] = None
-    size: Optional[int] = None
-    url: Optional[str] = None
-    path: Optional[str] = Field(
-        None,
-        description="The stored file path. Used internally in the server.",
-        exclude=True,
-    )
-    refs: Optional[List[str]] = Field(
-        None, description="The document ids in the index."
-    )
-
-
-class FileService:
-    """
-    To store the files uploaded by the user.
-    """
-
-    @classmethod
-    def save_file(
-        cls,
-        content: Union[bytes, str],
-        file_name: str,
-        save_dir: Optional[str] = None,
-    ) -> DocumentFile:
-        """
-        Save the content to a file in the local file server (accessible via URL).
-
-        Args:
-            content (bytes | str): The content to save, either bytes or string.
-            file_name (str): The original name of the file.
-            save_dir (Optional[str]): The relative path from the current working directory. Defaults to the `output/uploaded` directory.
-
-        Returns:
-            The metadata of the saved file.
-        """
-        if save_dir is None:
-            save_dir = os.path.join("output", "uploaded")
-
-        file_id = str(uuid.uuid4())
-        name, extension = os.path.splitext(file_name)
-        extension = extension.lstrip(".")
-        sanitized_name = _sanitize_file_name(name)
-        if extension == "":
-            raise ValueError("File is not supported!")
-        new_file_name = f"{sanitized_name}_{file_id}.{extension}"
-
-        file_path = os.path.join(save_dir, new_file_name)
-
-        if isinstance(content, str):
-            content = content.encode()
-
-        try:
-            os.makedirs(os.path.dirname(file_path), exist_ok=True)
-            with open(file_path, "wb") as file:
-                file.write(content)
-        except PermissionError as e:
-            logger.error(f"Permission denied when writing to file {file_path}: {e!s}")
-            raise
-        except OSError as e:
-            logger.error(f"IO error occurred when writing to file {file_path}: {e!s}")
-            raise
-        except Exception as e:
-            logger.error(f"Unexpected error when writing to file {file_path}: {e!s}")
-            raise
-
-        logger.info(f"Saved file to {file_path}")
-
-        file_size = os.path.getsize(file_path)
-        file_url = (
-            f"{server_settings.file_server_url_prefix}/{save_dir}/{new_file_name}"
-        )
-        return DocumentFile(
-            id=file_id,
-            name=new_file_name,
-            type=extension,
-            size=file_size,
-            path=file_path,
-            url=file_url,
-            refs=None,
-        )
-
-    @classmethod
-    def get_file_url(cls, file_name: str, save_dir: Optional[str] = None) -> str:
-        """
-        Get the URL of a file.
-        """
-        if save_dir is None:
-            save_dir = os.path.join("output", "uploaded")
-        return f"{server_settings.file_server_url_prefix}/{save_dir}/{file_name}"
-
-
-def _sanitize_file_name(file_name: str) -> str:
-    """
-    Sanitize the file name by replacing every character other than ASCII letters, digits and dots with an underscore.
-    """
-    return re.sub(r"[^a-zA-Z0-9.]", "_", file_name)
@@ -1,3 +0,0 @@
-from .query import get_query_engine_tool
-
-__all__ = ["get_query_engine_tool"]
@@ -1,64 +0,0 @@
-[build-system]
-build-backend = "poetry.core.masonry.api"
-requires = ["poetry-core"]
-
-[tool.codespell]
-check-filenames = true
-check-hidden = true
-# Feel free to un-skip examples, and experimental, you will just need to
-# work through many typos (--write-changes and --interactive will help)
-skip = "*.csv,*.html,*.json,*.jsonl,*.pdf,*.txt,*.ipynb"
-
-[tool.mypy]
-disallow_untyped_defs = true
-# Remove venv skip when integrated with pre-commit
-exclude = ["_static", "build", "examples", "notebooks", "venv"]
-ignore_missing_imports = true
-namespace_packages = true
-explicit_package_bases = true
-python_version = "3.10"
-
-[tool.poetry]
-authors = ["Your Name <you@example.com>"]
-description = "llama-index fastapi server"
-exclude = ["**/BUILD"]
-license = "MIT"
-name = "llama-index-server"
-packages = [{include = "llama_index/"}]
-readme = "README.md"
-version = "0.1.9"
-
-[tool.poetry.dependencies]
-python = ">=3.9,<4.0"
-fastapi = {extras = ["standard"], version = "^0.115.11"}
-cachetools = "^5.5.2"
-requests = "^2.32.3"
-pydantic-settings = "^2.8.1"
-llama-index-core = "0.12.28"
-llama-index-readers-file = "^0.4.6"
-llama-index-indices-managed-llama-cloud = "0.6.3"
-
-[tool.poetry.group.dev.dependencies]
-black = {extras = ["jupyter"], version = "<=23.9.1,>=23.7.0"}
-codespell = {extras = ["toml"], version = ">=v2.2.6"}
-e2b-code-interpreter = "^1.1.1"
-ipython = "8.10.0"
-jupyter = "^1.0.0"
-markdown = "^3.7"
-mypy = "1.15.0"
-pre-commit = "3.2.0"
-pylint = "2.15.10"
-pytest = "^8.3.5"
-pytest-asyncio = "^0.25.3"
-pytest-mock = "3.11.1"
-ruff = "0.0.292"
-tree-sitter-languages = "^1.8.0"
-types-Deprecated = ">=0.1.0"
-types-PyYAML = "^6.0.12.12"
-types-protobuf = "^4.24.0.4"
-types-redis = "4.5.5.0"
-types-requests = "2.28.11.8"  # TODO: unpin when mypy>0.991
-types-setuptools = "67.1.0.0"
-xhtml2pdf = "^0.2.17"
-pytest-cov = "^6.0.0"
-llama-cloud = "^0.1.17"
@@ -1,201 +0,0 @@
-import pytest
-from httpx import ASGITransport, AsyncClient
-from llama_index.core.agent.workflow import AgentWorkflow
-from llama_index.core.llms import MockLLM
-from llama_index.server import LlamaIndexServer
-
-
-def fetch_weather(city: str) -> str:
-    """Fetch the weather for a given city."""
-    return f"The weather in {city} is sunny."
-
-
-def _agent_workflow() -> AgentWorkflow:
-    # Use MockLLM instead of default OpenAI
-    mock_llm = MockLLM()
-    return AgentWorkflow.from_tools_or_functions(
-        tools_or_functions=[fetch_weather],
-        verbose=True,
-        llm=mock_llm,
-    )
-
-
-@pytest.fixture()
-def server() -> LlamaIndexServer:
-    """Fixture to create a LlamaIndexServer instance."""
-    return LlamaIndexServer(
-        workflow_factory=_agent_workflow,
-        verbose=True,
-        use_default_routers=True,
-        mount_ui=False,
-        env="dev",
-    )
-
-
-@pytest.mark.asyncio()
-async def test_server_has_chat_route(server: LlamaIndexServer) -> None:
-    """Test that the server has the chat API route."""
-    chat_route_exists = any(route.path == "/api/chat" for route in server.routes)
-    assert chat_route_exists, "Chat API route not found in server routes"
-
-
-@pytest.mark.asyncio()
-async def test_server_swagger_docs(server: LlamaIndexServer) -> None:
-    """Test that the server serves Swagger UI docs."""
-    async with AsyncClient(
-        transport=ASGITransport(app=server), base_url="http://test"
-    ) as ac:
-        response = await ac.get("/docs")
-        assert response.status_code == 200
-        assert "text/html" in response.headers["content-type"]
-        assert "Swagger UI" in response.text
-
-
-@pytest.mark.asyncio()
-async def test_ui_is_downloaded(server: LlamaIndexServer) -> None:
-    """
-    Test if the UI is downloaded and mounted correctly.
-    """
-    import os
-    import shutil
-
-    # Clean up any existing static directory first
-    if os.path.exists(".ui"):
-        shutil.rmtree(".ui")
-
-    # Create a new server with UI enabled
-    ui_server = LlamaIndexServer(
-        workflow_factory=_agent_workflow,
-        verbose=True,
-        use_default_routers=True,
-        env="dev",
-        include_ui=True,
-    )
-
-    # Verify that static directory was created with index.html
-    assert os.path.exists("./.ui"), "Static directory was not created"
-    assert os.path.isdir("./.ui"), "Static path is not a directory"
-    assert os.path.exists("./.ui/index.html"), "index.html was not downloaded"
-
-    # Check if the UI is mounted and accessible
-    async with AsyncClient(
-        transport=ASGITransport(app=ui_server), base_url="http://test"
-    ) as ac:
-        response = await ac.get("/")
-        assert response.status_code == 200
-        assert "text/html" in response.headers["content-type"]
-
-    # Clean up after test
-    shutil.rmtree("./.ui")
-
-
-@pytest.mark.asyncio()
-async def test_ui_is_accessible(server: LlamaIndexServer) -> None:
-    """
-    Test if the UI is accessible.
-    """
-    # Manually trigger UI mounting
-    server.mount_ui()
-
-    async with AsyncClient(
-        transport=ASGITransport(app=server), base_url="http://test"
-    ) as ac:
-        response = await ac.get("/")
-        assert response.status_code == 200
-        assert "text/html" in response.headers["content-type"]
-
-
-@pytest.mark.asyncio()
-async def test_component_dir_creation(server: LlamaIndexServer) -> None:
-    """
-    Test if the component directory is created when specified and doesn't exist.
-    """
-    import os
-    import shutil
-
-    test_component_dir = "./test_components"
-
-    # Clean up any existing directory
-    if os.path.exists(test_component_dir):
-        shutil.rmtree(test_component_dir)
-
-    # Create server with component directory
-    _ = LlamaIndexServer(
-        workflow_factory=_agent_workflow,
-        verbose=True,
-        component_dir=test_component_dir,
-        include_ui=True,
-    )
-
-    # Verify directory was created
-    assert os.path.exists(test_component_dir), "Component directory was not created"
-    assert os.path.isdir(test_component_dir), "Component path is not a directory"
-
-    # Clean up after test
-    shutil.rmtree(test_component_dir)
-
-
-@pytest.mark.asyncio()
-async def test_component_router_addition(server: LlamaIndexServer, tmp_path) -> None:
-    """
-    Test if the component router is added when component directory is specified.
-    """
-    test_component_dir = tmp_path / "test_components"
-
-    # Create server with component directory
-    component_server = LlamaIndexServer(
-        workflow_factory=_agent_workflow,
-        verbose=True,
-        component_dir=str(test_component_dir),
-        include_ui=True,
-    )
-
-    # Verify component route exists
-    component_route_exists = any(
-        route.path == "/api/components" for route in component_server.routes
-    )
-    assert component_route_exists, "Component API route not found in server routes"
-
-
-@pytest.mark.asyncio()
-async def test_ui_config_includes_components_api(
-    server: LlamaIndexServer, tmp_path
-) -> None:
-    """
-    Test if the UI config includes components API when component directory is set.
-    """
-    test_component_dir = tmp_path / "test_components"
-
-    # Create server with component directory
-    component_server = LlamaIndexServer(
-        workflow_factory=_agent_workflow,
-        verbose=True,
-        component_dir=str(test_component_dir),
-        include_ui=True,
-    )
-
-    # Check if components API is in UI config
-    ui_config = component_server._ui_config
-    assert "COMPONENTS_API" in ui_config, "Components API not found in UI config"
-    assert ui_config["COMPONENTS_API"].endswith("/components"), (
-        "Incorrect components API path"
-    )
-
-
-@pytest.mark.asyncio()
-async def test_component_router_requires_component_dir(
-    server: LlamaIndexServer,
-) -> None:
-    """
-    Test that adding components router without component_dir raises an error.
-    """
-    server_without_component_dir = LlamaIndexServer(
-        workflow_factory=_agent_workflow,
-        verbose=True,
-        include_ui=True,
-    )
-
-    with pytest.raises(
-        ValueError, match="component_dir must be specified to add components router"
-    ):
-        server_without_component_dir.add_components_router()
@@ -1,83 +1,55 @@
 {
-  "name": "create-llama",
-  "version": "0.5.2",
-  "description": "Create LlamaIndex-powered apps with one command",
+  "name": "create-llama-monorepo",
+  "version": "1.0.0",
+  "private": true,
+  "description": "Monorepo for create-llama",
  "keywords": [
    "rag",
-    "llamaindex",
-    "next.js"
+    "llamaindex"
  ],
  "repository": {
    "type": "git",
-    "url": "https://github.com/run-llama/create-llama",
-    "directory": "packages/create-llama"
+    "url": "https://github.com/run-llama/create-llama"
  },
  "license": "MIT",
-  "bin": {
-    "create-llama": "./dist/index.js"
-  },
-  "files": [
-    "dist"
+  "workspaces": [
+    "packages/*",
+    "python/*"
  ],
  "scripts": {
-    "build": "bash ./scripts/build.sh",
-    "build:ncc": "pnpm run clean && ncc build ./index.ts -o ./dist/ --minify --no-cache --no-source-map-register",
-    "clean": "rimraf --glob ./dist ./templates/**/__pycache__ ./templates/**/node_modules ./templates/**/poetry.lock",
-    "dev": "ncc build ./index.ts -w -o dist/",
-    "e2e": "playwright test",
-    "e2e:python": "playwright test e2e/shared e2e/python",
-    "e2e:typescript": "playwright test e2e/shared e2e/typescript",
+    "dev": "pnpm -r dev",
+    "build": "pnpm -r build",
+    "e2e": "pnpm -r e2e",
+    "lint": "eslint .",
    "format": "prettier --ignore-unknown --cache --check .",
    "format:write": "prettier --ignore-unknown --write .",
-    "lint": "eslint . --ignore-pattern dist --ignore-pattern e2e/cache",
-    "new-snapshot": "pnpm run build && changeset version --snapshot",
-    "new-version": "pnpm run build && changeset version",
-    "pack-install": "bash ./scripts/pack.sh",
    "prepare": "husky",
-    "release": "pnpm run build && changeset publish",
-    "release-snapshot": "pnpm run build && changeset publish --tag snapshot"
-  },
-  "dependencies": {
-    "@types/async-retry": "1.4.2",
-    "@types/ci-info": "2.0.0",
-    "@types/cross-spawn": "6.0.0",
-    "@types/fs-extra": "11.0.4",
-    "@types/node": "^20.11.7",
-    "@types/prompts": "2.4.2",
-    "@types/tar": "6.1.5",
-    "@types/validate-npm-package-name": "3.0.0",
-    "async-retry": "1.3.1",
-    "async-sema": "3.0.1",
-    "ci-info": "github:watson/ci-info#f43f6a1cefff47fb361c88cf4b943fdbcaafe540",
-    "commander": "12.1.0",
-    "cross-spawn": "7.0.3",
-    "fast-glob": "3.3.1",
-    "fs-extra": "11.2.0",
-    "global-agent": "^3.0.0",
-    "got": "10.7.0",
-    "ollama": "^0.5.0",
-    "ora": "^8.0.1",
-    "picocolors": "1.0.0",
-    "prompts": "2.4.2",
-    "smol-toml": "^1.1.4",
-    "tar": "6.1.15",
-    "terminal-link": "^3.0.0",
-    "update-check": "1.5.4",
-    "validate-npm-package-name": "3.0.0",
-    "yaml": "2.4.1"
+    "new-snapshot": "pnpm -r build && changeset version --snapshot",
+    "new-version-python": "pnpm --filter @create-llama/llama-index-server new-version",
+    "new-version": "pnpm -r build && changeset version && pnpm new-version-python",
+    "release-python": "pnpm --filter @create-llama/llama-index-server release",
+    "release": "pnpm -r build && changeset publish && pnpm release-python",
+    "release-snapshot": "pnpm -r build && changeset publish --tag snapshot"
  },
  "devDependencies": {
    "@changesets/cli": "^2.27.1",
-    "@playwright/test": "^1.41.1",
-    "@vercel/ncc": "0.38.1",
-    "eslint": "^8.56.0",
-    "eslint-config-prettier": "^8.10.0",
+    "bunchee": "6.4.0",
    "husky": "^9.0.10",
-    "prettier": "^3.2.5",
-    "prettier-plugin-organize-imports": "^3.2.4",
-    "rimraf": "^5.0.5",
-    "typescript": "^5.3.3",
-    "wait-port": "^1.1.0"
+    "lint-staged": "^15.2.11",
+    "typescript-eslint": "^8.18.0",
+    "globals": "^15.12.0",
+    "eslint": "9.22.0",
+    "@eslint/js": "^9.25.0",
+    "eslint-config-next": "^15.1.0",
+    "eslint-config-prettier": "^9.1.0",
+    "eslint-plugin-react": "7.37.2",
+    "prettier": "^3.4.2",
+    "prettier-plugin-organize-imports": "^4.1.0",
+    "prettier-plugin-tailwindcss": "^0.6.11",
+    "typescript": "^5.7.3",
+    "@types/node": "^22.9.0",
+    "@types/react": "^19",
+    "@types/react-dom": "^19"
  },
  "packageManager": "pnpm@9.0.5",
  "engines": {
@@ -0,0 +1,65 @@
+# See https://help.github.com/articles/ignoring-files/ for more about ignoring files.
+
+# dependencies
+node_modules
+.pnp
+.pnpm-store
+.pnp.js
+
+# testing
+coverage
+.coverage
+
+# next.js
+.next/
+out/
+build
+
+# misc
+.DS_Store
+*.pem
+
+# debug
+npm-debug.log*
+yarn-debug.log*
+yarn-error.log*
+
+# local env files
+.env
+.env.local
+.env.development.local
+.env.test.local
+.env.production.local
+
+# build
+dist/
+lib/
+
+# e2e
+.cache
+test-results/
+playwright-report/
+blob-report/
+playwright/.cache/
+.tsbuildinfo
+e2e/cache
+
+# intellij
+**/.idea
+
+# Python
+.mypy_cache/
+venv/
+.venv/
+dist/
+.__pycache__
+__pycache__
+.python-version
+.ui
+
+# build artifacts
+create-llama-*.tgz
+
+# copied from root
+README.md
+LICENSE.md
@@ -1,5 +1,136 @@
 # create-llama

+## 0.5.22
+
+### Patch Changes
+
+- e2486eb: feat: support human in the loop for TS
+
+## 0.5.21
+
+### Patch Changes
+
+- af9ad3c: feat: show document artifact after generating report
+- a543a27: feat: bump chat-ui with inline artifact
+
+## 0.5.20
+
+### Patch Changes
+
+- 3ff0a18: fix: default header padding
+
+## 0.5.19
+
+### Patch Changes
+
+- 5fe9e17: support eject to fully customize next folder
+- b8a1ff6: Support citation for agentic template (Python)
+
+## 0.5.18
+
+### Patch Changes
+
+- 8d59ef0: Add layout_dir config to the generated python code
+
+## 0.5.17
+
+### Patch Changes
+
+- eee3230: feat: support custom layout
+
+## 0.5.16
+
+### Patch Changes
+
+- 6f75d4a: fix: unsupported language in code gen workflow
+- d0618fa: Fix LlamaCloud generate script issue
+
+## 0.5.15
+
+### Patch Changes
+
+- 527075c: Enable dev mode that allows updating code directly in the UI
+
+## 0.5.14
+
+### Patch Changes
+
+- 1df8cfb: Split artifacts use case to document generator and code generator
+- 1b5a519: chore: improve dev experience with nodemon
+- b3eb0ba: Fix typing check issue
+- 556f33c: fix chromadb dependency issue
+- 2451539: fix: remove dead generated ai code
+- 7a70390: Deprecate pro mode
+
+## 0.5.13
+
+### Patch Changes
+
+- f4ca602: Add artifact use case for Typescript template
+- f4ca602: Update typescript use cases to use the new workflow engine
+
+## 0.5.12
+
+### Patch Changes
+
+- 241d82a: Add artifacts use case (python)
+
+## 0.5.11
+
+### Patch Changes
+
+- 3960618: chore: create-llama monorepo
+- 8fe5fc2: chore: add llamaindex server package
+
+## 0.5.10
+
+### Patch Changes
+
+- 0a2e12a: Use uv as the default package manager
+
+## 0.5.9
+
+### Patch Changes
+
+- 4bc53ac: Bump new chat ui and update deep research component
+- 4bc53ac: Support generate UI for deep research use case (Typescript)
+
+## 0.5.8
+
+### Patch Changes
+
+- 765181a: chore: test typescript e2e with node 20 and 22
+
+## 0.5.7
+
+### Patch Changes
+
+- 5988657: chore: bump llamaindex
+
+## 0.5.6
+
+### Patch Changes
+
+- d363ced: Bump llamaindex server packages
+
+## 0.5.5
+
+### Patch Changes
+
+- ee85320: The default custom deep research component does not work.
+
+## 0.5.4
+
+### Patch Changes
+
+- 7c3b279: Support code generation of event components using an LLM (Python)
+
+## 0.5.3
+
+### Patch Changes
+
+- 76ec360: Update templates to use new chat ui config
+
 ## 0.5.2

 ### Patch Changes
@@ -0,0 +1,108 @@
+# create-llama Package
+
+## Overview
+
+The `create-llama` package is a CLI tool for creating LlamaIndex-powered applications with one command. It's designed as a project generator that scaffolds various types of RAG (Retrieval-Augmented Generation) applications using different frameworks, databases, and AI model providers.
+
+## Package Structure
+
+### Core Files
+
+- **`index.ts`**: Main CLI entry point using Commander.js for argument parsing
+- **`create-app.ts`**: Core application creation logic and orchestration
+- **`package.json`**: Package configuration with binary entry point at `./dist/index.js`
+
+### Key Directories
+
+- **`helpers/`**: Utility functions for package management, file operations, and configuration
+- **`questions/`**: Interactive prompts for user configuration
+- **`templates/`**: Project templates for different frameworks and use cases
+- **`e2e/`**: End-to-end tests using Playwright
+
+## Core Functionality
+
+### CLI Interface
+
+The tool accepts numerous command-line options including:
+
+- Framework selection (`--framework`: nextjs, express, fastapi)
+- Template type (`--template`: streaming, multiagent, reflex, llamaindexserver)
+- Model providers (OpenAI, Anthropic, Groq, Ollama, etc.)
+- Vector databases (none, mongo, pg, pinecone, milvus, etc.)
+- Data sources (files, web URLs, databases)
+- Tools and observability options
+
+### Application Generation Flow
+
+1. **Project validation**: Checks project name validity and directory permissions
+2. **Interactive questioning**: Prompts user for configuration if not provided via CLI
+3. **Template installation**: Copies and configures appropriate templates
+4. **Environment setup**: Creates `.env` files with API keys and configuration
+5. **Dependencies**: Installs packages using detected/specified package manager
+6. **Post-install actions**: Can run the app, open VSCode, or install dependencies
+
+### Template System
+
+Templates are organized by:
+
+- **Framework**: NextJS (frontend), Express (Node backend), FastAPI (Python backend)
+- **Type**: Streaming chat, multiagent workflows, Reflex UI, LlamaIndex server
+- **Components**: Engines, loaders, providers, UI components, observability
+
+### Helper Functions
+
+Key helper modules include:
+
+- **Installation**: Package manager detection and dependency installation
+- **Data sources**: File copying, web scraping, database connection setup
+- **Providers**: Model provider configuration (OpenAI, Anthropic, etc.)
+- **Tools**: Integration with external tools (Wikipedia, weather, code generation)
+- **Environment**: `.env` file generation with API keys and settings
+
+## Development Commands
+
+### Build & Development
+
+- `npm run build`: Build the CLI using bash script
+- `npm run dev`: Watch mode development build
+- `npm run clean`: Clean build artifacts and temporary files
+
+### Testing
+
+- `npm run e2e`: Run all end-to-end tests
+- `npm run e2e:python`: Test Python-specific templates
+- `npm run e2e:typescript`: Test TypeScript-specific templates
+
+### Package Management
+
+- `npm run pack-install`: Create and install local package for testing
+
+## Architecture Notes
+
+### Model Configuration
+
+The tool supports multiple AI providers with a unified `ModelConfig` interface that includes:
+
+- Provider selection and API key management
+- Model and embedding model specification
+- Dimension configuration for embeddings
+
+### Data Source Handling
+
+Flexible data source configuration supporting:
+
+- Local files and directories
+- Web URLs with configurable crawling depth
+- Database connections with custom queries
+- Automatic file downloading and copying
+
+### Template Flexibility
+
+Templates use a component-based system allowing mix-and-match of:
+
+- Different frameworks (NextJS, Express, FastAPI)
+- Various vector databases
+- Multiple observability tools
+- Configurable tools and integrations
+
+This package serves as the foundation for rapidly prototyping and deploying LlamaIndex applications across different technology stacks and use cases.
@@ -1,4 +1,3 @@
-/* eslint-disable import/no-extraneous-dependencies */
 import path from "path";
 import { green, yellow } from "picocolors";
 import { tryGitInit } from "./helpers/git";
@@ -0,0 +1,286 @@
+import { expect, test } from "@playwright/test";
+import { exec } from "child_process";
+import fs from "fs";
+import path from "path";
+import util from "util";
+import { TemplateFramework, TemplateType, TemplateUseCase, TemplateVectorDB } from "../../helpers/types";
+import { RunCreateLlamaOptions, createTestDir, runCreateLlama } from "../utils";
+
+const execAsync = util.promisify(exec);
+
+// Test matrix inputs. Framework, template type and data source are read from
+// the environment and fall back to a default when the variable is unset or empty.
+const templateFramework: TemplateFramework =
+  (process.env.FRAMEWORK as TemplateFramework) || "fastapi";
+const templateType: TemplateType =
+  (process.env.TEMPLATE_TYPE as TemplateType) || "llamaindexserver";
+// Use cases generated for the llamaindexserver template.
+const useCases: TemplateUseCase[] = [
+  "agentic_rag",
+  "deep_research",
+  "financial_report",
+  "code_generator",
+  "document_generator",
+  "hitl",
+];
+const dataSource: string = process.env.DATASOURCE || "--example-file";
+
+test.describe("Mypy check", () => {
+  test.describe.configure({ retries: 0 });
+
+    // Test for streaming template: generates a "streaming" project for each
+    // vector DB, tool, data source and observability option and runs the
+    // uv/mypy check from createAndCheckLlamaProject on every one of them.
+    test.describe("StreamingTemplate", () => {
+      test.skip(
+        templateType !== "streaming",
+        `skipping streaming test for ${templateType}`,
+      );
+      // XXX: this suite provides its own data sources - only register it for one
+      // data source (usually the CI matrix will trigger multiple data sources)
+      if (dataSource !== "--example-file") {
+        return;
+      }
+
+      // vectorDBs, tools, and data source combinations to test
+      const vectorDbs: TemplateVectorDB[] = [
+        "mongo",
+        "pg",
+        "pinecone",
+        "milvus",
+        "astra",
+        "qdrant",
+        "chroma",
+        "weaviate",
+      ];
+      const toolOptions = [
+        "wikipedia.WikipediaToolSpec",
+        "google.GoogleSearchToolSpec",
+        "document_generator",
+        "artifact",
+      ];
+      const dataSources = [
+        "--example-file",
+        "--web-source https://www.example.com",
+        "--db-source mysql+pymysql://user:pass@localhost:3306/mydb",
+      ];
+      const observabilityOptions = ["llamatrace", "traceloop"];
+
+      // Options shared by every project generated in this suite; each test
+      // overrides only the single dimension it exercises.
+      const streamingOptions = (
+        cwd: string,
+        overrides: Partial<RunCreateLlamaOptions> = {},
+      ): RunCreateLlamaOptions => ({
+        cwd,
+        templateType: "streaming",
+        templateFramework,
+        dataSource: "--example-file",
+        vectorDb: "none",
+        tools: "none",
+        port: 3000,
+        postInstallAction: "none",
+        templateUI: undefined,
+        appType: "--no-frontend",
+        llamaCloudProjectName: undefined,
+        llamaCloudIndexName: undefined,
+        observability: undefined,
+        ...overrides,
+      });
+
+      // Test vector databases
+      for (const vectorDb of vectorDbs) {
+        test(`vectorDB: ${vectorDb} ${templateType}`, async () => {
+          const cwd = await createTestDir();
+          const { pyprojectPath } = await createAndCheckLlamaProject({
+            options: streamingOptions(cwd, { vectorDb }),
+          });
+
+          const pyprojectContent = fs.readFileSync(pyprojectPath, "utf-8");
+          // The postgres package is the only one not named after its option
+          const packageSuffix = vectorDb === "pg" ? "postgres" : vectorDb;
+          expect(pyprojectContent).toContain(
+            `llama-index-vector-stores-${packageSuffix}`,
+          );
+        });
+      }
+
+      // Test tools
+      for (const tool of toolOptions) {
+        test(`tool: ${tool} ${templateType}`, async () => {
+          const cwd = await createTestDir();
+          const { pyprojectPath } = await createAndCheckLlamaProject({
+            options: streamingOptions(cwd, { tools: tool }),
+          });
+
+          const pyprojectContent = fs.readFileSync(pyprojectPath, "utf-8");
+          if (tool === "wikipedia.WikipediaToolSpec") {
+            expect(pyprojectContent).toContain("wikipedia");
+          }
+          if (tool === "google.GoogleSearchToolSpec") {
+            expect(pyprojectContent).toContain("google");
+          }
+        });
+      }
+
+      // Test data sources (named `source` to avoid shadowing the module-level
+      // `dataSource` read from the environment)
+      for (const source of dataSources) {
+        test(`data source: ${source} ${templateType}`, async () => {
+          const cwd = await createTestDir();
+          const { pyprojectPath } = await createAndCheckLlamaProject({
+            options: streamingOptions(cwd, { dataSource: source }),
+          });
+
+          const pyprojectContent = fs.readFileSync(pyprojectPath, "utf-8");
+          if (source.includes("--web-source")) {
+            expect(pyprojectContent).toContain("llama-index-readers-web");
+          }
+          if (source.includes("--db-source")) {
+            expect(pyprojectContent).toContain("llama-index-readers-database");
+          }
+        });
+      }
+
+      // Test observability options. These must be registered with `test`, not
+      // `test.describe`: a describe callback runs while tests are collected, so
+      // the project would be generated outside of any test.
+      for (const observability of observabilityOptions) {
+        test(`observability: ${observability} ${templateType}`, async () => {
+          const cwd = await createTestDir();
+          await createAndCheckLlamaProject({
+            options: streamingOptions(cwd, { observability }),
+          });
+        });
+      }
+    });
+
+    // Generates a "llamaindexserver" project for every use case and runs the
+    // uv/mypy check from createAndCheckLlamaProject on it.
+    test.describe("LlamaIndexServer", () => {
+      test.skip(
+        templateType !== "llamaindexserver",
+        `skipping llamaindexserver test for ${templateType}`,
+      );
+      test.skip(
+        dataSource !== "--example-file",
+        `skipping llamaindexserver test for ${dataSource}`,
+      );
+      for (const useCase of useCases) {
+        // Project generation has to live inside a test body: code placed
+        // directly in a describe callback runs while the tests are collected,
+        // regardless of the skips above, and is not reported as a test.
+        test(`use case: ${useCase} ${templateType}`, async () => {
+          const cwd = await createTestDir();
+          await createAndCheckLlamaProject({
+            options: {
+              cwd,
+              templateType: "llamaindexserver",
+              templateFramework,
+              dataSource,
+              vectorDb: "none",
+              tools: "none",
+              port: 3000,
+              postInstallAction: "none",
+              templateUI: undefined,
+              appType: "--no-frontend",
+              llamaCloudProjectName: undefined,
+              llamaCloudIndexName: undefined,
+              observability: undefined,
+              useCase,
+            },
+          });
+        });
+      }
+    });
+
+    /**
+     * Generates a project with create-llama and type-checks it.
+     *
+     * After generation the project folder and its pyproject.toml must exist.
+     * Then `uv venv`, `uv sync --all-extras` and `uv run mypy .` are executed
+     * in the project folder, in that order.
+     *
+     * @param options - Options forwarded unchanged to `runCreateLlama`.
+     * @returns Paths of the generated project and of its pyproject.toml.
+     * @throws Re-throws the error of the first command that fails, so the
+     *   calling test fails.
+     */
+    async function createAndCheckLlamaProject({
+      options,
+    }: {
+      options: RunCreateLlamaOptions;
+    }): Promise<{ pyprojectPath: string; projectPath: string }> {
+      const result = await runCreateLlama(options);
+      const projectPath = path.join(options.cwd, result.projectName);
+
+      // Check if the app folder exists
+      expect(fs.existsSync(projectPath)).toBeTruthy();
+
+      // Check if pyproject.toml exists
+      const pyprojectPath = path.join(projectPath, "pyproject.toml");
+      expect(fs.existsSync(pyprojectPath)).toBeTruthy();
+
+      // Commands run one after another inside the generated project. The
+      // promisified exec rejects when a command exits with a non-zero code,
+      // which is how a mypy failure fails the test.
+      const steps = [
+        {
+          label: "uv venv",
+          command: "uv venv",
+          startMessage: "Running uv venv...",
+          errorMessage: "Error running uv venv:",
+        },
+        {
+          label: "uv sync",
+          command: "uv sync --all-extras",
+          startMessage: "Running uv sync...",
+          errorMessage: "Error running uv sync:",
+        },
+        {
+          label: "uv run mypy",
+          command: "uv run mypy .",
+          startMessage: "Running uv run mypy ....",
+          errorMessage: "Error running mypy:",
+        },
+      ];
+
+      for (const step of steps) {
+        console.log(step.startMessage);
+        try {
+          const { stdout, stderr } = await execAsync(step.command, {
+            cwd: projectPath,
+            env: { ...process.env },
+          });
+          console.log(`${step.label} stdout:`, stdout);
+          console.error(`${step.label} stderr:`, stderr);
+        } catch (error) {
+          console.error(step.errorMessage, error);
+          throw error; // Re-throw error to fail the test
+        }
+      }
+
+      return { pyprojectPath, projectPath };
+    }
+});
@@ -1,6 +1,5 @@
-/* eslint-disable turbo/no-undeclared-env-vars */
 import { expect, test } from "@playwright/test";
-import { ChildProcess } from "child_process";
+import { ChildProcess, execSync } from "child_process";
 import fs from "fs";
 import path from "path";
 import type {
@@ -13,21 +12,32 @@ import { createTestDir, runCreateLlama, type AppType } from "../utils";
 const templateFramework: TemplateFramework = process.env.FRAMEWORK
  ? (process.env.FRAMEWORK as TemplateFramework)
  : "fastapi";
-const dataSource: string = "--example-file";
+const dataSource: string = process.env.DATASOURCE
+  ? (process.env.DATASOURCE as string)
+  : "--example-file";
+const llamaCloudProjectName = "create-llama";
+const llamaCloudIndexName = "e2e-test";
+
 const templateUI: TemplateUI = "shadcn";
 const templatePostInstallAction: TemplatePostInstallAction = "runApp";
 const appType: AppType = "--frontend";
 const userMessage = "Write a blog post about physical standards for letters";
-const templateUseCases = ["financial_report", "agentic_rag", "deep_research"];
+const templateUseCases = [
+  "agentic_rag",
+  "financial_report",
+  "deep_research",
+  "code_generator",
+  // "hitl",
+];
+const ejectDir = "next";

 for (const useCase of templateUseCases) {
  test.describe(`Test use case ${useCase} ${templateFramework} ${dataSource} ${templateUI} ${appType} ${templatePostInstallAction}`, async () => {
    test.skip(
-      process.platform !== "linux" ||
-        process.env.DATASOURCE === "--no-files" ||
-        templateFramework === "express",
+      dataSource === "--no-files" || templateFramework === "express",
      "The llamaindexserver template currently only works with nextjs, fastapi. We also only run on Linux to speed up tests.",
    );
+    const useLlamaParse = dataSource === "--llamacloud";
    let port: number;
    let cwd: string;
    let name: string;
@@ -49,6 +59,9 @@ for (const useCase of templateUseCases) {
        templateUI,
        appType,
        useCase,
+        llamaCloudProjectName,
+        llamaCloudIndexName,
+        useLlamaParse,
      });
      name = result.projectName;
      appProcess = result.appProcess;
@@ -65,7 +78,9 @@ for (const useCase of templateUseCases) {
          templateFramework === "express",
      );
      await page.goto(`http://localhost:${port}`);
-      await expect(page.getByText("Built by LlamaIndex")).toBeVisible();
+      await expect(page.getByText("Built by LlamaIndex")).toBeVisible({
+        timeout: 5 * 60 * 1000,
+      });
    });

    test("Frontend should be able to submit a message and receive the start of a streamed response", async ({
@@ -97,6 +112,28 @@ for (const useCase of templateUseCases) {
      expect(response.ok()).toBeTruthy();
    });

+    test("Should successfully eject, install dependencies and build without errors", async () => {
+      test.skip(
+        templateFramework !== "nextjs" ||
+          useCase !== "code_generator" ||
+          dataSource === "--llamacloud",
+        "Eject test only applies to Next.js framework, code generator use case, and non-llamacloud",
+      );
+
+      // Run eject command
+      execSync("npm run eject", { cwd: path.join(cwd, name) });
+
+      // Verify next directory exists
+      const nextDirExists = fs.existsSync(path.join(cwd, name, ejectDir));
+      expect(nextDirExists).toBeTruthy();
+
+      // Install dependencies in next directory
+      execSync("npm install", { cwd: path.join(cwd, name, ejectDir) });
+
+      // Run build
+      execSync("npm run build", { cwd: path.join(cwd, name, ejectDir) });
+    });
+
    // clean processes
    test.afterAll(async () => {
      appProcess?.kill();
@@ -1,4 +1,3 @@
-/* eslint-disable turbo/no-undeclared-env-vars */
 import { expect, test } from "@playwright/test";
 import { ChildProcess } from "child_process";
 import fs from "fs";
@@ -1,4 +1,3 @@
-/* eslint-disable turbo/no-undeclared-env-vars */
 import { expect, test } from "@playwright/test";
 import { ChildProcess } from "child_process";
 import fs from "fs";
@@ -0,0 +1,163 @@
+import { expect, test } from "@playwright/test";
+import { exec } from "child_process";
+import fs from "fs";
+import path from "path";
+import util from "util";
+import { NO_DATA_USE_CASES } from "../../helpers/constant";
+import {
+  TemplateFramework,
+  TemplateType,
+  TemplateUseCase,
+  TemplateVectorDB,
+} from "../../helpers/types";
+import { createTestDir, runCreateLlama } from "../utils";
+
+const execAsync = util.promisify(exec);
+
+const templateFramework: TemplateFramework = process.env.FRAMEWORK
+  ? (process.env.FRAMEWORK as TemplateFramework)
+  : "nextjs";
+const templateType: TemplateType = process.env.TEMPLATE_TYPE
+  ? (process.env.TEMPLATE_TYPE as TemplateType)
+  : "llamaindexserver";
+const useCases: TemplateUseCase[] = [
+  "agentic_rag",
+  "deep_research",
+  "financial_report",
+  "code_generator",
+  "document_generator",
+  "hitl",
+];
+const dataSource: string = process.env.DATASOURCE
+  ? process.env.DATASOURCE
+  : "--example-file";
+
+// vectorDBs combinations to test
+const vectorDbs: TemplateVectorDB[] = [
+  "mongo",
+  "pg",
+  "qdrant",
+  "pinecone",
+  "milvus",
+  "astra",
+  "chroma",
+  "llamacloud",
+  "weaviate",
+];
+
+// Suite that scaffolds TypeScript projects for several option combinations and
+// checks (via runTest) that dependencies install and the project type-checks.
+test.describe("Test resolve TS dependencies", () => {
+  // Disable Playwright retries for every test in this suite.
+  test.describe.configure({ retries: 0 });
+
+  // One test per vector DB, always with LlamaParse disabled.
+  for (const vectorDb of vectorDbs) {
+    const optionDescription = `templateType: ${templateType}, vectorDb: ${vectorDb}, dataSource: ${dataSource}`;
+
+    test(`Vector DB test - ${optionDescription}`, async () => {
+      // The vector DB tests are skipped when the template type is llamaindexserver.
+      test.skip(
+        templateType === "llamaindexserver",
+        "skipping vectorDB test for llamaindexserver",
+      );
+
+      await runTest({
+        templateType: templateType,
+        useLlamaParse: false, // Disable LlamaParse for vectorDB test
+        vectorDb: vectorDb,
+      });
+    });
+  }
+
+  // Use-case tests (no vector DB): each use case runs without LlamaParse and,
+  // where applicable, with LlamaParse.
+  // They are only registered when the data source is the example file.
+  if (dataSource === "--example-file") {
+    for (const useCase of useCases) {
+      const optionDescription = `templateType: ${templateType}, useCase: ${useCase}`;
+      test.describe(`useCase test - ${optionDescription}`, () => {
+        // Use-case tests are skipped for the streaming template.
+        test.skip(
+          templateType === "streaming",
+          "Skipping use case test for streaming template.",
+        );
+        test(`no llamaParse - ${optionDescription}`, async () => {
+          await runTest({
+            templateType: templateType,
+            useLlamaParse: false,
+            useCase: useCase,
+          });
+        });
+        // Only register the LlamaParse variant for use cases that are not
+        // listed in NO_DATA_USE_CASES.
+        if (!useCase || !NO_DATA_USE_CASES.includes(useCase)) {
+          test(`llamaParse - ${optionDescription}`, async () => {
+            await runTest({
+              templateType: templateType,
+              useLlamaParse: true,
+              useCase: useCase,
+            });
+          });
+        }
+      });
+    }
+  }
+});
+
+/**
+ * Scaffolds a project with create-llama, installs its dependencies with pnpm
+ * and type-checks it with `tsc -b`.
+ *
+ * The project is generated inside the directory returned by `createTestDir()`.
+ * Framework and data source come from the module-level `templateFramework`
+ * and `dataSource` values; the remaining generator options are fixed here or
+ * taken from `options`.
+ *
+ * @param options.templateType  Template type passed to create-llama.
+ * @param options.useLlamaParse Whether to generate the project with LlamaParse.
+ * @param options.useCase       Optional use case to generate.
+ * @param options.vectorDb      Optional vector DB; defaults to "none".
+ * @throws Rethrows any error from the install or type-check command after
+ *         logging it, so the calling test fails.
+ */
+async function runTest(options: {
+  templateType: TemplateType;
+  useLlamaParse: boolean;
+  useCase?: TemplateUseCase;
+  vectorDb?: TemplateVectorDB;
+}) {
+  const cwd = await createTestDir();
+
+  const result = await runCreateLlama({
+    cwd: cwd,
+    templateType: options.templateType,
+    templateFramework: templateFramework,
+    dataSource: dataSource,
+    vectorDb: options.vectorDb ?? "none",
+    port: 3000,
+    postInstallAction: "none",
+    templateUI: undefined,
+    appType: templateFramework === "nextjs" ? "" : "--no-frontend",
+    llamaCloudProjectName: undefined,
+    llamaCloudIndexName: undefined,
+    tools: undefined,
+    useLlamaParse: options.useLlamaParse,
+    useCase: options.useCase,
+  });
+  const name = result.projectName;
+
+  // Check if the app folder exists
+  const appDir = path.join(cwd, name);
+  const dirExists = fs.existsSync(appDir);
+  expect(dirExists).toBeTruthy();
+
+  // Install dependencies using pnpm. The command output is not inspected:
+  // only a rejected promise (e.g. non-zero exit code) is treated as a failure.
+  try {
+    await execAsync("pnpm install --prefer-offline --ignore-workspace", {
+      cwd: appDir,
+    });
+  } catch (error) {
+    console.error("Error installing dependencies:", error);
+    throw error;
+  }
+
+  // Run tsc type check and capture the output
+  try {
+    const { stdout, stderr } = await execAsync(
+      "pnpm exec tsc -b --diagnostics",
+      {
+        cwd: appDir,
+      },
+    );
+    // Any output on stderr is treated as a type-check failure
+    expect(stderr).toBeFalsy();
+
+    // Log the stdout for debugging purposes
+    console.log("TypeScript type-check output:", stdout);
+  } catch (error) {
+    console.error("Error running tsc:", error);
+    throw error;
+  }
+}
@@ -67,8 +67,8 @@ export async function runCreateLlama({
  ].join("-");

  // Handle different data source types
-  let dataSourceArgs = [];
-  if (dataSource.includes("--web-source" || "--db-source")) {
+  const dataSourceArgs = [];
+  if (dataSource.includes("--web-source")) {
    const webSource = dataSource.split(" ")[1];
    dataSourceArgs.push("--web-source", webSource);
  } else if (dataSource.includes("--db-source")) {
@@ -1,6 +1,15 @@
+import { TemplateUseCase } from "./types";
+
 export const COMMUNITY_OWNER = "run-llama";
 export const COMMUNITY_REPO = "create_llama_projects";
 export const LLAMA_PACK_OWNER = "run-llama";
 export const LLAMA_PACK_REPO = "llama_index";
 export const LLAMA_PACK_FOLDER = "llama-index-packs";
 export const LLAMA_PACK_FOLDER_PATH = `${LLAMA_PACK_OWNER}/${LLAMA_PACK_REPO}/main/${LLAMA_PACK_FOLDER}`;
+
+// these use cases don't have data folder, so no need to run generate and no need to getIndex
+export const NO_DATA_USE_CASES: TemplateUseCase[] = [
+  "code_generator",
+  "document_generator",
+  "hitl",
+];
@@ -1,4 +1,3 @@
-/* eslint-disable import/no-extraneous-dependencies */
 import { async as glob } from "fast-glob";
 import fs from "fs";
 import path from "path";
@@ -181,7 +181,7 @@ const getVectorDBEnvs = (
            ]
          : []),
      ];
-    case "chroma":
+    case "chroma": {
      const envs = [
        {
          name: "CHROMA_COLLECTION",
@@ -206,6 +206,7 @@ Otherwise, use CHROMA_HOST and CHROMA_PORT config above`,
        });
      }
      return envs;
+    }
    case "weaviate":
      return [
        {
@@ -1,4 +1,3 @@
-/* eslint-disable import/no-extraneous-dependencies */
 import { execSync } from "child_process";
 import fs from "fs";
 import path from "path";
@@ -4,12 +4,12 @@ import path from "path";
 import picocolors, { cyan } from "picocolors";

 import fsExtra from "fs-extra";
+import { NO_DATA_USE_CASES } from "./constant";
 import { writeLoadersConfig } from "./datasources";
 import { createBackendEnvFile, createFrontendEnvFile } from "./env-variables";
 import { PackageManager } from "./get-pkg-manager";
 import { installLlamapackProject } from "./llama-pack";
 import { makeDir } from "./make-dir";
-import { isHavingPoetryLockFile, tryPoetryRun } from "./poetry";
 import { installPythonTemplate } from "./python";
 import { downloadAndExtractRepo } from "./repo";
 import { ConfigFileType, writeToolsConfig } from "./tools";
@@ -19,9 +19,11 @@ import {
  ModelConfig,
  TemplateDataSource,
  TemplateFramework,
+  TemplateUseCase,
  TemplateVectorDB,
 } from "./types";
 import { installTSTemplate } from "./typescript";
+import { isHavingUvLockFile, tryUvRun } from "./uv";

 const checkForGenerateScript = (
  modelConfig: ModelConfig,
@@ -60,11 +62,12 @@ async function generateContextData(
  vectorDb?: TemplateVectorDB,
  llamaCloudKey?: string,
  useLlamaParse?: boolean,
+  useCase?: TemplateUseCase,
 ) {
  if (packageManager) {
    const runGenerate = `${cyan(
      framework === "fastapi"
-        ? "poetry run generate"
+        ? "uv run generate"
        : `${packageManager} run generate`,
    )}`;

@@ -78,19 +81,31 @@ async function generateContextData(
    if (!missingSettings.length) {
      // If all the required environment variables are set, run the generate script
      if (framework === "fastapi") {
-        if (isHavingPoetryLockFile()) {
+        if (isHavingUvLockFile()) {
          console.log(`Running ${runGenerate} to generate the context data.`);
-          const result = tryPoetryRun("poetry run generate");
+          const result = tryUvRun("generate");
          if (!result) {
            console.log(`Failed to run ${runGenerate}.`);
            process.exit(1);
          }
          console.log(`Generated context data`);
          return;
+        } else {
+          console.log(
+            picocolors.yellow(
+              `\nWarning: uv.lock not found. Dependency installation might be incomplete. Skipping context generation.\nIf dependencies were installed, try running '${runGenerate}' manually.\n`,
+            ),
+          );
        }
      } else {
        console.log(`Running ${runGenerate} to generate the context data.`);
-        await callPackageManager(packageManager, true, ["run", "generate"]);
+
+        const shouldRunGenerate =
+          !useCase || !NO_DATA_USE_CASES.includes(useCase);
+
+        if (shouldRunGenerate) {
+          await callPackageManager(packageManager, true, ["run", "generate"]);
+        }
        return;
      }
    }
@@ -103,7 +118,7 @@ async function generateContextData(
 const downloadFile = async (url: string, destPath: string) => {
  const response = await fetch(url);
  const fileBuffer = await response.arrayBuffer();
-  await fsExtra.writeFile(destPath, Buffer.from(fileBuffer));
+  await fsExtra.writeFile(destPath, new Uint8Array(fileBuffer));
 };

 const prepareContextData = async (
@@ -218,6 +233,7 @@ export const installTemplate = async (
        props.vectorDb,
        props.llamaCloudKey,
        props.useLlamaParse,
+        props.useCase,
      );
    }

@@ -1,4 +1,3 @@
-/* eslint-disable import/no-extraneous-dependencies */
 import spawn from "cross-spawn";
 import { yellow } from "picocolors";
 import type { PackageManager } from "./get-pkg-manager";
@@ -1,4 +1,3 @@
-/* eslint-disable import/no-extraneous-dependencies */
 import fs from "fs";
 import path from "path";
 import { blue, green } from "picocolors";
@@ -143,6 +143,6 @@ export const installLlamapackProject = async ({
  await copyData({ root });
  await installLlamapackExample({ root, llamapack });
  if (postInstallAction === "runApp" || postInstallAction === "dependencies") {
-    installPythonDependencies({ noRoot: true });
+    installPythonDependencies();
  }
 };
@@ -1,4 +1,3 @@
-/* eslint-disable import/no-extraneous-dependencies */
 import { execSync } from "child_process";
 import fs from "fs";

@@ -28,7 +28,7 @@ export async function askModelConfig({
 }: ModelConfigQuestionsParams): Promise<ModelConfig> {
  let modelProvider: ModelProvider = DEFAULT_MODEL_PROVIDER;
  if (askModels) {
-    let choices = [
+    const choices = [
      { title: "OpenAI", value: "openai" },
      { title: "Groq", value: "groq" },
      { title: "Ollama", value: "ollama" },
@@ -3,10 +3,11 @@ import path from "path";
 import { cyan, red } from "picocolors";
 import { parse, stringify } from "smol-toml";
 import terminalLink from "terminal-link";
+import { isUvAvailable, tryUvSync } from "./uv";

+import { isCI } from "ci-info";
 import { assetRelocator, copy } from "./copy";
 import { templatesDir } from "./dir";
-import { isPoetryAvailable, tryPoetryInstall } from "./poetry";
 import { Tool } from "./tools";
 import {
  InstallTemplateArgs,
@@ -31,6 +32,7 @@ const getAdditionalDependencies = (
  tools?: Tool[],
  templateType?: TemplateType,
  observability?: TemplateObservability,
+  // eslint-disable-next-line max-params
 ) => {
  const dependencies: Dependency[] = [];

@@ -39,21 +41,21 @@ const getAdditionalDependencies = (
    case "mongo": {
      dependencies.push({
        name: "llama-index-vector-stores-mongodb",
-        version: "^0.6.0",
+        version: ">=0.3.2,<0.4.0",
      });
      break;
    }
    case "pg": {
      dependencies.push({
        name: "llama-index-vector-stores-postgres",
-        version: "^0.3.2",
+        version: ">=0.3.2,<0.4.0",
      });
      break;
    }
    case "pinecone": {
      dependencies.push({
        name: "llama-index-vector-stores-pinecone",
-        version: "^0.4.1",
+        version: ">=0.4.1,<0.5.0",
        constraints: {
          python: ">=3.11,<3.13",
        },
@@ -63,25 +65,25 @@ const getAdditionalDependencies = (
    case "milvus": {
      dependencies.push({
        name: "llama-index-vector-stores-milvus",
-        version: "^0.3.0",
+        version: ">=0.3.0,<0.4.0",
      });
      dependencies.push({
        name: "pymilvus",
-        version: "2.4.4",
+        version: ">=2.4.4,<3.0.0",
      });
      break;
    }
    case "astra": {
      dependencies.push({
        name: "llama-index-vector-stores-astra-db",
-        version: "^0.4.0",
+        version: ">=0.4.0,<0.5.0",
      });
      break;
    }
    case "qdrant": {
      dependencies.push({
        name: "llama-index-vector-stores-qdrant",
-        version: "^0.4.0",
+        version: ">=0.4.0,<0.5.0",
        constraints: {
          python: ">=3.11,<3.13",
        },
@@ -91,21 +93,25 @@ const getAdditionalDependencies = (
    case "chroma": {
      dependencies.push({
        name: "llama-index-vector-stores-chroma",
-        version: "^0.4.0",
+        version: ">=0.4.0,<0.5.0",
+      });
+      dependencies.push({
+        name: "onnxruntime",
+        version: "<1.22.0",
      });
      break;
    }
    case "weaviate": {
      dependencies.push({
        name: "llama-index-vector-stores-weaviate",
-        version: "^1.2.3",
+        version: ">=1.2.3,<2.0.0",
      });
      break;
    }
    case "llamacloud":
      dependencies.push({
        name: "llama-index-indices-managed-llama-cloud",
-        version: "0.6.3",
+        version: ">=0.6.3,<0.7.0",
      });
      break;
  }
@@ -118,28 +124,28 @@ const getAdditionalDependencies = (
        case "file":
          dependencies.push({
            name: "docx2txt",
-            version: "^0.8",
+            version: ">=0.8,<0.9",
          });
          break;
        case "web":
          dependencies.push({
            name: "llama-index-readers-web",
-            version: "^0.3.0",
+            version: ">=0.3.0,<0.4.0",
          });
          break;
        case "db":
          dependencies.push({
            name: "llama-index-readers-database",
-            version: "^0.3.0",
+            version: ">=0.3.0,<0.4.0",
          });
          dependencies.push({
            name: "pymysql",
-            version: "^1.1.0",
+            version: ">=1.1.0,<2.0.0",
            extras: ["rsa"],
          });
          dependencies.push({
            name: "psycopg2-binary",
-            version: "^2.9.9",
+            version: ">=2.9.9,<3.0.0",
          });
          break;
      }
@@ -158,114 +164,102 @@ const getAdditionalDependencies = (
    case "ollama":
      dependencies.push({
        name: "llama-index-llms-ollama",
-        version: "0.3.0",
+        version: ">=0.5.0,<0.6.0",
      });
      dependencies.push({
        name: "llama-index-embeddings-ollama",
-        version: "0.3.0",
+        version: ">=0.6.0,<0.7.0",
      });
      break;
    case "openai":
      if (templateType !== "multiagent") {
        dependencies.push({
          name: "llama-index-llms-openai",
-          version: "^0.3.2",
+          version: ">=0.3.2,<0.4.0",
        });
        dependencies.push({
          name: "llama-index-embeddings-openai",
-          version: "^0.3.1",
+          version: ">=0.3.1,<0.4.0",
        });
        dependencies.push({
          name: "llama-index-agent-openai",
-          version: "^0.4.0",
+          version: ">=0.4.0,<0.5.0",
        });
      }
      break;
    case "groq":
-      // Fastembed==0.2.0 does not support python3.13 at the moment
-      // Fixed the python version less than 3.13
-      dependencies.push({
-        name: "python",
-        version: "^3.11,<3.13",
-      });
      dependencies.push({
        name: "llama-index-llms-groq",
-        version: "0.2.0",
+        version: ">=0.3.0,<0.4.0",
      });
      dependencies.push({
        name: "llama-index-embeddings-fastembed",
-        version: "^0.2.0",
+        version: ">=0.3.0,<0.4.0",
      });
      break;
    case "anthropic":
-      // Fastembed==0.2.0 does not support python3.13 at the moment
-      // Fixed the python version less than 3.13
-      dependencies.push({
-        name: "python",
-        version: "^3.11,<3.13",
-      });
      dependencies.push({
        name: "llama-index-llms-anthropic",
-        version: "0.3.0",
+        version: ">=0.6.0,<0.7.0",
      });
      dependencies.push({
        name: "llama-index-embeddings-fastembed",
-        version: "^0.2.0",
+        version: ">=0.3.0,<0.4.0",
      });
      break;
    case "gemini":
      dependencies.push({
        name: "llama-index-llms-gemini",
-        version: "0.3.4",
+        version: ">=0.4.0,<0.5.0",
      });
      dependencies.push({
        name: "llama-index-embeddings-gemini",
-        version: "^0.2.0",
+        version: ">=0.3.0,<0.4.0",
      });
      break;
    case "mistral":
      dependencies.push({
        name: "llama-index-llms-mistralai",
-        version: "0.2.1",
+        version: ">=0.4.0,<0.5.0",
      });
      dependencies.push({
        name: "llama-index-embeddings-mistralai",
-        version: "0.2.0",
+        version: ">=0.3.0,<0.4.0",
      });
      break;
    case "azure-openai":
      dependencies.push({
        name: "llama-index-llms-azure-openai",
-        version: "0.2.0",
+        version: ">=0.3.0,<0.4.0",
      });
      dependencies.push({
        name: "llama-index-embeddings-azure-openai",
-        version: "0.2.4",
+        version: ">=0.3.0,<0.4.0",
      });
      break;
    case "huggingface":
      dependencies.push({
        name: "llama-index-llms-huggingface",
-        version: "^0.3.5",
+        version: ">=0.5.0,<0.6.0",
      });
      dependencies.push({
        name: "llama-index-embeddings-huggingface",
-        version: "^0.3.1",
+        version: ">=0.5.0,<0.6.0",
      });
      dependencies.push({
        name: "optimum",
-        version: "^1.23.3",
+        version: ">=1.23.3,<2.0.0",
        extras: ["onnxruntime"],
      });
      break;
    case "t-systems":
      dependencies.push({
        name: "llama-index-agent-openai",
-        version: "0.3.0",
+        version: ">=0.4.0,<0.5.0",
      });
      dependencies.push({
        name: "llama-index-llms-openai-like",
-        version: "0.2.0",
+        version: ">=0.3.0,<0.4.0",
      });
      break;
  }
@@ -274,54 +268,31 @@ const getAdditionalDependencies = (
    if (observability === "traceloop") {
      dependencies.push({
        name: "traceloop-sdk",
-        version: "^0.15.11",
+        version: ">=0.15.11",
      });
    }
    if (observability === "llamatrace") {
      dependencies.push({
        name: "llama-index-callbacks-arize-phoenix",
-        version: "^0.3.0",
+        version: ">=0.3.0,<0.4.0",
      });
    }
  }

-  return dependencies;
-};
-
-const mergePoetryDependencies = (
-  dependencies: Dependency[],
-  existingDependencies: Record<string, Omit<Dependency, "name"> | string>,
-) => {
-  for (const dependency of dependencies) {
-    let value = existingDependencies[dependency.name] ?? {};
-
-    // default string value is equal to attribute "version"
-    if (typeof value === "string") {
-      value = { version: value };
-    }
-
-    value.version = dependency.version ?? value.version;
-    value.extras = dependency.extras ?? value.extras;
-
-    // Merge constraints if they exist
-    if (dependency.constraints) {
-      value = { ...value, ...dependency.constraints };
-    }
-
-    if (value.version === undefined) {
-      throw new Error(
-        `Dependency "${dependency.name}" is missing attribute "version"!`,
-      );
-    }
-
-    // Serialize as object if there are any additional properties
-    if (Object.keys(value).length > 1) {
-      existingDependencies[dependency.name] = value;
-    } else {
-      // Otherwise, serialize just the version string
-      existingDependencies[dependency.name] = value.version;
-    }
+  // If app template is llama-index-server and CI and SERVER_PACKAGE_PATH is set,
+  // add @llamaindex/server to dependencies
+  if (
+    templateType === "llamaindexserver" &&
+    isCI &&
+    process.env.SERVER_PACKAGE_PATH
+  ) {
+    dependencies.push({
+      name: "llama-index-server",
+      version: `@file://${process.env.SERVER_PACKAGE_PATH}`,
+    });
  }
+
+  return dependencies;
 };

 const copyRouterCode = async (root: string, tools: Tool[]) => {
@@ -346,19 +317,100 @@ export const addDependencies = async (
    // Parse toml file
    const file = path.join(projectDir, FILENAME);
    const fileContent = await fs.readFile(file, "utf8");
-    const fileParsed = parse(fileContent);
+    let fileParsed: any;
+    try {
+      fileParsed = parse(fileContent);
+    } catch (parseError) {
+      console.error(`Error parsing ${FILENAME}:`, parseError);
+      throw new Error(
+        `Failed to parse ${FILENAME}. Please ensure it's valid TOML.`,
+      );
+    }

-    // Modify toml dependencies
-    const tool = fileParsed.tool as any;
-    const existingDependencies = tool.poetry.dependencies;
-    mergePoetryDependencies(dependencies, existingDependencies);
+    // Ensure [project] and [project.dependencies] exist
+    if (!fileParsed.project) {
+      fileParsed.project = {};
+    }
+    if (
+      !fileParsed.project.dependencies ||
+      !Array.isArray(fileParsed.project.dependencies)
+    ) {
+      // If dependencies exist but aren't an array, log a warning or error.
+      // For now, we'll overwrite it, assuming the intent is to use the standard array format.
+      console.warn(
+        `[project.dependencies] in ${FILENAME} is not an array. It will be overwritten.`,
+      );
+      fileParsed.project.dependencies = [];
+    }
+
+    const existingDependencies: string[] = fileParsed.project.dependencies;
+    const addedDeps: string[] = [];
+    const updatedDeps: string[] = [];
+
+    // Add or update dependencies.
+    // Each entry of [project.dependencies] is a requirement string such as
+    // `name[extra1,extra2]>=1.0,<2.0`. For every new dependency we build that
+    // string, then either replace the existing entry for the same package or
+    // append a new one.
+    for (const newDep of dependencies) {
+      let depString = newDep.name;
+      if (newDep.extras && newDep.extras.length > 0) {
+        depString += `[${newDep.extras.join(",")}]`;
+      }
+      if (newDep.version) {
+        depString += newDep.version;
+      }
+
+      let found = false;
+      for (let i = 0; i < existingDependencies.length; i++) {
+        // Extract the leading package name of the existing requirement string
+        const existingDepNameMatch =
+          existingDependencies[i].match(/^([a-zA-Z0-9._-]+)/);
+        // Compare package names only (case-insensitively). Comparing against
+        // the full requirement string (name + extras + version) would never
+        // match and every dependency would be appended as a duplicate.
+        if (
+          existingDepNameMatch &&
+          existingDepNameMatch[1].toLowerCase() === newDep.name.toLowerCase()
+        ) {
+          // Found existing dependency, update it
+          if (existingDependencies[i] !== depString) {
+            updatedDeps.push(`${existingDependencies[i]} -> ${depString}`);
+            existingDependencies[i] = depString;
+          }
+          found = true;
+          break;
+        }
+      }
+
+      if (!found) {
+        // Add new dependency
+        existingDependencies.push(depString);
+        addedDeps.push(depString);
+      }
+      // Handle python version constraints separately (if any)
+      if (newDep.constraints?.python) {
+        if (
+          !fileParsed.project["requires-python"] ||
+          fileParsed.project["requires-python"] !== newDep.constraints.python
+        ) {
+          // This simple overwrite might not be ideal; merging constraints is complex.
+          // For now, let's just set it if the new dependency has one.
+          console.log(
+            `Setting requires-python = "${newDep.constraints.python}" from dependency ${newDep.name}`,
+          );
+          fileParsed.project["requires-python"] = newDep.constraints.python;
+        }
+      }
+    }

    // Write toml file
    const newFileContent = stringify(fileParsed);
    await fs.writeFile(file, newFileContent);

-    const dependenciesString = dependencies.map((d) => d.name).join(", ");
-    console.log(`\nAdded ${dependenciesString} to ${cyan(FILENAME)}\n`);
+    if (addedDeps.length > 0) {
+      console.log(`\nAdded dependencies to ${cyan(FILENAME)}:`);
+      addedDeps.forEach((dep) => console.log(`  ${dep}`));
+    }
+    if (updatedDeps.length > 0) {
+      console.log(`\nUpdated dependencies in ${cyan(FILENAME)}:`);
+      updatedDeps.forEach((dep) => console.log(`  ${dep}`));
+    }
+    if (addedDeps.length > 0 || updatedDeps.length > 0) {
+      console.log(""); // Newline for spacing
+    }
  } catch (error) {
    console.log(
      `Error while updating dependencies for Poetry project file ${FILENAME}\n`,
@@ -367,18 +419,16 @@ export const addDependencies = async (
  }
 };

-export const installPythonDependencies = (
-  { noRoot }: { noRoot: boolean } = { noRoot: false },
-) => {
-  if (isPoetryAvailable()) {
+export const installPythonDependencies = () => {
+  if (isUvAvailable()) {
    console.log(
-      `Installing python dependencies using poetry. This may take a while...`,
+      `Installing Python dependencies using uv. This may take a while...`,
    );
-    const installSuccessful = tryPoetryInstall(noRoot);
+    const installSuccessful = tryUvSync();
    if (!installSuccessful) {
      console.error(
        red(
-          "Installing dependencies using poetry failed. Please check error log above and try running create-llama again.",
+          "Installing dependencies using uv failed. Please check the error log above and ensure uv is installed correctly.",
        ),
      );
      process.exit(1);
@@ -386,10 +436,10 @@ export const installPythonDependencies = (
  } else {
    console.error(
      red(
-        `Poetry is not available in the current environment. Please check ${terminalLink(
-          "Poetry Installation",
-          `https://python-poetry.org/docs/#installation`,
-        )} to install poetry first, then run create-llama again.`,
+        `uv is not available in the current environment. Please check ${terminalLink(
+          "uv Installation",
+          `https://github.com/astral-sh/uv#installation`,
+        )} to install uv first, then run create-llama again.`,
      ),
    );
    process.exit(1);
@@ -531,15 +581,21 @@ const installLlamaIndexServerTemplate = async ({
    process.exit(1);
  }

-  await copy("workflow.py", path.join(root, "app"), {
+  await copy("*.py", path.join(root, "app"), {
    parents: true,
-    cwd: path.join(templatesDir, "components", "workflows", "python", useCase),
+    cwd: path.join(templatesDir, "components", "use-cases", "python", useCase),
  });

  // Copy custom UI component code
  await copy(`*`, path.join(root, "components"), {
    parents: true,
-    cwd: path.join(templatesDir, "components", "ui", "workflows", useCase),
+    cwd: path.join(templatesDir, "components", "ui", "use-cases", useCase),
+  });
+
+  // Copy layout components to layout folder in root
+  await copy("*", path.join(root, "layout"), {
+    parents: true,
+    cwd: path.join(templatesDir, "components", "ui", "layout"),
  });

  if (useLlamaParse) {
@@ -570,7 +626,7 @@ const installLlamaIndexServerTemplate = async ({
  // Copy README.md
  await copy("README-template.md", path.join(root), {
    parents: true,
-    cwd: path.join(templatesDir, "components", "workflows", "python", useCase),
+    cwd: path.join(templatesDir, "components", "use-cases", "python", useCase),
    rename: assetRelocator,
  });
 };
@@ -641,6 +697,7 @@ export const installPythonTemplate = async ({
    dataSources,
    tools,
    template,
+    observability,
  );

  await addDependencies(root, addOnDependencies);
@@ -34,14 +34,24 @@ export function runReflexApp(appPath: string, port: number) {
    "--frontend-port",
    port.toString(),
  ];
-  return createProcess("poetry", commandArgs, {
+  return createProcess("uv", commandArgs, {
    stdio: "inherit",
    cwd: appPath,
  });
 }

-export function runFastAPIApp(appPath: string, port: number) {
-  return createProcess("poetry", ["run", "dev"], {
+export function runFastAPIApp(
+  appPath: string,
+  port: number,
+  template: TemplateType,
+) {
+  let commandArgs: string[];
+  if (template === "streaming") {
+    commandArgs = ["run", "dev"];
+  } else {
+    commandArgs = ["run", "fastapi", "dev", "--port", `${port}`];
+  }
+  return createProcess("uv", commandArgs, {
    stdio: "inherit",
    cwd: appPath,
    env: { ...process.env, APP_PORT: `${port}` },
@@ -73,7 +83,7 @@ export async function runApp(
        : framework === "fastapi"
          ? runFastAPIApp
          : runTSApp;
-    await appRunner(appPath, port || defaultPort);
+    await appRunner(appPath, port || defaultPort, template);
  } catch (error) {
    console.error("Failed to run app:", error);
    throw error;
@@ -41,7 +41,7 @@ export const supportedTools: Tool[] = [
    dependencies: [
      {
        name: "llama-index-tools-google",
-        version: "^0.3.0",
+        version: ">=0.3.0,<0.4.0",
      },
    ],
    supportedFrameworks: ["fastapi"],
@@ -62,7 +62,7 @@ export const supportedTools: Tool[] = [
    dependencies: [
      {
        name: "duckduckgo-search",
-        version: "^6.3.5",
+        version: ">=6.3.5,<7.0.0",
      },
    ],
    supportedFrameworks: ["fastapi"], // TODO: Re-enable this tool once the duck-duck-scrape TypeScript library works again
@@ -82,7 +82,7 @@ For better results, you can specify the region parameter to get results from a s
    dependencies: [
      {
        name: "llama-index-tools-wikipedia",
-        version: "^0.3.0",
+        version: ">=0.3.0,<0.4.0",
      },
    ],
    supportedFrameworks: ["fastapi", "express", "nextjs"],
@@ -102,11 +102,11 @@ For better results, you can specify the region parameter to get results from a s
    dependencies: [
      {
        name: "xhtml2pdf",
-        version: "^0.2.14",
+        version: ">=0.2.14,<0.3.0",
      },
      {
        name: "markdown",
-        version: "^3.7",
+        version: ">=3.7.0,<4.0.0",
      },
    ],
    type: ToolType.LOCAL,
@@ -124,7 +124,7 @@ For better results, you can specify the region parameter to get results from a s
    dependencies: [
      {
        name: "e2b_code_interpreter",
-        version: "1.1.1",
+        version: ">=1.1.1,<1.2.0",
      },
    ],
    supportedFrameworks: ["fastapi", "express", "nextjs"],
@@ -155,7 +155,7 @@ For better results, you can specify the region parameter to get results from a s
    dependencies: [
      {
        name: "e2b_code_interpreter",
-        version: "1.1.1",
+        version: ">=1.1.1,<1.2.0",
      },
    ],
    supportedFrameworks: ["fastapi", "express", "nextjs"],
@@ -184,7 +184,7 @@ For better results, you can specify the region parameter to get results from a s
      },
      {
        name: "jsonschema",
-        version: "^4.22.0",
+        version: ">=4.22.0,<5.0.0",
      },
      {
        name: "llama-index-tools-requests",
@@ -247,11 +247,11 @@ For better results, you can specify the region parameter to get results from a s
    dependencies: [
      {
        name: "pandas",
-        version: "^2.2.3",
+        version: ">=2.2.3,<3.0.0",
      },
      {
        name: "tabulate",
-        version: "^0.9.0",
+        version: ">=0.9.0,<1.0.0",
      },
    ],
  },
@@ -57,7 +57,10 @@ export type TemplateUseCase =
  | "form_filling"
  | "extractor"
  | "contract_review"
-  | "agentic_rag";
+  | "agentic_rag"
+  | "code_generator"
+  | "document_generator"
+  | "hitl";
 // Config for both file and folder
 export type FileSourceConfig =
  | {
@@ -4,6 +4,7 @@ import path from "path";
 import { bold, cyan, red, yellow } from "picocolors";
 import { assetRelocator, copy } from "../helpers/copy";
 import { callPackageManager } from "../helpers/install";
+import { NO_DATA_USE_CASES } from "./constant";
 import { templatesDir } from "./dir";
 import { PackageManager } from "./get-pkg-manager";
 import { InstallTemplateArgs, ModelProvider, TemplateVectorDB } from "./types";
@@ -31,23 +32,30 @@ const installLlamaIndexServerTemplate = async ({
    process.exit(1);
  }

-  await copy("workflow.ts", path.join(root, "src", "app"), {
-    parents: true,
+  await copy("**", path.join(root), {
    cwd: path.join(
      templatesDir,
      "components",
-      "workflows",
+      "use-cases",
      "typescript",
      useCase,
    ),
+    rename: assetRelocator,
  });

-  // copy workflow UI components to output/components folder
+  // copy workflow UI components to components folder in root
  await copy("*", path.join(root, "components"), {
    parents: true,
-    cwd: path.join(templatesDir, "components", "ui", "workflows", useCase),
+    cwd: path.join(templatesDir, "components", "ui", "use-cases", useCase),
  });

+  // copy layout components to layout folder in root
+  await copy("*", path.join(root, "layout"), {
+    parents: true,
+    cwd: path.join(templatesDir, "components", "ui", "layout"),
+  });
+
+  // Override generate.ts when LlamaCloud is used as the vector database
  if (vectorDb === "llamacloud") {
    await copy("generate.ts", path.join(root, "src"), {
      parents: true,
@@ -74,18 +82,14 @@ const installLlamaIndexServerTemplate = async ({
      rename: () => "data.ts",
    });
  }
-  // Copy README.md
-  await copy("README-template.md", path.join(root), {
-    parents: true,
-    cwd: path.join(
-      templatesDir,
-      "components",
-      "workflows",
-      "typescript",
-      useCase,
-    ),
-    rename: assetRelocator,
-  });
+
+  // Simplify use case code
+  if (useCase && NO_DATA_USE_CASES.includes(useCase)) {
+    // Artifact use case doesn't use index.
+    // We don't need data.ts, generate.ts
+    await fs.rm(path.join(root, "src", "app", "data.ts"));
+    // TODO: Remove generate index in generate.ts and package.json if possible
+  }
 };

 const installLegacyTSTemplate = async ({
@@ -390,7 +394,7 @@ const providerDependencies: {
  [key in ModelProvider]?: Record<string, string>;
 } = {
  openai: {
-    "@llamaindex/openai": "^0.2.0",
+    "@llamaindex/openai": "~0.4.0",
  },
  gemini: {
    "@llamaindex/google": "^0.2.0",
@@ -516,7 +520,7 @@ async function updatePackageJson({
  if (backend) {
    packageJson.dependencies = {
      ...packageJson.dependencies,
-      "@llamaindex/readers": "^2.0.0",
+      "@llamaindex/readers": "~3.1.4",
    };

    if (vectorDb && vectorDb in vectorDbDependencies) {
@@ -546,6 +550,16 @@ async function updatePackageJson({
    };
  }

+  // if having custom server package tgz file, use it for testing @llamaindex/server
+  const serverPackagePath = process.env.SERVER_PACKAGE_PATH;
+  if (serverPackagePath && template === "llamaindexserver") {
+    const relativePath = path.relative(process.cwd(), serverPackagePath);
+    packageJson.dependencies = {
+      ...packageJson.dependencies,
+      "@llamaindex/server": `file:${relativePath}`,
+    };
+  }
+
  await fs.writeFile(
    packageJsonFile,
    JSON.stringify(packageJson, null, 2) + os.EOL,
@@ -0,0 +1,42 @@
+// Helpers for invoking the uv CLI (part of the migration from poetry to uv)
+import { execSync } from "child_process";
+import fs from "fs";
+import { red } from "picocolors";
+
+/**
+ * Probe for the uv CLI by running `uv --version` with its output suppressed.
+ *
+ * @returns true if the command exits successfully, false if execSync throws.
+ */
+export function isUvAvailable(): boolean {
+  let available = true;
+  try {
+    execSync("uv --version", { stdio: "ignore" });
+  } catch (_) {
+    // Any failure of the probe is treated as "uv is not available".
+    available = false;
+  }
+  return available;
+}
+
+/**
+ * Run `uv sync`, streaming the command's output to this process's stdio.
+ *
+ * @returns true if the command exits successfully; false (after logging the
+ *   error in red) if execSync throws.
+ */
+export function tryUvSync(): boolean {
+  try {
+    console.log("Syncing environment with pyproject.toml...");
+    execSync("uv sync", {
+      stdio: "inherit",
+    });
+    return true;
+  } catch (error) {
+    // Report the failure instead of silently swallowing it, matching tryUvRun.
+    console.error(red(`Failed to run uv sync. Error: ${error}`));
+    return false;
+  }
+}
+
+/**
+ * Execute `uv run <command>` with stdio inherited from this process.
+ *
+ * @param command - text appended verbatim after `uv run`; it is interpolated
+ *   into the command string as-is, so it must come from trusted code.
+ * @returns true if the command exits successfully; false (after logging the
+ *   error in red) if execSync throws.
+ */
+export function tryUvRun(command: string): boolean {
+  let succeeded = false;
+  try {
+    execSync(`uv run ${command}`, { stdio: "inherit" });
+    succeeded = true;
+  } catch (error) {
+    console.error(red(`Failed to run ${command}. Error: ${error}`));
+  }
+  return succeeded;
+}
+
+/**
+ * Check whether a `uv.lock` file exists in the current working directory.
+ *
+ * @returns true if `uv.lock` exists, false otherwise.
+ */
+export function isHavingUvLockFile(): boolean {
+  // fs.existsSync reports failures as `false` rather than throwing, so the
+  // former try/catch wrapper was unreachable and has been dropped.
+  return fs.existsSync("uv.lock");
+}
@@ -1,4 +1,3 @@
-// eslint-disable-next-line import/no-extraneous-dependencies
 import validateProjectName from "validate-npm-package-name";

 export function validateNpmName(name: string): {
@@ -1,4 +1,3 @@
-/* eslint-disable import/no-extraneous-dependencies */
 import { execSync } from "child_process";
 import { Command } from "commander";
 import fs from "fs";
@@ -197,7 +196,7 @@ const program = new Command(packageJson.name)
    "--pro",
    `

-  Allow interactive selection of all features.
+  Deprecated: Allow interactive selection of all features.
 `,
    false,
  )
@@ -0,0 +1,76 @@
+{
+  "name": "create-llama",
+  "version": "0.5.22",
+  "description": "Create LlamaIndex-powered apps with one command",
+  "keywords": [
+    "rag",
+    "llamaindex",
+    "next.js"
+  ],
+  "repository": {
+    "type": "git",
+    "url": "https://github.com/run-llama/create-llama",
+    "directory": "packages/create-llama"
+  },
+  "license": "MIT",
+  "bin": {
+    "create-llama": "./dist/index.js"
+  },
+  "files": [
+    "dist",
+    "README.md",
+    "LICENSE.md"
+  ],
+  "scripts": {
+    "copy": "cp -r ../../README.md ../../LICENSE.md .",
+    "build": "bash ./scripts/build.sh",
+    "build:ncc": "pnpm run clean && ncc build ./index.ts -o ./dist/ --minify --no-cache --no-source-map-register",
+    "postbuild": "pnpm run copy",
+    "clean": "rimraf --glob ./dist ./templates/**/__pycache__ ./templates/**/node_modules ./templates/**/poetry.lock",
+    "dev": "ncc build ./index.ts -w -o dist/",
+    "e2e": "playwright test",
+    "e2e:python": "playwright test e2e/shared e2e/python",
+    "e2e:typescript": "playwright test e2e/shared e2e/typescript",
+    "pack-install": "bash ./scripts/pack.sh"
+  },
+  "dependencies": {
+    "@types/async-retry": "1.4.2",
+    "@types/ci-info": "2.0.0",
+    "@types/cross-spawn": "6.0.0",
+    "@types/fs-extra": "11.0.4",
+    "@types/node": "^20.11.7",
+    "@types/prompts": "2.4.2",
+    "@types/tar": "6.1.5",
+    "@types/validate-npm-package-name": "3.0.0",
+    "async-retry": "1.3.1",
+    "async-sema": "3.0.1",
+    "ci-info": "github:watson/ci-info#f43f6a1cefff47fb361c88cf4b943fdbcaafe540",
+    "commander": "12.1.0",
+    "cross-spawn": "7.0.3",
+    "fast-glob": "3.3.1",
+    "fs-extra": "11.2.0",
+    "global-agent": "^3.0.0",
+    "got": "10.7.0",
+    "ollama": "^0.5.0",
+    "ora": "^8.0.1",
+    "picocolors": "1.0.0",
+    "prompts": "2.4.2",
+    "smol-toml": "^1.1.4",
+    "tar": "6.1.15",
+    "terminal-link": "^3.0.0",
+    "update-check": "1.5.4",
+    "validate-npm-package-name": "3.0.0",
+    "yaml": "2.4.1"
+  },
+  "devDependencies": {
+    "@playwright/test": "^1.41.1",
+    "@vercel/ncc": "0.38.1",
+    "rimraf": "^5.0.5",
+    "typescript": "^5.3.3",
+    "wait-port": "^1.1.0"
+  },
+  "packageManager": "pnpm@9.0.5",
+  "engines": {
+    "node": ">=16.14.0"
+  }
+}
@@ -1,4 +1,3 @@
-/* eslint-disable turbo/no-undeclared-env-vars */
 import { defineConfig, devices } from "@playwright/test";

 export default defineConfig({
@@ -6,7 +6,7 @@ const defaults: Omit<QuestionArgs, "modelConfig"> = {
  framework: "nextjs",
  ui: "shadcn",
  frontend: false,
-  llamaCloudKey: "",
+  llamaCloudKey: undefined,
  useLlamaParse: false,
  communityProjectConfig: undefined,
  llamapack: "",
@@ -1,4 +1,5 @@
 import ciInfo from "ci-info";
+import { bold, yellow } from "picocolors";
 import { getCIQuestionResults } from "./ci";
 import { askProQuestions } from "./questions";
 import { askSimpleQuestions } from "./simple";
@@ -13,6 +14,12 @@ export const askQuestions = async (
    return await getCIQuestionResults(args);
  } else if (args.pro) {
    // TODO: refactor pro questions to return a result object
+    console.log(
+      yellow(
+        `Pro mode is deprecated. Please use the new templates using the ${bold("LlamaIndexServer")} by not specifying pro mode.`,
+      ),
+    );
+
    await askProQuestions(args);
    return args as unknown as QuestionResults;
  }
@@ -1,4 +1,5 @@
 import prompts from "prompts";
+import { NO_DATA_USE_CASES } from "../helpers/constant";
 import { EXAMPLE_10K_SEC_FILES, EXAMPLE_FILE } from "../helpers/datasources";
 import { askModelConfig } from "../helpers/providers";
 import { getTools } from "../helpers/tools";
@@ -6,7 +7,13 @@ import { ModelConfig, TemplateFramework } from "../helpers/types";
 import { PureQuestionArgs, QuestionResults } from "./types";
 import { askPostInstallAction, questionHandlers } from "./utils";

-type AppType = "agentic_rag" | "financial_report" | "deep_research";
+type AppType =
+  | "agentic_rag"
+  | "financial_report"
+  | "deep_research"
+  | "code_generator"
+  | "document_generator"
+  | "hitl";

 type SimpleAnswers = {
  appType: AppType;
@@ -42,6 +49,22 @@ export const askSimpleQuestions = async (
          description:
            "Researches and analyzes provided documents from multiple perspectives, generating a comprehensive report with citations to support key findings and insights.",
        },
+        {
+          title: "Code Generator",
+          value: "code_generator",
+          description: "Build a Vercel v0 styled code generator.",
+        },
+        {
+          title: "Document Generator",
+          value: "document_generator",
+          description: "Build a OpenAI canvas-styled document generator.",
+        },
+        {
+          title: "Human in the Loop",
+          value: "hitl",
+          description:
+            "Build a CLI command workflow that is reviewed by a human before execution",
+        },
      ],
    },
    questionHandlers,
@@ -52,35 +75,36 @@ export const askSimpleQuestions = async (

  let useLlamaCloud = false;

-  if (appType !== "extractor" && appType !== "contract_review") {
-    const { language: newLanguage } = await prompts(
-      {
-        type: "select",
-        name: "language",
-        message: "What language do you want to use?",
-        choices: [
-          { title: "Python (FastAPI)", value: "fastapi" },
-          { title: "Typescript (NextJS)", value: "nextjs" },
-        ],
-      },
-      questionHandlers,
-    );
-    language = newLanguage;
-  }
-
-  const { useLlamaCloud: newUseLlamaCloud } = await prompts(
+  const { language: newLanguage } = await prompts(
    {
-      type: "toggle",
-      name: "useLlamaCloud",
-      message: "Do you want to use LlamaCloud services?",
-      initial: false,
-      active: "Yes",
-      inactive: "No",
-      hint: "see https://www.llamaindex.ai/enterprise for more info",
+      type: "select",
+      name: "language",
+      message: "What language do you want to use?",
+      choices: [
+        { title: "Python (FastAPI)", value: "fastapi" },
+        { title: "Typescript (NextJS)", value: "nextjs" },
+      ],
    },
    questionHandlers,
  );
-  useLlamaCloud = newUseLlamaCloud;
+  language = newLanguage;
+
+  const shouldAskLlamaCloud = !NO_DATA_USE_CASES.includes(appType);
+  if (shouldAskLlamaCloud) {
+    const { useLlamaCloud: newUseLlamaCloud } = await prompts(
+      {
+        type: "toggle",
+        name: "useLlamaCloud",
+        message: "Do you want to use LlamaCloud services?",
+        initial: false,
+        active: "Yes",
+        inactive: "No",
+        hint: "see https://www.llamaindex.ai/enterprise for more info",
+      },
+      questionHandlers,
+    );
+    useLlamaCloud = newUseLlamaCloud;
+  }

  if (useLlamaCloud && !llamaCloudKey) {
    // Ask for LlamaCloud API key, if not set
@@ -111,10 +135,10 @@ const convertAnswers = async (
  args: PureQuestionArgs,
  answers: SimpleAnswers,
 ): Promise<QuestionResults> => {
-  const MODEL_GPT4o: ModelConfig = {
+  const MODEL_GPT41: ModelConfig = {
    provider: "openai",
    apiKey: args.openAiKey,
-    model: "gpt-4o",
+    model: "gpt-4.1",
    embeddingModel: "text-embedding-3-large",
    dimensions: 1536,
    isConfigured(): boolean {
@@ -135,13 +159,31 @@ const convertAnswers = async (
      template: "llamaindexserver",
      dataSources: EXAMPLE_10K_SEC_FILES,
      tools: getTools(["interpreter", "document_generator"]),
-      modelConfig: MODEL_GPT4o,
+      modelConfig: MODEL_GPT41,
    },
    deep_research: {
      template: "llamaindexserver",
      dataSources: EXAMPLE_10K_SEC_FILES,
      tools: [],
-      modelConfig: MODEL_GPT4o,
+      modelConfig: MODEL_GPT41,
+    },
+    code_generator: {
+      template: "llamaindexserver",
+      dataSources: [],
+      tools: [],
+      modelConfig: MODEL_GPT41,
+    },
+    document_generator: {
+      template: "llamaindexserver",
+      dataSources: [],
+      tools: [],
+      modelConfig: MODEL_GPT41,
+    },
+    hitl: {
+      template: "llamaindexserver",
+      dataSources: [],
+      tools: [],
+      modelConfig: MODEL_GPT41,
    },
  };

@@ -19,20 +19,20 @@ First, setup the environment with poetry:
 > **_Note:_** This step is not needed if you are using the dev-container.

 ```shell
-poetry install
+uv sync
 ```

 Then check the parameters that have been pre-configured in the `.env` file in this directory. (E.g. you might need to configure an `OPENAI_API_KEY` if you're using OpenAI as model provider).
 Second, generate the embeddings of the documents in the `./data` directory:

 ```shell
-poetry run generate
+uv run generate
 ```

 Third, run the development server:

 ```shell
-poetry run dev
+uv run dev
 ```

 By default, the example uses the explicit workflow. You can change the example by setting the `EXAMPLE_TYPE` environment variable to `choreography` or `orchestrator`.
@@ -52,7 +52,7 @@ Open [http://localhost:8000](http://localhost:8000) with your browser to start t
 To start the app optimized for **production**, run:

 ```
-poetry run prod
+uv run prod
 ```

 ## Deployments
--- a/Show More
+++ b/Show More