Bump version: 0.28.0-beta.4 → 0.28.0-beta.5

2026-05-23 15:00:39 +00:00 · 2026-04-12 23:51:05 +00:00
153 changed files with 17564 additions and 19504 deletions
--- a/.bumpversion.toml
+++ b/.bumpversion.toml
@@ -1,5 +1,5 @@
 [tool.bumpversion]
-current_version = "0.28.0-beta.11"
+current_version = "0.28.0-beta.5"
 parse = """(?x)
    (?P<major>0|[1-9]\\d*)\\.
    (?P<minor>0|[1-9]\\d*)\\.
--- a/.github/ISSUE_TEMPLATE/documentation.yml
+++ b/.github/ISSUE_TEMPLATE/documentation.yml
@@ -18,6 +18,6 @@ body:
      label: Link
      description: >
        Provide a link to the existing documentation, if applicable.
-      placeholder: ex. https://docs.lancedb.com/tables/...
+      placeholder: ex. https://lancedb.com/docs/tables/...
    validations:
      required: false
--- a/.github/dependabot.yml
+++ b/.github/dependabot.yml
@@ -1,18 +0,0 @@
-version: 2
-
-# Scope: the root Cargo workspace, which produces the Rust binaries we
-# ship to users (the Node.js and Python native extensions). The
-# `rust/lancedb` library crate shares the same lockfile; its consumers
-# pick their own dependency versions, but bumping transitive deps here
-# keeps the binaries we ship current.
-updates:
-  - package-ecosystem: cargo
-    directory: /
-    schedule:
-      interval: weekly
-    open-pull-requests-limit: 10
-    groups:
-      rust-minor-patch:
-        update-types:
-          - minor
-          - patch
--- a/.github/workflows/codex-fix-ci.yml
+++ b/.github/workflows/codex-fix-ci.yml
@@ -45,9 +45,7 @@ jobs:
      - name: Set up Node.js
        uses: actions/setup-node@v4
        with:
-          # pnpm 11 (used by the nodejs install step below) requires
-          # Node >= 22.13; use 24 since 22 hits EOL in October.
-          node-version: 24
+          node-version: 20

      - name: Install Codex CLI
        run: npm install -g @openai/codex
@@ -81,14 +79,10 @@ jobs:
          java-version: '11'
          cache: maven

-      - name: Setup pnpm
-        uses: pnpm/action-setup@v4
-        with:
-          version: 11.1.1
      - name: Install Node.js dependencies for TypeScript bindings
        run: |
          cd nodejs
-          pnpm install --frozen-lockfile
+          npm ci

      - name: Configure git user
        run: |
@@ -143,7 +137,7 @@ jobs:
               - For Rust test failures: Run the specific test with "cargo test -p <crate> <test_name>"
               - For Python test failures: Build with "cd python && maturin develop" then run "pytest <specific_test_file>::<test_name>"
               - For Java test failures: Run "cd java && mvn test -Dtest=<TestClass>#<testMethod>"
-               - For TypeScript test failures: Run "cd nodejs && pnpm build && pnpm test -- --testNamePattern='<test_name>'"
+               - For TypeScript test failures: Run "cd nodejs && npm run build && npm test -- --testNamePattern='<test_name>'"
               - Do NOT run the full test suite - only run the tests that were failing

          7. If the additional guidelines are provided, follow them as well.
--- a/.github/workflows/dev.yml
+++ b/.github/workflows/dev.yml
@@ -8,9 +8,6 @@ concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true

-permissions:
-  contents: read
-
 jobs:
  labeler:
    permissions:
--- a/.github/workflows/java-publish.yml
+++ b/.github/workflows/java-publish.yml
@@ -19,9 +19,6 @@ on:
    paths:
      - .github/workflows/java-publish.yml

-permissions:
-  contents: read
-
 jobs:
  publish:
    name: Build and Publish
@@ -43,7 +40,7 @@ jobs:
          server-username: SONATYPE_USER
          server-password: SONATYPE_TOKEN
          gpg-private-key: ${{ secrets.GPG_PRIVATE_KEY }}
-          gpg-passphrase: MAVEN_GPG_PASSPHRASE
+          gpg-passphrase: ${{ secrets.GPG_PASSPHRASE }}
      - name: Set git config
        run: |
          git config --global user.email "dev+gha@lancedb.com"
@@ -58,11 +55,10 @@ jobs:
          echo "use-agent" >> ~/.gnupg/gpg.conf
          echo "pinentry-mode loopback" >> ~/.gnupg/gpg.conf
          export GPG_TTY=$(tty)
-          ./mvnw --batch-mode -DskipTests -DpushChanges=false deploy -pl lancedb-core -am -P deploy-to-ossrh
+          ./mvnw --batch-mode -DskipTests -DpushChanges=false -Dgpg.passphrase=${{ secrets.GPG_PASSPHRASE }} deploy -pl lancedb-core -am -P deploy-to-ossrh
        env:
          SONATYPE_USER: ${{ secrets.SONATYPE_USER }}
          SONATYPE_TOKEN: ${{ secrets.SONATYPE_TOKEN }}
-          MAVEN_GPG_PASSPHRASE: ${{ secrets.GPG_PASSPHRASE }}

  report-failure:
    name: Report Workflow Failure
--- a/.github/workflows/java.yml
+++ b/.github/workflows/java.yml
@@ -24,9 +24,6 @@ on:
      - java/**
      - .github/workflows/java.yml

-permissions:
-  contents: read
-
 jobs:
  build-java:
    runs-on: ubuntu-24.04
--- a/.github/workflows/license-header-check.yml
+++ b/.github/workflows/license-header-check.yml
@@ -10,10 +10,6 @@ on:
      - nodejs/**
      - java/**
      - .github/workflows/license-header-check.yml
-
-permissions:
-  contents: read
-
 jobs:
  check-licenses:
    runs-on: ubuntu-latest
--- a/.github/workflows/nodejs.yml
+++ b/.github/workflows/nodejs.yml
@@ -15,9 +15,6 @@ on:
      - .github/workflows/nodejs.yml
      - docker-compose.yml

-permissions:
-  contents: read
-
 concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true
@@ -42,17 +39,11 @@ jobs:
      with:
        fetch-depth: 0
        lfs: true
-    - uses: pnpm/action-setup@v4
-      with:
-        version: 11.1.1
    - uses: actions/setup-node@v4
      with:
-        # pnpm 11 requires Node >= 22.13; use 24 since 22 hits EOL
-        # in October. The library itself still supports Node >= 18
-        # (see test matrix below).
-        node-version: 24
-        cache: 'pnpm'
-        cache-dependency-path: nodejs/pnpm-lock.yaml
+        node-version: 20
+        cache: 'npm'
+        cache-dependency-path: nodejs/package-lock.json
    - uses: actions-rust-lang/setup-rust-toolchain@v1
      with:
        components: rustfmt, clippy
@@ -67,13 +58,11 @@ jobs:
      run: cargo clippy --profile ci --all --all-features -- -D warnings
    - name: Lint Typescript
      run: |
-        pnpm install --frozen-lockfile
-        pnpm lint-ci
+        npm ci
+        npm run lint-ci
    - name: Lint examples
      working-directory: nodejs/examples
-      # The `@lancedb/lancedb` dep points at file:../dist; pnpm errors if
-      # that dir is missing, so create an empty one for lint-only runs.
-      run: mkdir -p ../dist && pnpm install --frozen-lockfile && pnpm lint-ci
+      run: npm ci && npm run lint-ci
  linux:
    name: Linux (NodeJS ${{ matrix.node-version }})
    timeout-minutes: 30
@@ -90,18 +79,14 @@ jobs:
      with:
        fetch-depth: 0
        lfs: true
-    - uses: pnpm/action-setup@v4
-      with:
-        version: 11.1.1
    - uses: actions/setup-node@v4
-      name: Setup Node.js 24 for build
+      name: Setup Node.js 20 for build
      with:
-        # pnpm 11 requires Node >= 22.13; use 24 since 22 hits EOL
-        # in October. Build/install runs on Node 24; tests run on the
-        # matrix version below using direct jest invocation.
-        node-version: 24
-        cache: 'pnpm'
-        cache-dependency-path: nodejs/pnpm-lock.yaml
+        # @napi-rs/cli v3 requires Node >= 20.12 (via @inquirer/prompts@8).
+        # Build always on Node 20; tests run on the matrix version below.
+        node-version: 20
+        cache: 'npm'
+        cache-dependency-path: nodejs/package-lock.json
    - uses: Swatinem/rust-cache@v2
    - name: Install dependencies
      run: |
@@ -109,52 +94,45 @@ jobs:
        sudo apt install -y protobuf-compiler libssl-dev
    - name: Build
      run: |
-        pnpm install --frozen-lockfile
-        # No `--` separator: pnpm forwards it literally, which would
-        # make napi-rs treat `--profile ci` as a cargo passthrough arg.
-        pnpm build:debug --profile ci
-        pnpm tsc
-    - name: Setup examples
-      working-directory: nodejs/examples
-      run: pnpm install --frozen-lockfile
-    - name: Check docs
-      run: |
-        # We run this as part of the job because the binary needs to be built
-        # first to export the types of the native code.
-        set -e
-        # `pnpm docs` would invoke pnpm's built-in `docs` command, not
-        # the script — use `pnpm run docs`.
-        pnpm run docs
-        if ! git diff --exit-code -- ../ ':(exclude)Cargo.lock'; then
-          echo "Docs need to be updated"
-          echo "Run 'pnpm run docs', fix any warnings, and commit the changes."
-          exit 1
-        fi
+        npm ci --include=optional
+        npm run build:debug -- --profile ci
    - uses: actions/setup-node@v4
      name: Setup Node.js ${{ matrix.node-version }} for test
      with:
        node-version: ${{ matrix.node-version }}
+    - name: Compile TypeScript
+      run: npm run tsc
    - name: Setup localstack
      working-directory: .
      run: docker compose up --detach --wait
    - name: Test
      env:
        S3_TEST: "1"
-        # Newer @smithy/core uses dynamic ESM imports.
-        NODE_OPTIONS: "--experimental-vm-modules"
-      # Invoke jest directly because pnpm 11 itself requires Node 22+
-      # while the matrix tests on older Node versions.
-      run: npx jest --verbose
+      run: npm run test
+    - name: Setup examples
+      working-directory: nodejs/examples
+      run: npm ci
    - name: Test examples
      working-directory: ./
      env:
        OPENAI_API_KEY: test
        OPENAI_BASE_URL: http://0.0.0.0:8000
-        NODE_OPTIONS: "--experimental-vm-modules"
      run: |
        python ci/mock_openai.py &
        cd nodejs/examples
-        npx jest --testEnvironment jest-environment-node-single-context --verbose
+        npm test
+    - name: Check docs
+      run: |
+        # We run this as part of the job because the binary needs to be built
+        # first to export the types of the native code.
+        set -e
+        npm ci
+        npm run docs
+        if ! git diff --exit-code -- ../ ':(exclude)Cargo.lock'; then
+          echo "Docs need to be updated"
+          echo "Run 'npm run docs', fix any warnings, and commit the changes."
+          exit 1
+        fi
  macos:
    timeout-minutes: 30
    runs-on: "macos-14"
@@ -167,28 +145,20 @@ jobs:
      with:
        fetch-depth: 0
        lfs: true
-    - uses: pnpm/action-setup@v4
-      with:
-        version: 11.1.1
    - uses: actions/setup-node@v4
      with:
-        # pnpm 11 requires Node >= 22.13; use 24 since 22 hits EOL
-        # in October.
-        node-version: 24
-        cache: 'pnpm'
-        cache-dependency-path: nodejs/pnpm-lock.yaml
-    - uses: dtolnay/rust-toolchain@stable
+        node-version: 20
+        cache: 'npm'
+        cache-dependency-path: nodejs/package-lock.json
    - uses: Swatinem/rust-cache@v2
    - name: Install dependencies
      run: |
        brew install protobuf
    - name: Build
      run: |
-        pnpm install --frozen-lockfile
-        # No `--` separator: pnpm forwards it literally, which would
-        # make napi-rs treat `--profile ci` as a cargo passthrough arg.
-        pnpm build:debug --profile ci
-        pnpm tsc
+        npm ci --include=optional
+        npm run build:debug -- --profile ci
+        npm run tsc
    - name: Test
      run: |
-        pnpm test
+        npm run test
--- a/.github/workflows/npm-publish.yml
+++ b/.github/workflows/npm-publish.yml
@@ -171,18 +171,13 @@ jobs:
        working-directory: nodejs
    steps:
      - uses: actions/checkout@v4
-      - name: Setup pnpm
-        uses: pnpm/action-setup@v4
-        with:
-          version: 11.1.1
      - name: Setup node
        uses: actions/setup-node@v4
+        if: ${{ !matrix.settings.docker }}
        with:
-          # pnpm 11 requires Node >= 22.13; use 24 since 22 hits EOL
-          # in October.
-          node-version: 24
-          cache: pnpm
-          cache-dependency-path: nodejs/pnpm-lock.yaml
+          node-version: 20
+          cache: npm
+          cache-dependency-path: nodejs/package-lock.json
      - name: Install
        uses: dtolnay/rust-toolchain@stable
        if: ${{ !matrix.settings.docker }}
@@ -200,7 +195,7 @@ jobs:
            target/
          key: nodejs-${{ matrix.settings.target }}-cargo-${{ matrix.settings.host }}
      - name: Install dependencies
-        run: pnpm install --frozen-lockfile
+        run: npm ci
      - name: Install Zig
        uses: mlugg/setup-zig@v2
        if: ${{ contains(matrix.settings.target, 'musl') }}
@@ -253,7 +248,7 @@ jobs:
      # one to do the upload.
      - name: Make generic artifacts
        if: ${{ matrix.settings.target == 'aarch64-apple-darwin' }}
-        run: pnpm tsc
+        run: npm run tsc
      - name: Upload Generic Artifacts
        if: ${{ matrix.settings.target == 'aarch64-apple-darwin' }}
        uses: actions/upload-artifact@v4
@@ -288,24 +283,14 @@ jobs:
        working-directory: nodejs
    steps:
      - uses: actions/checkout@v4
-      - name: Setup pnpm
-        uses: pnpm/action-setup@v4
-        with:
-          version: 11.1.1
-      - name: Setup Node.js 24 for install
-        uses: actions/setup-node@v4
-        with:
-          # pnpm 11 requires Node >= 22.13; use 24 since 22 hits EOL
-          # in October.
-          node-version: 24
-          cache: pnpm
-          cache-dependency-path: nodejs/pnpm-lock.yaml
-      - name: Install dependencies
-        run: pnpm install --frozen-lockfile
-      - name: Setup Node.js ${{ matrix.node }} for test
+      - name: Setup node
        uses: actions/setup-node@v4
        with:
          node-version: ${{ matrix.node }}
+          cache: npm
+          cache-dependency-path: nodejs/package-lock.json
+      - name: Install dependencies
+        run: npm ci
      - name: Download artifacts
        uses: actions/download-artifact@v4
        with:
@@ -326,9 +311,7 @@ jobs:
      - name: Move built files
        run: cp dist/native.d.ts dist/native.js dist/*.node lancedb/
      - name: Test bindings
-        # Invoke jest directly because pnpm 11 itself requires Node 22+
-        # while the matrix tests on older Node versions.
-        run: npx jest --verbose
+        run: npm test
  publish:
    name: Publish
    runs-on: ubuntu-latest
@@ -340,19 +323,15 @@ jobs:
      - test-lancedb
    steps:
      - uses: actions/checkout@v4
-      - name: Setup pnpm
-        uses: pnpm/action-setup@v4
-        with:
-          version: 11.1.1
      - name: Setup node
        uses: actions/setup-node@v4
        with:
          node-version: 24
-          cache: pnpm
-          cache-dependency-path: nodejs/pnpm-lock.yaml
+          cache: npm
+          cache-dependency-path: nodejs/package-lock.json
          registry-url: "https://registry.npmjs.org"
      - name: Install dependencies
-        run: pnpm install --frozen-lockfile
+        run: npm ci
      - uses: actions/download-artifact@v4
        with:
          name: nodejs-dist
@@ -372,7 +351,7 @@ jobs:
      - name: Display structure of downloaded files
        run: find dist && find nodejs-artifacts
      - name: Move artifacts
-        run: pnpm exec napi artifacts -d nodejs-artifacts
+        run: npx napi artifacts -d nodejs-artifacts
      - name: List packages
        run: find npm
      - name: Publish
--- a/.github/workflows/pypi-publish.yml
+++ b/.github/workflows/pypi-publish.yml
@@ -14,16 +14,10 @@ on:
 env:
  PIP_EXTRA_INDEX_URL: "https://pypi.fury.io/lance-format/ https://pypi.fury.io/lancedb/"

-permissions:
-  contents: read
-
 jobs:
  linux:
    name: Python ${{ matrix.config.platform }} manylinux${{ matrix.config.manylinux }}
    timeout-minutes: 60
-    permissions:
-      id-token: write
-      contents: read
    strategy:
      matrix:
        config:
@@ -63,12 +57,10 @@ jobs:
      - uses: ./.github/workflows/upload_wheel
        if: startsWith(github.ref, 'refs/tags/python-v')
        with:
+          pypi_token: ${{ secrets.LANCEDB_PYPI_API_TOKEN }}
          fury_token: ${{ secrets.FURY_TOKEN }}
  mac:
    timeout-minutes: 90
-    permissions:
-      id-token: write
-      contents: read
    runs-on: ${{ matrix.config.runner }}
    strategy:
      matrix:
@@ -93,12 +85,10 @@ jobs:
      - uses: ./.github/workflows/upload_wheel
        if: startsWith(github.ref, 'refs/tags/python-v')
        with:
+          pypi_token: ${{ secrets.LANCEDB_PYPI_API_TOKEN }}
          fury_token: ${{ secrets.FURY_TOKEN }}
  windows:
    timeout-minutes: 60
-    permissions:
-      id-token: write
-      contents: read
    runs-on: windows-latest
    steps:
      - uses: actions/checkout@v4
@@ -117,6 +107,7 @@ jobs:
      - uses: ./.github/workflows/upload_wheel
        if: startsWith(github.ref, 'refs/tags/python-v')
        with:
+          pypi_token: ${{ secrets.LANCEDB_PYPI_API_TOKEN }}
          fury_token: ${{ secrets.FURY_TOKEN }}
  gh-release:
    if: startsWith(github.ref, 'refs/tags/python-v')
--- a/.github/workflows/python.yml
+++ b/.github/workflows/python.yml
@@ -17,9 +17,6 @@ on:
      - .github/workflows/build_windows_wheel/**
      - .github/workflows/run_tests/**

-permissions:
-  contents: read
-
 concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true
@@ -111,6 +108,7 @@ jobs:
      - name: Install
        run: |
          pip install --extra-index-url https://pypi.fury.io/lance-format/ --extra-index-url https://pypi.fury.io/lancedb/ -e .[tests,dev,embeddings]
+          pip install tantivy
          pip install mlx
      - name: Doctest
        run: pytest --doctest-modules python/lancedb
@@ -229,5 +227,6 @@ jobs:
          pip install "pydantic<2"
          pip install pyarrow==16
          pip install --extra-index-url https://pypi.fury.io/lance-format/ --extra-index-url https://pypi.fury.io/lancedb/ -e .[tests]
+          pip install tantivy
      - name: Run tests
        run: pytest -m "not slow and not s3_test" -x -v --durations=30 python/tests
--- a/.github/workflows/rust.yml
+++ b/.github/workflows/rust.yml
@@ -9,15 +9,9 @@ on:
      - Cargo.toml
      - Cargo.lock
      - rust-toolchain.toml
-      - deny.toml
      - rust/**
-      - nodejs/Cargo.toml
-      - python/Cargo.toml
      - .github/workflows/rust.yml

-permissions:
-  contents: read
-
 concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true
@@ -59,17 +53,6 @@ jobs:
      - name: Run clippy (without remote feature)
        run: cargo clippy --profile ci --workspace --tests -- -D warnings

-  deny:
-    # Supply-chain checks: advisories, licenses, banned crates, and source
-    # restrictions. Configuration lives in `deny.toml` at the workspace root.
-    timeout-minutes: 10
-    runs-on: ubuntu-24.04
-    steps:
-      - uses: actions/checkout@v4
-      - uses: EmbarkStudios/cargo-deny-action@v2
-        with:
-          command: check advisories bans licenses sources
-
  build-no-lock:
    runs-on: ubuntu-24.04
    timeout-minutes: 30
--- a/.github/workflows/update_package_lock_run.yml
+++ b/.github/workflows/update_package_lock_run.yml
@@ -3,9 +3,6 @@ name: Update package-lock.json
 on:
  workflow_dispatch:

-permissions:
-  contents: read
-
 jobs:
  publish:
    runs-on: ubuntu-latest
--- a/.github/workflows/update_package_lock_run_nodejs.yml
+++ b/.github/workflows/update_package_lock_run_nodejs.yml
@@ -3,9 +3,6 @@ name: Update NodeJs package-lock.json
 on:
  workflow_dispatch:

-permissions:
-  contents: read
-
 jobs:
  publish:
    runs-on: ubuntu-latest
--- a/.github/workflows/upload_wheel/action.yml
+++ b/.github/workflows/upload_wheel/action.yml
@@ -2,6 +2,9 @@ name: upload-wheel

 description: "Upload wheels to Pypi"
 inputs:
+  pypi_token:
+    required: true
+    description: "release token for the repo"
  fury_token:
    required: true
    description: "release token for the fury repo"
@@ -9,6 +12,12 @@ inputs:
 runs:
  using: "composite"
  steps:
+  - name: Install dependencies
+    shell: bash
+    run: |
+      python -m pip install --upgrade pip
+      pip install twine
+      python3 -m pip install --upgrade pkginfo
  - name: Choose repo
    shell: bash
    id: choose_repo
@@ -18,17 +27,19 @@ runs:
      else
        echo "repo=pypi" >> $GITHUB_OUTPUT
      fi
-  - name: Publish to Fury
-    if: steps.choose_repo.outputs.repo == 'fury'
+  - name: Publish to PyPI
    shell: bash
    env:
      FURY_TOKEN: ${{ inputs.fury_token }}
+      PYPI_TOKEN: ${{ inputs.pypi_token }}
    run: |
-      WHEEL=$(ls target/wheels/lancedb-*.whl 2> /dev/null | head -n 1)
-      echo "Uploading $WHEEL to Fury"
-      curl -f -F package=@$WHEEL https://$FURY_TOKEN@push.fury.io/lancedb/
-  - name: Publish to PyPI
-    if: steps.choose_repo.outputs.repo == 'pypi'
-    uses: pypa/gh-action-pypi-publish@release/v1
-    with:
-      packages-dir: target/wheels/
+      if [[ ${{ steps.choose_repo.outputs.repo }} == fury ]]; then
+        WHEEL=$(ls target/wheels/lancedb-*.whl 2> /dev/null | head -n 1)
+        echo "Uploading $WHEEL to Fury"
+        curl -f -F package=@$WHEEL https://$FURY_TOKEN@push.fury.io/lancedb/
+      else
+        twine upload --repository ${{ steps.choose_repo.outputs.repo }} \
+          --username __token__ \
+          --password $PYPI_TOKEN \
+          target/wheels/lancedb-*.whl
+      fi
--- a/Cargo.lock
+++ b/Cargo.lock
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -1,5 +1,7 @@
 [workspace]
 members = ["rust/lancedb", "nodejs", "python"]
+# Python package needs to be built by maturin.
+exclude = ["python"]
 resolver = "2"

 [workspace.package]
@@ -13,40 +15,40 @@ categories = ["database-implementations"]
 rust-version = "1.91.0"

 [workspace.dependencies]
-lance = { "version" = "=7.0.0-beta.9", default-features = false, "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-core = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-datagen = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-file = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-io = { "version" = "=7.0.0-beta.9", default-features = false, "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-index = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-linalg = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-namespace = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-namespace-impls = { "version" = "=7.0.0-beta.9", default-features = false, "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-table = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-testing = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-datafusion = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-encoding = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
-lance-arrow = { "version" = "=7.0.0-beta.9", "tag" = "v7.0.0-beta.9", "git" = "https://github.com/lance-format/lance.git" }
+lance = { "version" = "=5.1.0-beta.3", default-features = false, "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-core = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-datagen = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-file = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-io = { "version" = "=5.1.0-beta.3", default-features = false, "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-index = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-linalg = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-namespace = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-namespace-impls = { "version" = "=5.1.0-beta.3", default-features = false, "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-table = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-testing = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-datafusion = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-encoding = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
+lance-arrow = { "version" = "=5.1.0-beta.3", "tag" = "v5.1.0-beta.3", "git" = "https://github.com/lance-format/lance.git" }
 ahash = "0.8"
 # Note that this one does not include pyarrow
-arrow = { version = "58.0.0", optional = false }
-arrow-array = "58.0.0"
-arrow-data = "58.0.0"
-arrow-ipc = "58.0.0"
-arrow-ord = "58.0.0"
-arrow-schema = "58.0.0"
-arrow-select = "58.0.0"
-arrow-cast = "58.0.0"
+arrow = { version = "57.2", optional = false }
+arrow-array = "57.2"
+arrow-data = "57.2"
+arrow-ipc = "57.2"
+arrow-ord = "57.2"
+arrow-schema = "57.2"
+arrow-select = "57.2"
+arrow-cast = "57.2"
 async-trait = "0"
-datafusion = { version = "53.0.0", default-features = false }
-datafusion-catalog = "53.0.0"
-datafusion-common = { version = "53.0.0", default-features = false }
-datafusion-execution = "53.0.0"
-datafusion-expr = "53.0.0"
-datafusion-functions = "53.0.0"
-datafusion-physical-plan = "53.0.0"
-datafusion-physical-expr = "53.0.0"
-datafusion-sql = "53.0.0"
+datafusion = { version = "52.1", default-features = false }
+datafusion-catalog = "52.1"
+datafusion-common = { version = "52.1", default-features = false }
+datafusion-execution = "52.1"
+datafusion-expr = "52.1"
+datafusion-functions = "52.1"
+datafusion-physical-plan = "52.1"
+datafusion-physical-expr = "52.1"
+datafusion-sql = "52.1"
 env_logger = "0.11"
 half = { "version" = "2.7.1", default-features = false, features = [
    "num-traits",
@@ -54,7 +56,7 @@ half = { "version" = "2.7.1", default-features = false, features = [
 futures = "0"
 log = "0.4"
 moka = { version = "0.12", features = ["future"] }
-object_store = "0.13.2"
+object_store = "0.12.0"
 pin-project = "1.0.7"
 rand = "0.9"
 snafu = "0.8"
--- a/README.md
+++ b/README.md
@@ -15,7 +15,7 @@

 # **The Multimodal AI Lakehouse**

-[**How to Install** ](#how-to-install) ✦ [**Detailed Documentation**](https://docs.lancedb.com) ✦ [**Tutorials and Recipes**](https://github.com/lancedb/vectordb-recipes/tree/main) ✦  [**Contributors**](#contributors) 
+[**How to Install** ](#how-to-install) ✦ [**Detailed Documentation**](https://lancedb.com/docs) ✦ [**Tutorials and Recipes**](https://github.com/lancedb/vectordb-recipes/tree/main) ✦  [**Contributors**](#contributors) 

 **The ultimate multimodal data platform for AI/ML applications.** 

@@ -57,7 +57,7 @@ LanceDB is a central location where developers can build, train and analyze thei

 ## **How to Install**:

-Follow the [Quickstart](https://docs.lancedb.com/quickstart) doc to set up LanceDB locally. 
+Follow the [Quickstart](https://lancedb.com/docs/quickstart/) doc to set up LanceDB locally. 

 **API & SDK:** We also support Python, Typescript and Rust SDKs

--- a/deny.toml
+++ b/deny.toml
@@ -1,196 +0,0 @@
-# cargo-deny configuration for LanceDB.
-#
-# Run locally with `cargo deny check`. See
-# https://embarkstudios.github.io/cargo-deny/ for the full reference.
-
-# The set of target triples we care about. cargo-deny will only consider
-# dependencies that are used on at least one of these targets. Keeping this
-# explicit avoids noise from platform-specific crates (e.g. wasm, android,
-# ios) that we never actually ship.
-[graph]
-targets = [
-    "x86_64-unknown-linux-gnu",
-    "aarch64-unknown-linux-gnu",
-    "x86_64-apple-darwin",
-    "aarch64-apple-darwin",
-    "x86_64-pc-windows-msvc",
-    "aarch64-pc-windows-msvc",
-]
-all-features = true
-
-[output]
-feature-depth = 1
-
-# ---------------------------------------------------------------------------
-# Advisories: security vulnerabilities and yanked crates.
-# ---------------------------------------------------------------------------
-[advisories]
-version = 2
-# Fail the check if any crate in the lockfile has been yanked from crates.io.
-# Yanked crates are a signal the author retracted the release (often due to
-# bugs or security issues) and should not be depended on.
-yanked = "deny"
-# Advisory IDs we have explicitly reviewed and chosen to accept. Every
-# entry must include a rationale and, where possible, an upstream issue
-# pointing to a fix. Revisit this list whenever dependencies are updated.
-ignore = [
-    # rsa: Marvin Attack timing side-channel in PKCS#1 v1.5 decryption.
-    # Reached only through opendal → reqsign → rsa. We do not use RSA
-    # decryption in LanceDB ourselves; this is dormant in the signing path.
-    # No fixed release exists upstream as of this writing.
-    # https://rustsec.org/advisories/RUSTSEC-2023-0071
-    { id = "RUSTSEC-2023-0071", reason = "rsa crate via opendal/reqsign; no fixed upstream release" },
-
-    # instant: unmaintained. Pulled in via backoff → instant. Upstream
-    # recommends switching to `web-time`; fix has to come from backoff.
-    # https://rustsec.org/advisories/RUSTSEC-2024-0384
-    { id = "RUSTSEC-2024-0384", reason = "transitive via backoff; waiting on backoff replacement" },
-
-    # paste: unmaintained (author archived the repo). Used transitively by
-    # datafusion and the arrow ecosystem; widespread, no drop-in replacement.
-    # https://rustsec.org/advisories/RUSTSEC-2024-0436
-    { id = "RUSTSEC-2024-0436", reason = "transitive via datafusion; awaiting ecosystem migration" },
-
-    # encoding: unmaintained. Reached through lindera-dictionary, which is
-    # required by the native Lindera tokenizer path. Lindera has not migrated
-    # off this crate yet.
-    # https://rustsec.org/advisories/RUSTSEC-2021-0153
-    { id = "RUSTSEC-2021-0153", reason = "transitive via lindera-dictionary for native Lindera tokenizer" },
-
-    # fast-float: unsound and unmaintained. Reached only through polars-arrow
-    # from the optional Polars integration; replacement requires a Polars
-    # dependency upgrade.
-    # https://rustsec.org/advisories/RUSTSEC-2024-0379
-    { id = "RUSTSEC-2024-0379", reason = "transitive via polars-arrow; waiting on Polars migration" },
-
-    # tantivy: segfault on malformed input due to missing bounds check.
-    # Pulled in via lance for full-text search. We only feed tantivy
-    # documents we construct ourselves, not attacker-controlled bytes.
-    # Tracked for a lance dependency bump.
-    # https://rustsec.org/advisories/RUSTSEC-2025-0003
-    { id = "RUSTSEC-2025-0003", reason = "tantivy via lance; inputs are internally produced, not user-supplied bytes" },
-
-    # backoff: unmaintained. Reached only via async-openai. Replacement
-    # requires async-openai to migrate (or us to drop async-openai).
-    # https://rustsec.org/advisories/RUSTSEC-2025-0012
-    { id = "RUSTSEC-2025-0012", reason = "transitive via async-openai; waiting on upstream migration" },
-
-    # number_prefix: unmaintained. Transitive via indicatif → hf-hub.
-    # No security impact, just maintenance status.
-    # https://rustsec.org/advisories/RUSTSEC-2025-0119
-    { id = "RUSTSEC-2025-0119", reason = "transitive via hf-hub/indicatif; cosmetic formatting crate" },
-
-    # bincode: unmaintained. Reached through lindera and lindera-dictionary,
-    # which are required by the native Lindera tokenizer path. Lindera has not
-    # migrated to another serialization format yet.
-    # https://rustsec.org/advisories/RUSTSEC-2025-0141
-    { id = "RUSTSEC-2025-0141", reason = "transitive via lindera/lindera-dictionary for native Lindera tokenizer" },
-
-    # lru: soundness issue in IterMut. Reached only through aws-sdk-s3 in
-    # LanceDB's dev-dependency graph; LanceDB does not use that iterator
-    # directly. Clearing this requires the AWS SDK chain to update lru.
-    # https://rustsec.org/advisories/RUSTSEC-2026-0002
-    { id = "RUSTSEC-2026-0002", reason = "transitive via aws-sdk-s3 dev-dependency; waiting on AWS SDK lru upgrade" },
-
-    # rustls-webpki 0.101.7 (old major line): name-constraint checks for
-    # URI / wildcard names. Pulled in only via the legacy rustls 0.21 chain
-    # from aws-smithy-http-client. The 0.103 line we actively use is patched.
-    # Clearing the 0.101 copy requires the aws-sdk chain to migrate off
-    # rustls 0.21.
-    # https://rustsec.org/advisories/RUSTSEC-2026-0098
-    # https://rustsec.org/advisories/RUSTSEC-2026-0099
-    { id = "RUSTSEC-2026-0098", reason = "only affects rustls-webpki 0.101 from legacy aws-smithy/rustls 0.21 chain" },
-    { id = "RUSTSEC-2026-0099", reason = "only affects rustls-webpki 0.101 from legacy aws-smithy/rustls 0.21 chain" },
-
-    # rustls-webpki 0.101.7: reachable panic in CRL parsing. Same legacy
-    # rustls 0.21 chain from aws-smithy-http-client as above. The 0.103 line
-    # we actively use is upgraded to 0.103.13 which contains the fix.
-    # https://rustsec.org/advisories/RUSTSEC-2026-0104
-    { id = "RUSTSEC-2026-0104", reason = "only affects rustls-webpki 0.101 from legacy aws-smithy/rustls 0.21 chain" },
-
-    # rand 0.8.5: soundness issue only when ThreadRng reseeds inside a custom
-    # logger. Reached through several transitive chains. LanceDB does not use
-    # rand from a custom logger; upgrade once all pinned chains accept 0.8.6+.
-    # https://rustsec.org/advisories/RUSTSEC-2026-0097
-    { id = "RUSTSEC-2026-0097", reason = "transitive rand 0.8.5; LanceDB does not call ThreadRng from custom logging" },
-]
-
-# ---------------------------------------------------------------------------
-# Licenses: only allow licenses we've reviewed as compatible with Apache-2.0.
-# ---------------------------------------------------------------------------
-[licenses]
-version = 2
-# SPDX identifiers for licenses that are compatible with our Apache-2.0
-# distribution. Additions require legal review.
-allow = [
-    "Apache-2.0",
-    "Apache-2.0 WITH LLVM-exception",
-    "MIT",
-    "BSD-2-Clause",
-    "BSD-3-Clause",
-    "ISC",
-    "Unicode-3.0",
-    "Unicode-DFS-2016",
-    "Zlib",
-    "CC0-1.0",
-    "MPL-2.0",
-    "BSL-1.0",
-    "OpenSSL",
-    # 0BSD ("BSD Zero Clause") is effectively public domain — no attribution
-    # required. Pulled in by `mock_instant`.
-    "0BSD",
-    # bzip2-1.0.6 is the permissive upstream bzip2 license (BSD-like). Pulled
-    # in by `libbz2-rs-sys`, the pure-Rust bzip2 implementation.
-    "bzip2-1.0.6",
-    # CDLA-Permissive-2.0 is a permissive data license used by `webpki-roots`
-    # for the Mozilla CA root bundle. Data-only, distribution-compatible.
-    "CDLA-Permissive-2.0",
-]
-confidence-threshold = 0.8
-# Crates whose license cannot be determined from Cargo metadata but whose
-# license we've manually confirmed from upstream. Keep this list minimal.
-[[licenses.clarify]]
-# polars-arrow-format omits the `license` field in its Cargo.toml, but the
-# upstream repo (pola-rs/polars-arrow-format) is dual-licensed Apache-2.0 OR
-# MIT. See https://github.com/pola-rs/polars-arrow-format/blob/main/LICENSE
-crate = "polars-arrow-format"
-expression = "Apache-2.0 OR MIT"
-license-files = []
-
-# ---------------------------------------------------------------------------
-# Bans: disallow specific crates and flag dependency hygiene issues.
-# ---------------------------------------------------------------------------
-[bans]
-# Warn (not deny) on duplicate versions of the same crate. In a large
-# workspace like this one, duplicates are common and often unavoidable
-# transitively. We surface them to discourage growth, but don't fail CI.
-multiple-versions = "warn"
-# Wildcard version requirements (`foo = "*"`) are a footgun — they let any
-# future release in without review. Ban them outright.
-wildcards = "deny"
-# Internal workspace crates reference each other via `path = "..."`, which
-# cargo-deny sees as a wildcard version. That's fine for private workspace
-# members (not published to crates.io), so allow it specifically for paths.
-allow-wildcard-paths = true
-# Features that, if enabled, should cause the check to fail.
-deny = []
-# Crates to skip when checking for duplicate versions.
-skip = []
-# Similar to `skip`, but also skips the entire transitive subtree.
-skip-tree = []
-
-# ---------------------------------------------------------------------------
-# Sources: restrict where crates can come from.
-# ---------------------------------------------------------------------------
-[sources]
-# Deny any registry other than the ones explicitly listed below.
-unknown-registry = "deny"
-# Deny any git dependency whose host isn't in the allow-list below. This
-# prevents accidental pulls from arbitrary forks.
-unknown-git = "deny"
-allow-registry = ["https://github.com/rust-lang/crates.io-index"]
-# Lance is developed in a sibling repo and pulled as a git dependency until
-# releases are cut to crates.io. Allow that specific host.
-allow-git = [
-    "https://github.com/lance-format/lance",
-]
--- a/dockerfiles/Dockerfile
+++ b/dockerfiles/Dockerfile
@@ -24,4 +24,4 @@ RUN python --version && \
  rustc --version && \
  protoc --version

-RUN pip install --no-cache-dir lancedb
+RUN pip install --no-cache-dir tantivy lancedb
--- a/docs/README.md
+++ b/docs/README.md
@@ -1,6 +1,6 @@
 # LanceDB Documentation

-LanceDB docs are available at [docs.lancedb.com](https://docs.lancedb.com).
+LanceDB docs are available at [lancedb.com/docs](https://lancedb.com/docs).

 The SDK docs are built and deployed automatically by [Github Actions](../.github/workflows/docs.yml)
 whenever a commit is pushed to the `main` branch. So it is possible for the docs to show
--- a/docs/src/java/java.md
+++ b/docs/src/java/java.md
@@ -14,7 +14,7 @@ Add the following dependency to your `pom.xml`:
 <dependency>
    <groupId>com.lancedb</groupId>
    <artifactId>lancedb-core</artifactId>
-    <version>0.28.0-beta.11</version>
+    <version>0.28.0-beta.5</version>
 </dependency>
 ```

--- a/docs/src/js/README.md
+++ b/docs/src/js/README.md
@@ -34,7 +34,7 @@ const results = await table.vectorSearch([0.1, 0.3]).limit(20).toArray();
 console.log(results);
 ```

-The [quickstart](https://docs.lancedb.com/quickstart/) contains more complete examples.
+The [quickstart](https://lancedb.com/docs/quickstart/basic-usage/) contains more complete examples.

 ## Development

--- a/docs/src/js/_media/CONTRIBUTING.md
+++ b/docs/src/js/_media/CONTRIBUTING.md
@@ -12,22 +12,20 @@ Typescript.
 * `src/`: Rust bindings source code
 * `lancedb/`: Typescript package source code
 * `__test__/`: Unit tests
-* `examples/`: A pnpm package with the examples shown in the documentation
+* `examples/`: An npm package with the examples shown in the documentation

 ## Development environment

 To set up your development environment, you will need to install the following:

-1. Node.js 22 or later (required by pnpm 11)
-2. [pnpm](https://pnpm.io/installation) 11 or later (or run via `corepack enable`,
-   which uses the `packageManager` field in `package.json`)
-3. Rust's package manager, Cargo. Use [rustup](https://rustup.rs/) to install.
-4. [protoc](https://grpc.io/docs/protoc-installation/) (Protocol Buffers compiler)
+1. Node.js 14 or later
+2. Rust's package manager, Cargo. Use [rustup](https://rustup.rs/) to install.
+3. [protoc](https://grpc.io/docs/protoc-installation/) (Protocol Buffers compiler)

 Initial setup:

 ```shell
-pnpm install
+npm install
 ```

 ### Commit Hooks
@@ -41,38 +39,38 @@ pre-commit install

 ## Development

-Most common development commands can be run using the pnpm scripts.
+Most common development commands can be run using the npm scripts.

 Build the package

 ```shell
-pnpm install
-pnpm build
+npm install
+npm run build
 ```

 Lint:

 ```shell
-pnpm lint
+npm run lint
 ```

 Format and fix lints:

 ```shell
-pnpm lint-fix
+npm run lint-fix
 ```

 Run tests:

 ```shell
-pnpm test
+npm test
 ```

 To run a single test:

 ```shell
 # Single file: table.test.ts
-pnpm test -- table.test.ts
+npm test -- table.test.ts
 # Single test: 'merge insert' in table.test.ts
-pnpm test -- table.test.ts --testNamePattern=merge\ insert
+npm test -- table.test.ts --testNamePattern=merge\ insert
 ```
--- a/docs/src/js/classes/Connection.md
+++ b/docs/src/js/classes/Connection.md
@@ -148,33 +148,6 @@ Creates a new empty Table

 ***

-### createNamespace()
-
-```ts
-abstract createNamespace(namespacePath, options?): Promise<CreateNamespaceResponse>
-```
-
-Create a new namespace at the given path.
-
-#### Parameters
-
-* **namespacePath**: `string`[]
-    The namespace path to create.
-
-* **options?**: `Partial`&lt;[`CreateNamespaceOptions`](../interfaces/CreateNamespaceOptions.md)&gt;
-    Creation `mode`
-    ("create" | "exist_ok" | "overwrite") and optional `properties`
-    to attach to the namespace.
-
-#### Returns
-
-`Promise`&lt;[`CreateNamespaceResponse`](../interfaces/CreateNamespaceResponse.md)&gt;
-
-The properties of the
-  created namespace and an optional transaction id.
-
-***
-
 ### createTable()

 #### createTable(options, namespacePath)
@@ -257,29 +230,6 @@ Creates a new Table and initialize it with new data.

 ***

-### describeNamespace()
-
-```ts
-abstract describeNamespace(namespacePath): Promise<DescribeNamespaceResponse>
-```
-
-Describe a namespace, returning its properties.
-
-#### Parameters
-
-* **namespacePath**: `string`[]
-    The namespace path to describe, in
-    parent → child order, e.g. `["analytics", "sales"]`.
-
-#### Returns
-
-`Promise`&lt;[`DescribeNamespaceResponse`](../interfaces/DescribeNamespaceResponse.md)&gt;
-
-The namespace's properties
-  (may be undefined if the namespace has none).
-
-***
-
 ### display()

 ```ts
@@ -313,36 +263,6 @@ Drop all tables in the database.

 ***

-### dropNamespace()
-
-```ts
-abstract dropNamespace(namespacePath, options?): Promise<DropNamespaceResponse>
-```
-
-Drop a namespace.
-
-Use `behavior: "cascade"` to also drop everything contained in the
-namespace (sub-namespaces and tables). The default `"restrict"`
-behavior refuses to drop a non-empty namespace.
-
-#### Parameters
-
-* **namespacePath**: `string`[]
-    The namespace path to drop.
-
-* **options?**: `Partial`&lt;[`DropNamespaceOptions`](../interfaces/DropNamespaceOptions.md)&gt;
-    `mode` ("skip" | "fail"
-    for missing-namespace handling) and `behavior` ("restrict" | "cascade").
-
-#### Returns
-
-`Promise`&lt;[`DropNamespaceResponse`](../interfaces/DropNamespaceResponse.md)&gt;
-
-Any properties returned by
-  the server and an optional transaction id.
-
-***
-
 ### dropTable()

 ```ts
@@ -379,36 +299,6 @@ Return true if the connection has not been closed

 ***

-### listNamespaces()
-
-```ts
-abstract listNamespaces(namespacePath?, options?): Promise<ListNamespacesResponse>
-```
-
-List the immediate child namespaces under the given parent.
-
-Results may be paginated. To retrieve subsequent pages, pass the
-`pageToken` returned by a previous call.
-
-#### Parameters
-
-* **namespacePath?**: `string`[]
-    The parent namespace path. Defaults
-    to the root namespace if omitted.
-
-* **options?**: `Partial`&lt;[`ListNamespacesOptions`](../interfaces/ListNamespacesOptions.md)&gt;
-    Pagination options
-    (`pageToken`, `limit`).
-
-#### Returns
-
-`Promise`&lt;[`ListNamespacesResponse`](../interfaces/ListNamespacesResponse.md)&gt;
-
-Child namespace names and
-  an optional token for fetching the next page.
-
-***
-
 ### openTable()

 ```ts
@@ -437,29 +327,6 @@ Open a table in the database.

 ***

-### renameTable()
-
-```ts
-abstract renameTable(
-   oldName,
-   newName,
-   namespacePath?): Promise<void>
-```
-
-#### Parameters
-
-* **oldName**: `string`
-
-* **newName**: `string`
-
-* **namespacePath?**: `string`[]
-
-#### Returns
-
-`Promise`&lt;`void`&gt;
-
-***
-
 ### tableNames()

 #### tableNames(options)
--- a/docs/src/js/classes/Scannable.md
+++ b/docs/src/js/classes/Scannable.md
@@ -1,173 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / Scannable
-
-# Class: Scannable
-
-A data source that can be scanned as a stream of Arrow `RecordBatch`es.
-
-`Scannable` wraps the schema + optional row count + rescannable flag and
-a callback that yields batches one at a time. It is passed to consumers
-(e.g. `Table.add`, `createTable`, `mergeInsert` — follow-up work) that
-need to pull data without materializing the full dataset in JS memory.
-
-Batches cross the JS↔Rust boundary as Arrow IPC Stream messages; a fresh
-writer serializes each batch, and the Rust side decodes it with
-`arrow_ipc::reader::StreamReader`. One batch is in flight at a time.
-
-## Properties
-
-### numRows
-
-```ts
-readonly numRows: null | number;
-```
-
-***
-
-### rescannable
-
-```ts
-readonly rescannable: boolean;
-```
-
-***
-
-### schema
-
-```ts
-readonly schema: Schema<any>;
-```
-
-## Methods
-
-### fromFactory()
-
-```ts
-static fromFactory(
-   schema,
-   factory,
-   opts): Promise<Scannable>
-```
-
-Build a Scannable from an explicit schema and a factory that returns a
-fresh batch iterator on each call.
-
-The factory is invoked once per scan. Each iterator yields
-`RecordBatch`es matching the declared schema. Use this when you need
-direct control over the pull loop — for example, to wrap a streaming
-source whose batches are produced lazily.
-
-#### Parameters
-
-* **schema**: `Schema`&lt;`any`&gt;
-    The Arrow schema of the produced batches.
-
-* **factory**
-    Called at the start of each scan to produce a batch
-    iterator. Must be idempotent when `rescannable` is true.
-
-* **opts**: [`ScannableOptions`](../interfaces/ScannableOptions.md) = `{}`
-    Optional hints. `rescannable` defaults to `true`; set to
-    `false` if calling `factory()` twice would not reproduce the same data.
-
-#### Returns
-
-`Promise`&lt;[`Scannable`](Scannable.md)&gt;
-
-***
-
-### fromIterable()
-
-```ts
-static fromIterable(
-   schema,
-   iter,
-   opts): Promise<Scannable>
-```
-
-Build a Scannable from an iterable of `RecordBatch`es. `rescannable`
-defaults to `false`. Pass an explicit schema so the consumer can
-validate before any batch is pulled.
-
-`opts.rescannable: true` is honest for replayable iterables (Arrays,
-Sets, or custom iterables whose `[Symbol.iterator]()` returns a fresh
-iterator each call). It is rejected for one-shot iterables (generators,
-async generators, or already-an-iterator inputs) because their
-`[Symbol.iterator]()` returns the same exhausted object on the second
-scan. For replayable sources outside this shape, use
-`fromFactory(schema, () => createIter(), { rescannable: true })`.
-
-Note: when `opts.rescannable` is `true`, the constructor calls
-`[Symbol.iterator]()` once on the input to perform the structural check.
-
-#### Parameters
-
-* **schema**: `Schema`&lt;`any`&gt;
-
-* **iter**: `Iterable`&lt;`RecordBatch`&lt;`any`&gt;&gt; \| `AsyncIterable`&lt;`RecordBatch`&lt;`any`&gt;&gt;
-
-* **opts**: [`ScannableOptions`](../interfaces/ScannableOptions.md) = `{}`
-
-#### Returns
-
-`Promise`&lt;[`Scannable`](Scannable.md)&gt;
-
-***
-
-### fromRecordBatchReader()
-
-```ts
-static fromRecordBatchReader(reader, opts): Promise<Scannable>
-```
-
-Build a Scannable from an Arrow `RecordBatchReader`. A reader can only
-be consumed once; `rescannable` defaults to `false`.
-
-The reader must already be opened (via `.open()`) so its `.schema` is
-populated. `RecordBatchReader.from(...)` returns an unopened reader.
-
-`opts.rescannable: true` is rejected because `RecordBatchReader` is a
-self-iterator (its `[Symbol.iterator]()` returns itself), and this
-constructor does not call `reader.reset()` between scans, so a second
-scan would always see an exhausted reader. For genuinely replayable
-sources, use
-`fromFactory(schema, () => openReader(), { rescannable: true })`,
-which mints a fresh reader on each scan.
-
-#### Parameters
-
-* **reader**: `RecordBatchReader`&lt;`any`&gt;
-
-* **opts**: [`ScannableOptions`](../interfaces/ScannableOptions.md) = `{}`
-
-#### Returns
-
-`Promise`&lt;[`Scannable`](Scannable.md)&gt;
-
-***
-
-### fromTable()
-
-```ts
-static fromTable(table, opts): Promise<Scannable>
-```
-
-Build a Scannable from an in-memory Arrow `Table`. Always rescannable;
-the table's batches are replayed on each scan.
-
-The table's row count is authoritative: `opts.numRows` must either be
-omitted or equal to `table.numRows`. `opts.rescannable` of `false` is
-rejected because in-memory Tables are always rescannable.
-
-#### Parameters
-
-* **table**: `Table`&lt;`any`&gt;
-
-* **opts**: [`ScannableOptions`](../interfaces/ScannableOptions.md) = `{}`
-
-#### Returns
-
-`Promise`&lt;[`Scannable`](Scannable.md)&gt;
--- a/docs/src/js/classes/Table.md
+++ b/docs/src/js/classes/Table.md
@@ -501,34 +501,6 @@ Modeled after ``VACUUM`` in PostgreSQL.

 ***

-### prewarmData()
-
-```ts
-abstract prewarmData(columns?): Promise<void>
-```
-
-Prewarm one or more columns of data in the table.
-
-#### Parameters
-
-* **columns?**: `string`[]
-    The columns to prewarm. If undefined, all columns are prewarmed.
-    This will load the column data into the page cache so that future queries that
-    read those columns avoid the initial cold-start latency.  This call initiates
-    prewarming and returns once the request is accepted; the warming itself may
-    continue in the background.  Calling it on already-prewarmed columns is a
-    no-op on the server.
-    Prewarming is generally useful for columns used in filters or projections.
-    Large columns (e.g. high-dimensional vectors or binary data) may not be
-    practical to prewarm.
-    This feature is currently only supported on remote tables.
-
-#### Returns
-
-`Promise`&lt;`void`&gt;
-
-***
-
 ### prewarmIndex()

 ```ts
--- a/docs/src/js/functions/connectNamespace.md
+++ b/docs/src/js/functions/connectNamespace.md
@@ -1,131 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / connectNamespace
-
-# Function: connectNamespace()
-
-## connectNamespace(implName, config, options)
-
-```ts
-function connectNamespace(
-   implName,
-   config,
-   options?): Promise<Connection>
-```
-
-Connect to a LanceDB database through a namespace.
-
-Unlike [connect](connect.md), which routes by URI scheme (local path vs.
-`db://` cloud), `connectNamespace` always returns a namespace-backed
-connection. The `implName` selects the namespace implementation:
-
- `"dir"` — directory namespace, configured with [DirNamespaceConfig](../interfaces/DirNamespaceConfig.md).
- `"rest"` — remote REST catalog, configured with [RestNamespaceConfig](../interfaces/RestNamespaceConfig.md).
- Any other string — full module path for a custom implementation,
-  configured with a free-form string-keyed `properties` map.
-
-### Parameters
-
-* **implName**: `"dir"`
-
-* **config**: [`DirNamespaceConfig`](../interfaces/DirNamespaceConfig.md)
-
-* **options?**: `Partial`&lt;[`ConnectNamespaceOptions`](../interfaces/ConnectNamespaceOptions.md)&gt;
-
-### Returns
-
-`Promise`&lt;[`Connection`](../classes/Connection.md)&gt;
-
-### Examples
-
-```ts
-const db = await connectNamespace("dir", { root: "/path/to/db" });
-await db.createTable("users", [{ id: 1 }]);
-```
-
-```ts
-const db = await connectNamespace("rest", {
-  uri: "https://catalog.example.com",
-  headers: { "x-api-key": process.env.CATALOG_KEY ?? "" },
-});
-```
-
-```ts
-const db = await connectNamespace("my.custom.Namespace", {
-  endpoint: "...",
-});
-```
-
-## connectNamespace(implName, config, options)
-
-```ts
-function connectNamespace(
-   implName,
-   config,
-   options?): Promise<Connection>
-```
-
-Connect through the built-in REST namespace.
-
-Configured with [RestNamespaceConfig](../interfaces/RestNamespaceConfig.md). See the function-level
-documentation above for the full surface, examples, and how this
-relates to [connect](connect.md).
-
-### Parameters
-
-* **implName**: `"rest"`
-
-* **config**: [`RestNamespaceConfig`](../interfaces/RestNamespaceConfig.md)
-
-* **options?**: `Partial`&lt;[`ConnectNamespaceOptions`](../interfaces/ConnectNamespaceOptions.md)&gt;
-
-### Returns
-
-`Promise`&lt;[`Connection`](../classes/Connection.md)&gt;
-
-### Example
-
-```ts
-const db = await connectNamespace("rest", {
-  uri: "https://catalog.example.com",
-  headers: { "x-api-key": process.env.CATALOG_KEY ?? "" },
-});
-```
-
-## connectNamespace(implName, properties, options)
-
-```ts
-function connectNamespace(
-   implName,
-   properties,
-   options?): Promise<Connection>
-```
-
-Connect through a custom namespace implementation by full module path,
-configured with a free-form string-keyed `properties` map. Use the
-typed overloads above for the built-in `"dir"` and `"rest"` impls.
-
-See the function-level documentation above for examples and how this
-relates to [connect](connect.md).
-
-### Parameters
-
-* **implName**: `string`
-
-* **properties**: `Record`&lt;`string`, `string`&gt;
-
-* **options?**: `Partial`&lt;[`ConnectNamespaceOptions`](../interfaces/ConnectNamespaceOptions.md)&gt;
-
-### Returns
-
-`Promise`&lt;[`Connection`](../classes/Connection.md)&gt;
-
-### Example
-
-```ts
-const db = await connectNamespace("my.custom.Namespace", {
-  endpoint: "...",
-});
-```
--- a/docs/src/js/globals.md
+++ b/docs/src/js/globals.md
@@ -32,7 +32,6 @@
 - [PhraseQuery](classes/PhraseQuery.md)
 - [Query](classes/Query.md)
 - [QueryBase](classes/QueryBase.md)
- [Scannable](classes/Scannable.md)
 - [Session](classes/Session.md)
 - [StaticHeaderProvider](classes/StaticHeaderProvider.md)
 - [Table](classes/Table.md)
@@ -52,17 +51,10 @@
 - [ClientConfig](interfaces/ClientConfig.md)
 - [ColumnAlteration](interfaces/ColumnAlteration.md)
 - [CompactionStats](interfaces/CompactionStats.md)
- [ConnectNamespaceOptions](interfaces/ConnectNamespaceOptions.md)
 - [ConnectionOptions](interfaces/ConnectionOptions.md)
- [CreateNamespaceOptions](interfaces/CreateNamespaceOptions.md)
- [CreateNamespaceResponse](interfaces/CreateNamespaceResponse.md)
 - [CreateTableOptions](interfaces/CreateTableOptions.md)
 - [DeleteResult](interfaces/DeleteResult.md)
- [DescribeNamespaceResponse](interfaces/DescribeNamespaceResponse.md)
- [DirNamespaceConfig](interfaces/DirNamespaceConfig.md)
 - [DropColumnsResult](interfaces/DropColumnsResult.md)
- [DropNamespaceOptions](interfaces/DropNamespaceOptions.md)
- [DropNamespaceResponse](interfaces/DropNamespaceResponse.md)
 - [ExecutableQuery](interfaces/ExecutableQuery.md)
 - [FragmentStatistics](interfaces/FragmentStatistics.md)
 - [FragmentSummaryStats](interfaces/FragmentSummaryStats.md)
@@ -77,17 +69,13 @@
 - [IvfFlatOptions](interfaces/IvfFlatOptions.md)
 - [IvfPqOptions](interfaces/IvfPqOptions.md)
 - [IvfRqOptions](interfaces/IvfRqOptions.md)
- [ListNamespacesOptions](interfaces/ListNamespacesOptions.md)
- [ListNamespacesResponse](interfaces/ListNamespacesResponse.md)
 - [MergeResult](interfaces/MergeResult.md)
 - [OpenTableOptions](interfaces/OpenTableOptions.md)
 - [OptimizeOptions](interfaces/OptimizeOptions.md)
 - [OptimizeStats](interfaces/OptimizeStats.md)
 - [QueryExecutionOptions](interfaces/QueryExecutionOptions.md)
 - [RemovalStats](interfaces/RemovalStats.md)
- [RestNamespaceConfig](interfaces/RestNamespaceConfig.md)
 - [RetryConfig](interfaces/RetryConfig.md)
- [ScannableOptions](interfaces/ScannableOptions.md)
 - [ShuffleOptions](interfaces/ShuffleOptions.md)
 - [SplitCalculatedOptions](interfaces/SplitCalculatedOptions.md)
 - [SplitHashOptions](interfaces/SplitHashOptions.md)
@@ -119,7 +107,6 @@

 - [RecordBatchIterator](functions/RecordBatchIterator.md)
 - [connect](functions/connect.md)
- [connectNamespace](functions/connectNamespace.md)
 - [makeArrowTable](functions/makeArrowTable.md)
 - [packBits](functions/packBits.md)
 - [permutationBuilder](functions/permutationBuilder.md)
--- a/docs/src/js/interfaces/ConnectNamespaceOptions.md
+++ b/docs/src/js/interfaces/ConnectNamespaceOptions.md
@@ -1,54 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / ConnectNamespaceOptions
-
-# Interface: ConnectNamespaceOptions
-
-## Properties
-
-### namespaceClientProperties?
-
-```ts
-optional namespaceClientProperties: Record<string, string>;
-```
-
-Extra properties for the backing namespace client.
-
-***
-
-### readConsistencyInterval?
-
-```ts
-optional readConsistencyInterval: number;
-```
-
-The interval, in seconds, at which to check for updates to the table
-from other processes. If None, then consistency is not checked. For
-performance reasons, this is the default. For strong consistency, set
-this to zero seconds. Then every read will check for updates from other
-processes. As a compromise, you can set this to a non-zero value for
-eventual consistency.
-
-***
-
-### session?
-
-```ts
-optional session: Session;
-```
-
-The session to use for this connection. Holds shared caches and other
-session-specific state.
-
-***
-
-### storageOptions?
-
-```ts
-optional storageOptions: Record<string, string>;
-```
-
-Configuration for object storage. The available options are described
-at https://docs.lancedb.com/storage/
--- a/docs/src/js/interfaces/ConnectionOptions.md
+++ b/docs/src/js/interfaces/ConnectionOptions.md
@@ -41,29 +41,6 @@ for testing purposes.

 ***

-### manifestEnabled?
-
-```ts
-optional manifestEnabled: boolean;
-```
-
-(For LanceDB OSS only): use directory namespace manifests as the source
-of truth for table metadata. Existing directory-listed root tables are
-migrated into the manifest on access.
-
-***
-
-### namespaceClientProperties?
-
-```ts
-optional namespaceClientProperties: Record<string, string>;
-```
-
-(For LanceDB OSS only): extra properties for the backing namespace
-client used by manifest-enabled native connections.
-
-***
-
 ### readConsistencyInterval?

 ```ts
@@ -112,4 +89,4 @@ optional storageOptions: Record<string, string>;

 (For LanceDB OSS only): configuration for object storage.

-The available options are described at https://docs.lancedb.com/storage/
+The available options are described at https://lancedb.com/docs/storage/
--- a/docs/src/js/interfaces/CreateNamespaceOptions.md
+++ b/docs/src/js/interfaces/CreateNamespaceOptions.md
@@ -1,27 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / CreateNamespaceOptions
-
-# Interface: CreateNamespaceOptions
-
-## Properties
-
-### mode?
-
-```ts
-optional mode: "overwrite" | "create" | "exist_ok";
-```
-
-Creation mode.
-
-***
-
-### properties?
-
-```ts
-optional properties: Record<string, string>;
-```
-
-Properties to set on the new namespace.
--- a/docs/src/js/interfaces/CreateNamespaceResponse.md
+++ b/docs/src/js/interfaces/CreateNamespaceResponse.md
@@ -1,23 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / CreateNamespaceResponse
-
-# Interface: CreateNamespaceResponse
-
-## Properties
-
-### properties?
-
-```ts
-optional properties: Record<string, string>;
-```
-
-***
-
-### transactionId?
-
-```ts
-optional transactionId: string;
-```
--- a/docs/src/js/interfaces/CreateTableOptions.md
+++ b/docs/src/js/interfaces/CreateTableOptions.md
@@ -97,4 +97,4 @@ Configuration for object storage.
 Options already set on the connection will be inherited by the table,
 but can be overridden here.

-The available options are described at https://docs.lancedb.com/storage/
+The available options are described at https://lancedb.com/docs/storage/
--- a/docs/src/js/interfaces/DescribeNamespaceResponse.md
+++ b/docs/src/js/interfaces/DescribeNamespaceResponse.md
@@ -1,15 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / DescribeNamespaceResponse
-
-# Interface: DescribeNamespaceResponse
-
-## Properties
-
-### properties?
-
-```ts
-optional properties: Record<string, string>;
-```
--- a/docs/src/js/interfaces/DirNamespaceConfig.md
+++ b/docs/src/js/interfaces/DirNamespaceConfig.md
@@ -1,47 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / DirNamespaceConfig
-
-# Interface: DirNamespaceConfig
-
-Configuration for the built-in directory namespace (`"dir"`).
-
-The directory namespace stores tables under a single root path (local
-filesystem or object storage URI). See
-[https://docs.lancedb.com/namespaces](https://docs.lancedb.com/namespaces) for the documented surface;
-less-common knobs live under [DirNamespaceConfig.extraProperties](DirNamespaceConfig.md#extraproperties).
-
-## Properties
-
-### extraProperties?
-
-```ts
-optional extraProperties: Record<string, string>;
-```
-
-Additional raw properties passed verbatim to the namespace
-implementation (e.g. `storage.*`, `credential_vendor.*`). Typed
-fields above take precedence on key collision.
-
-***
-
-### manifestEnabled?
-
-```ts
-optional manifestEnabled: boolean;
-```
-
-Whether to maintain a namespace manifest at the root. Required for
-child namespaces. Defaults to true on the impl side.
-
-***
-
-### root
-
-```ts
-root: string;
-```
-
-Root path or URI containing the LanceDB tables.
--- a/docs/src/js/interfaces/DropNamespaceOptions.md
+++ b/docs/src/js/interfaces/DropNamespaceOptions.md
@@ -1,27 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / DropNamespaceOptions
-
-# Interface: DropNamespaceOptions
-
-## Properties
-
-### behavior?
-
-```ts
-optional behavior: "restrict" | "cascade";
-```
-
-Refuse to drop if non-empty (restrict) or drop recursively (cascade).
-
-***
-
-### mode?
-
-```ts
-optional mode: "fail" | "skip";
-```
-
-Whether to skip if the namespace doesn't exist, or fail.
--- a/docs/src/js/interfaces/DropNamespaceResponse.md
+++ b/docs/src/js/interfaces/DropNamespaceResponse.md
@@ -1,23 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / DropNamespaceResponse
-
-# Interface: DropNamespaceResponse
-
-## Properties
-
-### properties?
-
-```ts
-optional properties: Record<string, string>;
-```
-
-***
-
-### transactionId?
-
-```ts
-optional transactionId: string[];
-```
--- a/docs/src/js/interfaces/ListNamespacesOptions.md
+++ b/docs/src/js/interfaces/ListNamespacesOptions.md
@@ -1,27 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / ListNamespacesOptions
-
-# Interface: ListNamespacesOptions
-
-## Properties
-
-### limit?
-
-```ts
-optional limit: number;
-```
-
-An optional limit to the number of results to return.
-
-***
-
-### pageToken?
-
-```ts
-optional pageToken: string;
-```
-
-Token from a previous response for pagination.
--- a/docs/src/js/interfaces/ListNamespacesResponse.md
+++ b/docs/src/js/interfaces/ListNamespacesResponse.md
@@ -1,23 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / ListNamespacesResponse
-
-# Interface: ListNamespacesResponse
-
-## Properties
-
-### namespaces
-
-```ts
-namespaces: string[];
-```
-
-***
-
-### pageToken?
-
-```ts
-optional pageToken: string;
-```
--- a/docs/src/js/interfaces/OpenTableOptions.md
+++ b/docs/src/js/interfaces/OpenTableOptions.md
@@ -42,4 +42,4 @@ Configuration for object storage.
 Options already set on the connection will be inherited by the table,
 but can be overridden here.

-The available options are described at https://docs.lancedb.com/storage/
+The available options are described at https://lancedb.com/docs/storage/
--- a/docs/src/js/interfaces/RestNamespaceConfig.md
+++ b/docs/src/js/interfaces/RestNamespaceConfig.md
@@ -1,47 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / RestNamespaceConfig
-
-# Interface: RestNamespaceConfig
-
-Configuration for the built-in REST namespace (`"rest"`).
-
-The REST namespace talks to a remote catalog server over HTTP. See
-[https://docs.lancedb.com/namespaces](https://docs.lancedb.com/namespaces) for the documented surface;
-less-common knobs (TLS, metrics) live under
-[RestNamespaceConfig.extraProperties](RestNamespaceConfig.md#extraproperties).
-
-## Properties
-
-### extraProperties?
-
-```ts
-optional extraProperties: Record<string, string>;
-```
-
-Additional raw properties passed verbatim to the namespace
-implementation (e.g. `tls.*`, `ops_metrics_enabled`, `delimiter`).
-Typed fields above take precedence on key collision.
-
-***
-
-### headers?
-
-```ts
-optional headers: Record<string, string>;
-```
-
-HTTP headers forwarded with each request. Keys are passed through
-as-is (e.g. `"x-api-key"`, `"Authorization"`).
-
-***
-
-### uri
-
-```ts
-uri: string;
-```
-
-Catalog endpoint URL.
--- a/docs/src/js/interfaces/ScannableOptions.md
+++ b/docs/src/js/interfaces/ScannableOptions.md
@@ -1,29 +0,0 @@
-[**@lancedb/lancedb**](../README.md) • **Docs**
-
-***
-
-[@lancedb/lancedb](../globals.md) / ScannableOptions
-
-# Interface: ScannableOptions
-
-## Properties
-
-### numRows?
-
-```ts
-optional numRows: number;
-```
-
-Hint about the number of rows. Not validated against the stream.
-
-***
-
-### rescannable?
-
-```ts
-optional rescannable: boolean;
-```
-
-Whether the source can be scanned more than once. Defaults to `true` for
-`fromTable` / `fromFactory` and `false` for `fromIterable` /
-`fromRecordBatchReader`.
--- a/docs/src/python/python.md
+++ b/docs/src/python/python.md
@@ -94,11 +94,11 @@ of raw SQL strings with [where][lancedb.query.LanceQueryBuilder.where] and

 ## Full text search

-Use [lancedb.table.Table.create_fts_index][] for the synchronous API or
-[lancedb.table.AsyncTable.create_index][] with [lancedb.index.FTS][] for the
-asynchronous API.
+::: lancedb.fts.create_index

-::: lancedb.index.FTS
+::: lancedb.fts.populate_index
+
+::: lancedb.fts.search_index

 ## Utilities

--- a/java/lancedb-core/pom.xml
+++ b/java/lancedb-core/pom.xml
@@ -8,7 +8,7 @@
    <parent>
      <groupId>com.lancedb</groupId>
      <artifactId>lancedb-parent</artifactId>
-      <version>0.28.0-beta.11</version>
+      <version>0.28.0-beta.5</version>
      <relativePath>../pom.xml</relativePath>
    </parent>

--- a/java/pom.xml
+++ b/java/pom.xml
@@ -6,7 +6,7 @@

    <groupId>com.lancedb</groupId>
    <artifactId>lancedb-parent</artifactId>
-    <version>0.28.0-beta.11</version>
+    <version>0.28.0-beta.5</version>
    <packaging>pom</packaging>
    <name>${project.artifactId}</name>
    <description>LanceDB Java SDK Parent POM</description>
@@ -28,7 +28,7 @@
    <properties>
        <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
        <arrow.version>15.0.0</arrow.version>
-        <lance-core.version>7.0.0-beta.9</lance-core.version>
+        <lance-core.version>5.1.0-beta.3</lance-core.version>
        <spotless.skip>false</spotless.skip>
        <spotless.version>2.30.0</spotless.version>
        <spotless.java.googlejavaformat.version>1.7</spotless.java.googlejavaformat.version>
--- a/nodejs/AGENTS.md
+++ b/nodejs/AGENTS.md
@@ -3,11 +3,11 @@ The core Rust library is in the `../rust/lancedb` directory, the rust binding
 code is in the `src/` directory and the typescript bindings are in
 the `lancedb/` directory.

-Whenever you change the Rust code, you will need to recompile: `pnpm build`.
+Whenever you change the Rust code, you will need to recompile: `npm run build`.

 Common commands:
-* Build: `pnpm build`
-* Lint: `pnpm lint`
-* Fix lints: `pnpm lint-fix`
-* Test: `pnpm test`
-* Run single test file: `pnpm test __test__/arrow.test.ts`
+* Build: `npm run build`
+* Lint: `npm run lint`
+* Fix lints: `npm run lint-fix`
+* Test: `npm test`
+* Run single test file: `npm test __test__/arrow.test.ts`
--- a/nodejs/CONTRIBUTING.md
+++ b/nodejs/CONTRIBUTING.md
@@ -12,22 +12,20 @@ Typescript.
 * `src/`: Rust bindings source code
 * `lancedb/`: Typescript package source code
 * `__test__/`: Unit tests
-* `examples/`: A pnpm package with the examples shown in the documentation
+* `examples/`: An npm package with the examples shown in the documentation

 ## Development environment

 To set up your development environment, you will need to install the following:

-1. Node.js 22 or later (required by pnpm 11)
-2. [pnpm](https://pnpm.io/installation) 11 or later (or run via `corepack enable`,
-   which uses the `packageManager` field in `package.json`)
-3. Rust's package manager, Cargo. Use [rustup](https://rustup.rs/) to install.
-4. [protoc](https://grpc.io/docs/protoc-installation/) (Protocol Buffers compiler)
+1. Node.js 14 or later
+2. Rust's package manager, Cargo. Use [rustup](https://rustup.rs/) to install.
+3. [protoc](https://grpc.io/docs/protoc-installation/) (Protocol Buffers compiler)

 Initial setup:

 ```shell
-pnpm install
+npm install
 ```

 ### Commit Hooks
@@ -41,38 +39,38 @@ pre-commit install

 ## Development

-Most common development commands can be run using the pnpm scripts.
+Most common development commands can be run using the npm scripts.

 Build the package

 ```shell
-pnpm install
-pnpm build
+npm install
+npm run build
 ```

 Lint:

 ```shell
-pnpm lint
+npm run lint
 ```

 Format and fix lints:

 ```shell
-pnpm lint-fix
+npm run lint-fix
 ```

 Run tests:

 ```shell
-pnpm test
+npm test
 ```

 To run a single test:

 ```shell
 # Single file: table.test.ts
-pnpm test -- table.test.ts
+npm test -- table.test.ts
 # Single test: 'merge insert' in table.test.ts
-pnpm test -- table.test.ts --testNamePattern=merge\ insert
+npm test -- table.test.ts --testNamePattern=merge\ insert
 ```
--- a/nodejs/Cargo.toml
+++ b/nodejs/Cargo.toml
@@ -1,8 +1,7 @@
 [package]
 name = "lancedb-nodejs"
 edition.workspace = true
-version = "0.28.0-beta.11"
-publish = false
+version = "0.28.0-beta.5"
 license.workspace = true
 description.workspace = true
 repository.workspace = true
@@ -16,13 +15,12 @@ crate-type = ["cdylib"]
 async-trait.workspace = true
 arrow-ipc.workspace = true
 arrow-array.workspace = true
-arrow-buffer = "58.0.0"
+arrow-buffer = "57.2"
 half.workspace = true
 arrow-schema.workspace = true
 env_logger.workspace = true
 futures.workspace = true
 lancedb = { path = "../rust/lancedb", default-features = false }
-lance-namespace.workspace = true
 napi = { version = "3.8.3", default-features = false, features = [
    "napi9",
    "async"
@@ -33,8 +31,8 @@ lzma-sys = { version = "0.1", features = ["static"] }
 log.workspace = true

 # Pin to resolve build failures; update periodically for security patches.
-aws-lc-sys = "=0.40.0"
-aws-lc-rs = "=1.16.3"
+aws-lc-sys = "=0.38.0"
+aws-lc-rs = "=1.16.1"

 [build-dependencies]
 napi-build = "2.3.1"
--- a/nodejs/README.md
+++ b/nodejs/README.md
@@ -30,7 +30,7 @@ const results = await table.vectorSearch([0.1, 0.3]).limit(20).toArray();
 console.log(results);
 ```

-The [quickstart](https://docs.lancedb.com/quickstart/) contains more complete examples.
+The [quickstart](https://lancedb.com/docs/quickstart/basic-usage/) contains more complete examples.

 ## Development

--- a/nodejs/test/connection.test.ts
+++ b/nodejs/test/connection.test.ts
@@ -4,7 +4,7 @@
 import { readdirSync } from "fs";
 import { Field, Float64, Schema } from "apache-arrow";
 import * as tmp from "tmp";
-import { Connection, Table, connect, connectNamespace } from "../lancedb";
+import { Connection, Table, connect } from "../lancedb";
 import { LocalTable } from "../lancedb/table";

 describe("when connecting", () => {
@@ -81,16 +81,6 @@ describe("given a connection", () => {
    await db.createTable("test4", [{ id: 1 }, { id: 2 }]);
  });

-  it("should expose renameTable and reject on OSS listing DB", async () => {
-    await db.createTable("old_name", [{ id: 1 }]);
-
-    await expect(db.renameTable("old_name", "new_name")).rejects.toThrow(
-      "rename_table is not supported in LanceDB OSS",
-    );
-
-    await expect(db.tableNames()).resolves.toEqual(["old_name"]);
-  });
-
  it("should fail if creating table twice, unless overwrite is true", async () => {
    let tbl = await db.createTable("test", [{ id: 1 }, { id: 2 }]);
    await expect(tbl.countRows()).resolves.toBe(2);
@@ -316,186 +306,3 @@ describe("clone table functionality", () => {
    ).rejects.toThrow("Deep clone is not yet implemented");
  });
 });
-
-describe("namespaces", () => {
-  let tmpDir: tmp.DirResult;
-  let db: Connection;
-
-  beforeEach(async () => {
-    tmpDir = tmp.dirSync({ unsafeCleanup: true });
-    // The local DirectoryNamespace backend only supports child namespaces
-    // when manifest mode is enabled (see lance-namespace-impls/src/dir.rs).
-    db = await connect(tmpDir.name, {
-      // biome-ignore lint/style/useNamingConvention: opaque backend property key, must match Rust
-      namespaceClientProperties: { manifest_enabled: "true" },
-    });
-  });
-  afterEach(() => tmpDir.removeCallback());
-
-  it("should create and describe a namespace", async () => {
-    await db.createNamespace(["myns"]);
-    const desc = await db.describeNamespace(["myns"]);
-    expect(desc).toBeDefined();
-  });
-
-  it("should list namespaces created at the root", async () => {
-    await db.createNamespace(["alpha"]);
-    await db.createNamespace(["beta"]);
-    const list = await db.listNamespaces();
-    expect(list.namespaces).toEqual(expect.arrayContaining(["alpha", "beta"]));
-  });
-
-  it("should list child namespaces under a parent", async () => {
-    await db.createNamespace(["parent"]);
-    await db.createNamespace(["parent", "child"]);
-    const list = await db.listNamespaces(["parent"]);
-    expect(list.namespaces).toContain("child");
-  });
-
-  it("should drop a namespace", async () => {
-    await db.createNamespace(["ephemeral"]);
-    await db.dropNamespace(["ephemeral"]);
-    const list = await db.listNamespaces();
-    expect(list.namespaces).not.toContain("ephemeral");
-  });
-
-  it("should raise an error on any namespace op after close", async () => {
-    await db.close();
-    await expect(db.describeNamespace(["foo"])).rejects.toThrow(
-      "Connection is closed",
-    );
-    await expect(db.listNamespaces()).rejects.toThrow("Connection is closed");
-    await expect(db.createNamespace(["foo"])).rejects.toThrow(
-      "Connection is closed",
-    );
-    await expect(db.dropNamespace(["foo"])).rejects.toThrow(
-      "Connection is closed",
-    );
-  });
-
-  it("should raise an understandable error when describing a non-existent namespace", async () => {
-    await expect(db.describeNamespace(["does-not-exist"])).rejects.toThrow(
-      /not found/i,
-    );
-  });
-
-  it("should raise an error when creating a namespace that already exists", async () => {
-    await db.createNamespace(["dup"]);
-    await expect(db.createNamespace(["dup"])).rejects.toThrow();
-  });
-
-  it("should reject an unrecognized createNamespace mode with a clear error", async () => {
-    await expect(
-      // biome-ignore lint/suspicious/noExplicitAny: deliberately bypass TS to test runtime validation
-      db.createNamespace(["x"], { mode: "frobnicate" as any }),
-    ).rejects.toThrow(/Invalid mode 'frobnicate'/);
-  });
-
-  it("should reject an unrecognized dropNamespace mode with a clear error", async () => {
-    await db.createNamespace(["x"]);
-    await expect(
-      // biome-ignore lint/suspicious/noExplicitAny: deliberately bypass TS to test runtime validation
-      db.dropNamespace(["x"], { mode: "frobnicate" as any }),
-    ).rejects.toThrow(/Invalid mode 'frobnicate'/);
-  });
-
-  it("should reject an unrecognized dropNamespace behavior with a clear error", async () => {
-    await db.createNamespace(["x"]);
-    await expect(
-      // biome-ignore lint/suspicious/noExplicitAny: deliberately bypass TS to test runtime validation
-      db.dropNamespace(["x"], { behavior: "frobnicate" as any }),
-    ).rejects.toThrow(/Invalid behavior 'frobnicate'/);
-  });
-});
-
-describe("connectNamespace", () => {
-  let tmpDir: tmp.DirResult;
-  beforeEach(() => {
-    tmpDir = tmp.dirSync({ unsafeCleanup: true });
-  });
-  afterEach(() => tmpDir.removeCallback());
-
-  it("connects via the dir implementation and supports table ops", async () => {
-    const db = await connectNamespace("dir", { root: tmpDir.name });
-    await db.createTable("users", [{ id: 1 }, { id: 2 }]);
-    await expect(db.tableNames()).resolves.toContain("users");
-  });
-
-  it("throws a clear error when implName is empty", async () => {
-    await expect(connectNamespace("", {})).rejects.toThrow(
-      "implName must be a non-empty string",
-    );
-  });
-
-  it("throws when the namespace implementation is unknown", async () => {
-    await expect(connectNamespace("not-a-real-impl", {})).rejects.toThrow();
-  });
-
-  it("passes storage options through to the namespace", async () => {
-    const db = await connectNamespace(
-      "dir",
-      { root: tmpDir.name },
-      { storageOptions: { newTableDataStorageVersion: "stable" } },
-    );
-    await db.createTable("plumbing", [{ id: 1 }]);
-    await expect(db.tableNames()).resolves.toContain("plumbing");
-  });
-
-  it("supports child namespaces when manifestEnabled is true on the dir config", async () => {
-    const writer = await connectNamespace("dir", {
-      root: tmpDir.name,
-      manifestEnabled: true,
-    });
-    await writer.createNamespace(["analytics"]);
-    await writer.createTable("orders", [{ id: 1 }, { id: 2 }], ["analytics"]);
-    await writer.close();
-
-    const reader = await connectNamespace("dir", {
-      root: tmpDir.name,
-      manifestEnabled: true,
-    });
-    await expect(reader.tableNames(["analytics"])).resolves.toContain("orders");
-    const orders = await reader.openTable("orders", ["analytics"]);
-    await expect(orders.countRows()).resolves.toBe(2);
-  });
-
-  it("merges extraProperties into the dir config and is overridden by typed fields", async () => {
-    // Two observable assertions:
-    // - Typed `root` overrides extraProperties.root: createTable would fail
-    //   under the bogus path if the override didn't happen.
-    // - extraProperties.manifest_enabled="false" is honored end-to-end. Child
-    //   namespaces require manifest mode (default true), so explicitly
-    //   disabling it via extraProperties must make createNamespace reject. If
-    //   extraProperties pass-through were silently broken, the default would
-    //   let createNamespace succeed.
-    const db = await connectNamespace("dir", {
-      root: tmpDir.name,
-      extraProperties: {
-        root: "/should/be/overridden",
-        // biome-ignore lint/style/useNamingConvention: backend property key
-        manifest_enabled: "false",
-      },
-    });
-    await db.createTable("base", [{ id: 1 }]);
-    await expect(db.tableNames()).resolves.toContain("base");
-    await expect(db.createNamespace(["analytics"])).rejects.toThrow();
-  });
-
-  it("flows unknown top-level keys through when implName is dynamic (no silent drop)", async () => {
-    // Routes via the third overload because `impl` is `string`, not the
-    // literal `"dir"`. The dispatcher still notices the runtime value is
-    // "dir", but unknown keys like `manifest_enabled` must not be silently
-    // dropped during the conversion.
-    //
-    // Asserting a *negative* outcome (manifest disabled -> createNamespace
-    // rejects) is required for observability, since the backend default for
-    // `manifest_enabled` is true.
-    const impl: string = "dir";
-    const db = await connectNamespace(impl, {
-      root: tmpDir.name,
-      // biome-ignore lint/style/useNamingConvention: backend property key
-      manifest_enabled: "false",
-    });
-    await expect(db.createNamespace(["mixed"])).rejects.toThrow();
-  });
-});
--- a/nodejs/test/rerankers.test.ts
+++ b/nodejs/test/rerankers.test.ts
@@ -1,8 +1,6 @@
 // SPDX-License-Identifier: Apache-2.0
 // SPDX-FileCopyrightText: Copyright The LanceDB Authors

-import { spawn } from "node:child_process";
-import * as path from "node:path";
 import { RecordBatch } from "apache-arrow";
 import * as tmp from "tmp";
 import { Connection, Index, Table, connect, makeArrowTable } from "../lancedb";
@@ -78,91 +76,4 @@ describe("rerankers", function () {

    expect(result).toHaveLength(2);
  });
-
-  it("does not keep process alive after rerank query", async function () {
-    const script = `
-import * as lancedb from "./dist/index.js";
-import * as os from "node:os";
-import * as path from "node:path";
-import * as fs from "node:fs/promises";
-
-const dir = await fs.mkdtemp(path.join(os.tmpdir(), "lancedb-rerank-exit-"));
-const db = await lancedb.connect(dir);
-const table = await db.createTable("test", [{ text: "hello", vector: [1, 2, 3] }], {
-  mode: "overwrite",
-});
-await table.createIndex("text", { config: lancedb.Index.fts() });
-await table.waitForIndex(["text_idx"], 30);
-
-const reranker = await lancedb.rerankers.RRFReranker.create();
-await table
-  .query()
-  .nearestTo([1, 2, 3])
-  .fullTextSearch("hello")
-  .rerank(reranker)
-  .toArray();
-
-table.close();
-db.close();
-`;
-
-    await new Promise<void>((resolve, reject) => {
-      const child = spawn(
-        process.execPath,
-        ["--input-type=module", "-e", script],
-        {
-          cwd: path.resolve(__dirname, ".."),
-          stdio: ["ignore", "pipe", "pipe"],
-        },
-      );
-
-      let stdout = "";
-      let stderr = "";
-
-      child.stdout.on("data", (chunk) => {
-        stdout += chunk.toString();
-      });
-
-      child.stderr.on("data", (chunk) => {
-        stderr += chunk.toString();
-      });
-
-      const timeout = setTimeout(() => {
-        child.kill();
-        reject(
-          new Error(
-            `child process did not exit in time\nstdout:\n${stdout}\nstderr:\n${stderr}`,
-          ),
-        );
-      }, 20_000);
-
-      child.on("error", (err) => {
-        clearTimeout(timeout);
-        reject(err);
-      });
-
-      child.on("exit", (code, signal) => {
-        clearTimeout(timeout);
-        if (signal !== null) {
-          reject(
-            new Error(
-              `child process exited with signal ${signal}\nstdout:\n${stdout}\nstderr:\n${stderr}`,
-            ),
-          );
-          return;
-        }
-
-        if (code !== 0) {
-          reject(
-            new Error(
-              `child process exited with code ${code}\nstdout:\n${stdout}\nstderr:\n${stderr}`,
-            ),
-          );
-          return;
-        }
-
-        resolve();
-      });
-    });
-  });
 });
--- a/nodejs/test/scannable.test.ts
+++ b/nodejs/test/scannable.test.ts
@@ -1,438 +0,0 @@
-// SPDX-License-Identifier: Apache-2.0
-// SPDX-FileCopyrightText: Copyright The LanceDB Authors
-
-import {
-  Field,
-  Float16,
-  Int32,
-  type RecordBatch,
-  RecordBatchReader,
-  Schema,
-  tableToIPC,
-} from "apache-arrow";
-import { makeArrowTable, makeEmptyTable } from "../lancedb/arrow";
-import { Scannable } from "../lancedb/scannable";
-
-function makeTable() {
-  return makeArrowTable(
-    [
-      { id: 1, name: "a" },
-      { id: 2, name: "b" },
-      { id: 3, name: "c" },
-    ],
-    { vectorColumns: {} },
-  );
-}
-
-async function makeReader(): Promise<RecordBatchReader> {
-  // `RecordBatchReader.from()` returns an unopened reader; `.schema` is only
-  // populated after `.open()`. Opening sync readers is synchronous.
-  const reader = RecordBatchReader.from(tableToIPC(makeTable()));
-  return reader.open() as RecordBatchReader;
-}
-
-describe("Scannable", () => {
-  describe("fromTable", () => {
-    test("reflects schema, numRows, and defaults rescannable=true", async () => {
-      const table = makeTable();
-      const scannable = await Scannable.fromTable(table);
-
-      expect(scannable.schema).toBe(table.schema);
-      expect(scannable.numRows).toBe(table.numRows);
-      expect(scannable.rescannable).toBe(true);
-    });
-
-    test("throws when opts.numRows does not match table.numRows", async () => {
-      await expect(
-        Scannable.fromTable(makeTable(), { numRows: 42 }),
-      ).rejects.toThrow(/does not match table\.numRows/);
-    });
-
-    test("throws when opts.rescannable is false", async () => {
-      await expect(
-        Scannable.fromTable(makeTable(), { rescannable: false }),
-      ).rejects.toThrow(/always rescannable/);
-    });
-  });
-
-  describe("fromRecordBatchReader", () => {
-    test("reflects schema and defaults numRows=null, rescannable=false", async () => {
-      const reader = await makeReader();
-      const scannable = await Scannable.fromRecordBatchReader(reader);
-
-      expect(scannable.schema).toBe(reader.schema);
-      expect(scannable.numRows).toBeNull();
-      expect(scannable.rescannable).toBe(false);
-    });
-
-    test("honors numRows override", async () => {
-      const scannable = await Scannable.fromRecordBatchReader(
-        await makeReader(),
-        { numRows: 3 },
-      );
-
-      expect(scannable.numRows).toBe(3);
-      expect(scannable.rescannable).toBe(false);
-    });
-
-    test("rescannable: false explicit does not throw", async () => {
-      const reader = await makeReader();
-      const scannable = await Scannable.fromRecordBatchReader(reader, {
-        rescannable: false,
-      });
-      expect(scannable.rescannable).toBe(false);
-    });
-
-    test("throws when opts.rescannable is true", async () => {
-      const reader = await makeReader();
-      await expect(
-        Scannable.fromRecordBatchReader(reader, { rescannable: true }),
-      ).rejects.toThrow(/does not accept rescannable/);
-    });
-
-    test("throws when opts.rescannable is true even alongside numRows", async () => {
-      const reader = await makeReader();
-      await expect(
-        Scannable.fromRecordBatchReader(reader, {
-          numRows: 3,
-          rescannable: true,
-        }),
-      ).rejects.toThrow(/does not accept rescannable/);
-    });
-  });
-
-  describe("fromIterable", () => {
-    test("accepts a sync iterable of batches", async () => {
-      const table = makeTable();
-      const scannable = await Scannable.fromIterable(
-        table.schema,
-        table.batches,
-      );
-
-      expect(scannable.schema).toBe(table.schema);
-      expect(scannable.numRows).toBeNull();
-      expect(scannable.rescannable).toBe(false);
-    });
-
-    test("accepts an async iterable of batches", async () => {
-      const table = makeTable();
-      async function* generator(): AsyncGenerator<RecordBatch> {
-        for (const batch of table.batches) {
-          yield batch;
-        }
-      }
-
-      const scannable = await Scannable.fromIterable(table.schema, generator());
-      expect(scannable.schema).toBe(table.schema);
-      expect(scannable.rescannable).toBe(false);
-    });
-
-    describe("rescannable: true detection", () => {
-      // Replayable inputs: [Symbol.iterator]() / [Symbol.asyncIterator]()
-      // returns a fresh iterator each call. Must NOT throw.
-
-      test("Array passes (fresh ArrayIterator each call)", async () => {
-        const table = makeTable();
-        const scannable = await Scannable.fromIterable(
-          table.schema,
-          table.batches,
-          { rescannable: true },
-        );
-        expect(scannable.rescannable).toBe(true);
-      });
-
-      test("Set passes (fresh SetIterator each call)", async () => {
-        const table = makeTable();
-        const set = new Set<RecordBatch>(table.batches);
-        const scannable = await Scannable.fromIterable(table.schema, set, {
-          rescannable: true,
-        });
-        expect(scannable.rescannable).toBe(true);
-      });
-
-      test("custom Iterable returning a fresh iterator passes", async () => {
-        const table = makeTable();
-        const replayable: Iterable<RecordBatch> = {
-          [Symbol.iterator]() {
-            return table.batches[Symbol.iterator]();
-          },
-        };
-        const scannable = await Scannable.fromIterable(
-          table.schema,
-          replayable,
-          { rescannable: true },
-        );
-        expect(scannable.rescannable).toBe(true);
-      });
-
-      test("object with generator method passes (fresh generator each call)", async () => {
-        const table = makeTable();
-        const replayable: Iterable<RecordBatch> = {
-          *[Symbol.iterator]() {
-            for (const batch of table.batches) yield batch;
-          },
-        };
-        const scannable = await Scannable.fromIterable(
-          table.schema,
-          replayable,
-          { rescannable: true },
-        );
-        expect(scannable.rescannable).toBe(true);
-      });
-
-      test("empty Array passes (replayable degenerate case)", async () => {
-        const schema = makeTable().schema;
-        const scannable = await Scannable.fromIterable(
-          schema,
-          [] as RecordBatch[],
-          { rescannable: true },
-        );
-        expect(scannable.rescannable).toBe(true);
-      });
-
-      // One-shot inputs: [Symbol.iterator]() / [Symbol.asyncIterator]()
-      // returns the same object, or the input is already-an-iterator.
-      // Must throw with a /one-shot/ message.
-
-      test("sync generator throws", async () => {
-        const table = makeTable();
-        function* generator(): Generator<RecordBatch> {
-          for (const batch of table.batches) yield batch;
-        }
-        await expect(
-          Scannable.fromIterable(table.schema, generator(), {
-            rescannable: true,
-          }),
-        ).rejects.toThrow(/one-shot/);
-      });
-
-      test("async generator throws", async () => {
-        const table = makeTable();
-        async function* generator(): AsyncGenerator<RecordBatch> {
-          for (const batch of table.batches) yield batch;
-        }
-        await expect(
-          Scannable.fromIterable(table.schema, generator(), {
-            rescannable: true,
-          }),
-        ).rejects.toThrow(/one-shot/);
-      });
-
-      test("empty generator throws (one-shot degenerate case)", async () => {
-        const schema = makeTable().schema;
-        function* generator(): Generator<RecordBatch> {
-          // intentionally empty; yields nothing.
-        }
-        await expect(
-          Scannable.fromIterable(schema, generator(), { rescannable: true }),
-        ).rejects.toThrow(/one-shot/);
-      });
-
-      test("custom self-iterator throws", async () => {
-        const table = makeTable();
-        const batches = table.batches;
-        let i = 0;
-        const oneShot: Iterable<RecordBatch> & Iterator<RecordBatch> = {
-          [Symbol.iterator]() {
-            return this;
-          },
-          next() {
-            if (i >= batches.length) {
-              return { done: true, value: undefined };
-            }
-            return { done: false, value: batches[i++] };
-          },
-        };
-        await expect(
-          Scannable.fromIterable(table.schema, oneShot, { rescannable: true }),
-        ).rejects.toThrow(/one-shot/);
-      });
-
-      test("Array.values() (IterableIterator) throws", async () => {
-        const table = makeTable();
-        const iter = table.batches.values();
-        await expect(
-          Scannable.fromIterable(table.schema, iter, { rescannable: true }),
-        ).rejects.toThrow(/one-shot/);
-      });
-
-      test("raw iterator (only `.next`) throws", async () => {
-        const table = makeTable();
-        const batches = table.batches;
-        let i = 0;
-        const rawIter = {
-          next(): IteratorResult<RecordBatch> {
-            if (i >= batches.length) {
-              return { done: true, value: undefined };
-            }
-            return { done: false, value: batches[i++] };
-          },
-        };
-        await expect(
-          Scannable.fromIterable(
-            table.schema,
-            rawIter as unknown as Iterable<RecordBatch>,
-            { rescannable: true },
-          ),
-        ).rejects.toThrow(/one-shot/);
-      });
-
-      // Edge: null/undefined must not crash the detection helper. The
-      // null check belongs to `normalizeIterator` and only fires when a
-      // scan starts.
-
-      test("null input does not crash detection at construction", async () => {
-        const schema = makeTable().schema;
-        await expect(
-          Scannable.fromIterable(
-            schema,
-            null as unknown as Iterable<RecordBatch>,
-            {
-              rescannable: true,
-            },
-          ),
-        ).resolves.toBeDefined();
-      });
-
-      test("undefined input does not crash detection at construction", async () => {
-        const schema = makeTable().schema;
-        await expect(
-          Scannable.fromIterable(
-            schema,
-            undefined as unknown as Iterable<RecordBatch>,
-            { rescannable: true },
-          ),
-        ).resolves.toBeDefined();
-      });
-
-      // Default (rescannable omitted) skips the check entirely, so even
-      // pathological inputs construct without throwing here.
-
-      test("rescannable omitted skips detection entirely (generator passes)", async () => {
-        const table = makeTable();
-        function* generator(): Generator<RecordBatch> {
-          for (const batch of table.batches) yield batch;
-        }
-        const scannable = await Scannable.fromIterable(
-          table.schema,
-          generator(),
-        );
-        expect(scannable.rescannable).toBe(false);
-      });
-
-      test("rescannable: false explicit skips detection entirely (generator passes)", async () => {
-        const table = makeTable();
-        function* generator(): Generator<RecordBatch> {
-          for (const batch of table.batches) yield batch;
-        }
-        const scannable = await Scannable.fromIterable(
-          table.schema,
-          generator(),
-          { rescannable: false },
-        );
-        expect(scannable.rescannable).toBe(false);
-      });
-    });
-  });
-
-  describe("fromFactory", () => {
-    test("defaults rescannable=true and does not invoke the factory eagerly", async () => {
-      const table = makeTable();
-      const factory = jest.fn(() => table.batches);
-
-      const scannable = await Scannable.fromFactory(table.schema, factory);
-
-      expect(scannable.schema).toBe(table.schema);
-      expect(scannable.rescannable).toBe(true);
-      expect(factory).not.toHaveBeenCalled();
-    });
-
-    test("honors rescannable and numRows overrides", async () => {
-      const table = makeTable();
-      const scannable = await Scannable.fromFactory(
-        table.schema,
-        () => table.batches,
-        { numRows: 7, rescannable: false },
-      );
-
-      expect(scannable.numRows).toBe(7);
-      expect(scannable.rescannable).toBe(false);
-    });
-  });
-
-  describe("validation", () => {
-    test("throws when numRows is negative", async () => {
-      await expect(
-        Scannable.fromFactory(makeTable().schema, () => [], { numRows: -1 }),
-      ).rejects.toThrow(/non-negative/);
-    });
-
-    test("throws when numRows is not an integer", async () => {
-      await expect(
-        Scannable.fromFactory(makeTable().schema, () => [], { numRows: 3.5 }),
-      ).rejects.toThrow(/integer/);
-    });
-  });
-
-  describe("native handle", () => {
-    test("exposes a native handle via inner", async () => {
-      const scannable = await Scannable.fromTable(makeTable());
-      expect(scannable.inner).toBeDefined();
-      expect(typeof scannable.inner).toBe("object");
-      expect(scannable.inner).not.toBeNull();
-    });
-  });
-
-  // Schema-variety construction tests. Each asserts that construction
-  // succeeds against a richer Arrow schema, which transitively exercises
-  // schema serialization and the Rust-side `ipc_file_to_schema` for types
-  // beyond flat primitives.
-  describe("schema variety", () => {
-    test("accepts an empty table", async () => {
-      const schema = new Schema([new Field("id", new Int32(), true)]);
-      const table = makeEmptyTable(schema);
-      const scannable = await Scannable.fromTable(table);
-
-      expect(scannable.numRows).toBe(0);
-      expect(scannable.schema).toBe(table.schema);
-    });
-
-    test("accepts nested struct and list columns", async () => {
-      const table = makeArrowTable(
-        [
-          { id: 1, point: { x: 0, y: 0 }, tags: ["a", "b"] },
-          { id: 2, point: { x: 1, y: 2 }, tags: ["c"] },
-        ],
-        { vectorColumns: {} },
-      );
-      const scannable = await Scannable.fromTable(table);
-
-      expect(scannable.schema).toBe(table.schema);
-      expect(scannable.numRows).toBe(2);
-    });
-
-    test("accepts a FixedSizeList (vector) column", async () => {
-      const table = makeArrowTable(
-        [
-          { id: 1, vec: [1, 2, 3] },
-          { id: 2, vec: [4, 5, 6] },
-        ],
-        { vectorColumns: { vec: { type: new Float16() } } },
-      );
-      const scannable = await Scannable.fromTable(table);
-
-      expect(scannable.schema).toBe(table.schema);
-      expect(scannable.numRows).toBe(2);
-    });
-
-    test("accepts a table with many columns", async () => {
-      const row: Record<string, number> = {};
-      for (let i = 0; i < 50; i++) row[`c${i}`] = i;
-      const table = makeArrowTable([row, row], { vectorColumns: {} });
-      const scannable = await Scannable.fromTable(table);
-
-      expect(scannable.schema.fields.length).toBe(50);
-      expect(scannable.numRows).toBe(2);
-    });
-  });
-});
--- a/nodejs/test/table.test.ts
+++ b/nodejs/test/table.test.ts
@@ -1870,25 +1870,6 @@ describe.each([arrow15, arrow16, arrow17, arrow18])(
      expect(results.length).toBe(3);
    });

-    test("prewarmData errors on local tables", async () => {
-      const db = await connect(tmpDir.name);
-      const data = [
-        { text: "alpha", vector: [0.1, 0.2, 0.3] },
-        { text: "beta", vector: [0.4, 0.5, 0.6] },
-      ];
-      const table = await db.createTable("prewarm_data_test", data);
-
-      // prewarmData is only supported on remote tables. We verify the call
-      // is wired through napi and surfaces the expected error for both
-      // arg shapes (undefined and string[]).
-      await expect(table.prewarmData()).rejects.toThrow(
-        "prewarm_data is currently only supported on remote tables",
-      );
-      await expect(table.prewarmData(["text"])).rejects.toThrow(
-        "prewarm_data is currently only supported on remote tables",
-      );
-    });
-
    test("full text index on list", async () => {
      const db = await connect(tmpDir.name);
      const data = [
--- a/nodejs/examples/package-lock.json
+++ b/nodejs/examples/package-lock.json
--- a/nodejs/examples/package.json
+++ b/nodejs/examples/package.json
@@ -11,17 +11,16 @@
    "test": "node --experimental-vm-modules node_modules/.bin/jest --testEnvironment jest-environment-node-single-context --verbose",
    "lint": "biome check *.ts && biome format *.ts",
    "lint-ci": "biome ci .",
-    "lint-fix": "biome check --write *.ts && pnpm format",
+    "lint-fix": "biome check --write *.ts && npm run format",
    "format": "biome format --write *.ts"
  },
  "author": "Lance Devs",
  "license": "Apache-2.0",
-  "packageManager": "pnpm@11.1.1",
  "dependencies": {
-    "@huggingface/transformers": "3.0.2",
+    "@huggingface/transformers": "^3.0.2",
    "@lancedb/lancedb": "file:../dist",
-    "openai": "4.29.2",
-    "sharp": "0.33.5"
+    "openai": "^4.29.2",
+    "sharp": "^0.33.5"
  },
  "devDependencies": {
    "@biomejs/biome": "^1.7.3",
--- a/nodejs/examples/pnpm-lock.yaml
+++ b/nodejs/examples/pnpm-lock.yaml
--- a/nodejs/examples/pnpm-workspace.yaml
+++ b/nodejs/examples/pnpm-workspace.yaml
@@ -1,13 +0,0 @@
-# Block resolution of versions less than 24h old (Shai-Hulud window).
-# This is the pnpm 11 default but pinned here so it's visible to
-# reviewers and survives a future pnpm major flipping the default.
-minimumReleaseAge: 1440
-
-# Fail install if a transitive dep tries to run an unapproved script.
-strictDepBuilds: true
-
-allowBuilds:
-  '@biomejs/biome': true
-  onnxruntime-node: true
-  protobufjs: true
-  sharp: true
--- a/nodejs/lancedb/arrow.ts
+++ b/nodejs/lancedb/arrow.ts
@@ -1291,18 +1291,6 @@ export async function fromRecordBatchToBuffer(
  return Buffer.from(await writer.toUint8Array());
 }

-/**
- * Create a buffer containing a single record batch using the Arrow IPC Stream
- * serialization. Each call produces a self-contained Stream message (schema +
- * batch + EOS) suitable for incremental decode by `arrow_ipc::reader::StreamReader`.
- */
-export async function fromRecordBatchToStreamBuffer(
-  batch: RecordBatch,
-): Promise<Buffer> {
-  const writer = RecordBatchStreamWriter.writeAll([batch]);
-  return Buffer.from(await writer.toUint8Array());
-}
-
 /**
 * Serialize an Arrow Table into a buffer using the Arrow IPC Stream serialization
 *
--- a/nodejs/lancedb/connection.ts
+++ b/nodejs/lancedb/connection.ts
@@ -16,18 +16,6 @@ import {
 } from "./arrow";
 import { EmbeddingFunctionConfig, getRegistry } from "./embedding/registry";
 import { Connection as LanceDbConnection } from "./native";
-import type {
-  CreateNamespaceResponse,
-  DescribeNamespaceResponse,
-  DropNamespaceResponse,
-  ListNamespacesResponse,
-} from "./native";
-export type {
-  CreateNamespaceResponse,
-  DescribeNamespaceResponse,
-  DropNamespaceResponse,
-  ListNamespacesResponse,
-};
 import { sanitizeTable } from "./sanitize";
 import { LocalTable, Table } from "./table";

@@ -54,7 +42,7 @@ export interface CreateTableOptions {
   * Options already set on the connection will be inherited by the table,
   * but can be overridden here.
   *
-   * The available options are described at https://docs.lancedb.com/storage/
+   * The available options are described at https://lancedb.com/docs/storage/
   */
  storageOptions?: Record<string, string>;

@@ -90,7 +78,7 @@ export interface OpenTableOptions {
   * Options already set on the connection will be inherited by the table,
   * but can be overridden here.
   *
-   * The available options are described at https://docs.lancedb.com/storage/
+   * The available options are described at https://lancedb.com/docs/storage/
   */
  storageOptions?: Record<string, string>;
  /**
@@ -122,28 +110,6 @@ export interface TableNamesOptions {
  /** An optional limit to the number of results to return. */
  limit?: number;
 }
-
-export interface ListNamespacesOptions {
-  /** Token from a previous response for pagination. */
-  pageToken?: string;
-  /** An optional limit to the number of results to return. */
-  limit?: number;
-}
-
-export interface CreateNamespaceOptions {
-  /** Creation mode. */
-  mode?: "create" | "exist_ok" | "overwrite";
-  /** Properties to set on the new namespace. */
-  properties?: Record<string, string>;
-}
-
-export interface DropNamespaceOptions {
-  /** Whether to skip if the namespace doesn't exist, or fail. */
-  mode?: "skip" | "fail";
-  /** Refuse to drop if non-empty (restrict) or drop recursively (cascade). */
-  behavior?: "restrict" | "cascade";
-}
-
 /**
 * A LanceDB Connection that allows you to open tables and create new ones.
 *
@@ -296,81 +262,12 @@ export abstract class Connection {
   */
  abstract dropTable(name: string, namespacePath?: string[]): Promise<void>;

-  abstract renameTable(
-    oldName: string,
-    newName: string,
-    namespacePath?: string[],
-  ): Promise<void>;
-
  /**
   * Drop all tables in the database.
   * @param {string[]} namespacePath The namespace path to drop tables from (defaults to root namespace).
   */
  abstract dropAllTables(namespacePath?: string[]): Promise<void>;

-  /**
-   * Describe a namespace, returning its properties.
-   *
-   * @param {string[]} namespacePath - The namespace path to describe, in
-   *   parent → child order, e.g. `["analytics", "sales"]`.
-   * @returns {Promise<DescribeNamespaceResponse>} The namespace's properties
-   *   (may be undefined if the namespace has none).
-   */
-  abstract describeNamespace(
-    namespacePath: string[],
-  ): Promise<DescribeNamespaceResponse>;
-
-  /**
-   * List the immediate child namespaces under the given parent.
-   *
-   * Results may be paginated. To retrieve subsequent pages, pass the
-   * `pageToken` returned by a previous call.
-   *
-   * @param {string[]} namespacePath - The parent namespace path. Defaults
-   *   to the root namespace if omitted.
-   * @param {Partial<ListNamespacesOptions>} options - Pagination options
-   *   (`pageToken`, `limit`).
-   * @returns {Promise<ListNamespacesResponse>} Child namespace names and
-   *   an optional token for fetching the next page.
-   */
-  abstract listNamespaces(
-    namespacePath?: string[],
-    options?: Partial<ListNamespacesOptions>,
-  ): Promise<ListNamespacesResponse>;
-
-  /**
-   * Create a new namespace at the given path.
-   *
-   * @param {string[]} namespacePath - The namespace path to create.
-   * @param {Partial<CreateNamespaceOptions>} options - Creation `mode`
-   *   ("create" | "exist_ok" | "overwrite") and optional `properties`
-   *   to attach to the namespace.
-   * @returns {Promise<CreateNamespaceResponse>} The properties of the
-   *   created namespace and an optional transaction id.
-   */
-  abstract createNamespace(
-    namespacePath: string[],
-    options?: Partial<CreateNamespaceOptions>,
-  ): Promise<CreateNamespaceResponse>;
-
-  /**
-   * Drop a namespace.
-   *
-   * Use `behavior: "cascade"` to also drop everything contained in the
-   * namespace (sub-namespaces and tables). The default `"restrict"`
-   * behavior refuses to drop a non-empty namespace.
-   *
-   * @param {string[]} namespacePath - The namespace path to drop.
-   * @param {Partial<DropNamespaceOptions>} options - `mode` ("skip" | "fail"
-   *   for missing-namespace handling) and `behavior` ("restrict" | "cascade").
-   * @returns {Promise<DropNamespaceResponse>} Any properties returned by
-   *   the server and an optional transaction id.
-   */
-  abstract dropNamespace(
-    namespacePath: string[],
-    options?: Partial<DropNamespaceOptions>,
-  ): Promise<DropNamespaceResponse>;
-
  /**
   * Clone a table from a source table.
   *
@@ -615,56 +512,9 @@ export class LocalConnection extends Connection {
    return this.inner.dropTable(name, namespacePath ?? []);
  }

-  async renameTable(
-    oldName: string,
-    newName: string,
-    namespacePath?: string[],
-  ): Promise<void> {
-    return this.inner.renameTable(oldName, newName, namespacePath ?? []);
-  }
-
  async dropAllTables(namespacePath?: string[]): Promise<void> {
    return this.inner.dropAllTables(namespacePath ?? []);
  }
-
-  describeNamespace(
-    namespacePath: string[],
-  ): Promise<DescribeNamespaceResponse> {
-    return this.inner.describeNamespace(namespacePath);
-  }
-
-  listNamespaces(
-    namespacePath?: string[],
-    options?: Partial<ListNamespacesOptions>,
-  ): Promise<ListNamespacesResponse> {
-    return this.inner.listNamespaces(
-      namespacePath ?? [],
-      options?.pageToken,
-      options?.limit,
-    );
-  }
-
-  createNamespace(
-    namespacePath: string[],
-    options?: Partial<CreateNamespaceOptions>,
-  ): Promise<CreateNamespaceResponse> {
-    return this.inner.createNamespace(
-      namespacePath,
-      options?.mode,
-      options?.properties,
-    );
-  }
-
-  dropNamespace(
-    namespacePath: string[],
-    options?: Partial<DropNamespaceOptions>,
-  ): Promise<DropNamespaceResponse> {
-    return this.inner.dropNamespace(
-      namespacePath,
-      options?.mode,
-      options?.behavior,
-    );
-  }
 }

 /**
--- a/nodejs/lancedb/index.ts
+++ b/nodejs/lancedb/index.ts
@@ -8,7 +8,6 @@ import {
 } from "./connection";

 import {
-  ConnectNamespaceOptions,
  ConnectionOptions,
  Connection as LanceDbConnection,
  JsHeaderProvider as NativeJsHeaderProvider,
@@ -23,7 +22,6 @@ export { JsHeaderProvider as NativeJsHeaderProvider } from "./native.js";
 export {
  AddColumnsSql,
  ConnectionOptions,
-  ConnectNamespaceOptions,
  IndexStatistics,
  IndexConfig,
  ClientConfig,
@@ -64,13 +62,6 @@ export {
  CreateTableOptions,
  TableNamesOptions,
  OpenTableOptions,
-  ListNamespacesOptions,
-  CreateNamespaceOptions,
-  DropNamespaceOptions,
-  ListNamespacesResponse,
-  CreateNamespaceResponse,
-  DropNamespaceResponse,
-  DescribeNamespaceResponse,
 } from "./connection";

 export { Session } from "./native.js";
@@ -126,7 +117,6 @@ export { MergeInsertBuilder, WriteExecutionOptions } from "./merge";

 export * as embedding from "./embedding";
 export { permutationBuilder, PermutationBuilder } from "./permutation";
-export { Scannable, ScannableOptions } from "./scannable";
 export * as rerankers from "./rerankers";
 export {
  SchemaLike,
@@ -303,197 +293,3 @@ export async function connect(
  );
  return new LocalConnection(nativeConn);
 }
-
-/**
- * Configuration for the built-in directory namespace (`"dir"`).
- *
- * The directory namespace stores tables under a single root path (local
- * filesystem or object storage URI). See
- * {@link https://docs.lancedb.com/namespaces} for the documented surface;
- * less-common knobs live under {@link DirNamespaceConfig.extraProperties}.
- */
-export interface DirNamespaceConfig {
-  /** Root path or URI containing the LanceDB tables. */
-  root: string;
-  /**
-   * Whether to maintain a namespace manifest at the root. Required for
-   * child namespaces. Defaults to true on the impl side.
-   */
-  manifestEnabled?: boolean;
-  /**
-   * Additional raw properties passed verbatim to the namespace
-   * implementation (e.g. `storage.*`, `credential_vendor.*`). Typed
-   * fields above take precedence on key collision.
-   */
-  extraProperties?: Record<string, string>;
-}
-
-/**
- * Configuration for the built-in REST namespace (`"rest"`).
- *
- * The REST namespace talks to a remote catalog server over HTTP. See
- * {@link https://docs.lancedb.com/namespaces} for the documented surface;
- * less-common knobs (TLS, metrics) live under
- * {@link RestNamespaceConfig.extraProperties}.
- */
-export interface RestNamespaceConfig {
-  /** Catalog endpoint URL. */
-  uri: string;
-  /**
-   * HTTP headers forwarded with each request. Keys are passed through
-   * as-is (e.g. `"x-api-key"`, `"Authorization"`).
-   */
-  headers?: Record<string, string>;
-  /**
-   * Additional raw properties passed verbatim to the namespace
-   * implementation (e.g. `tls.*`, `ops_metrics_enabled`, `delimiter`).
-   * Typed fields above take precedence on key collision.
-   */
-  extraProperties?: Record<string, string>;
-}
-
-function dirConfigToProperties(
-  config: DirNamespaceConfig,
-): Record<string, string> {
-  // Spread the whole input so that unknown keys (e.g. a raw `manifest_enabled`
-  // passed via the dynamic-impl path) flow through instead of being dropped.
-  // Typed transformations layer on top.
-  const { manifestEnabled, extraProperties, ...rest } = config;
-  const properties: Record<string, string> = {
-    ...(extraProperties ?? {}),
-    ...(rest as Record<string, string>),
-  };
-  if (manifestEnabled !== undefined) {
-    properties.manifest_enabled = String(manifestEnabled);
-  }
-  return properties;
-}
-
-function restConfigToProperties(
-  config: RestNamespaceConfig,
-): Record<string, string> {
-  const { headers, extraProperties, ...rest } = config;
-  const properties: Record<string, string> = {
-    ...(extraProperties ?? {}),
-    ...(rest as Record<string, string>),
-  };
-  if (headers) {
-    for (const [name, value] of Object.entries(headers)) {
-      properties[`headers.${name}`] = value;
-    }
-  }
-  return properties;
-}
-
-/**
- * Connect to a LanceDB database through a namespace.
- *
- * Unlike {@link connect}, which routes by URI scheme (local path vs.
- * `db://` cloud), `connectNamespace` always returns a namespace-backed
- * connection. The `implName` selects the namespace implementation:
- *
- * - `"dir"` — directory namespace, configured with {@link DirNamespaceConfig}.
- * - `"rest"` — remote REST catalog, configured with {@link RestNamespaceConfig}.
- * - Any other string — full module path for a custom implementation,
- *   configured with a free-form string-keyed `properties` map.
- *
- * @example Typed dir namespace
- * ```ts
- * const db = await connectNamespace("dir", { root: "/path/to/db" });
- * await db.createTable("users", [{ id: 1 }]);
- * ```
- *
- * @example Typed REST namespace with auth headers
- * ```ts
- * const db = await connectNamespace("rest", {
- *   uri: "https://catalog.example.com",
- *   headers: { "x-api-key": process.env.CATALOG_KEY ?? "" },
- * });
- * ```
- *
- * @example Custom implementation with raw properties
- * ```ts
- * const db = await connectNamespace("my.custom.Namespace", {
- *   endpoint: "...",
- * });
- * ```
- */
-export function connectNamespace(
-  implName: "dir",
-  config: DirNamespaceConfig,
-  options?: Partial<ConnectNamespaceOptions>,
-): Promise<Connection>;
-/**
- * Connect through the built-in REST namespace.
- *
- * Configured with {@link RestNamespaceConfig}. See the function-level
- * documentation above for the full surface, examples, and how this
- * relates to {@link connect}.
- *
- * @example
- * ```ts
- * const db = await connectNamespace("rest", {
- *   uri: "https://catalog.example.com",
- *   headers: { "x-api-key": process.env.CATALOG_KEY ?? "" },
- * });
- * ```
- */
-export function connectNamespace(
-  implName: "rest",
-  config: RestNamespaceConfig,
-  options?: Partial<ConnectNamespaceOptions>,
-): Promise<Connection>;
-/**
- * Connect through a custom namespace implementation by full module path,
- * configured with a free-form string-keyed `properties` map. Use the
- * typed overloads above for the built-in `"dir"` and `"rest"` impls.
- *
- * See the function-level documentation above for examples and how this
- * relates to {@link connect}.
- *
- * @example
- * ```ts
- * const db = await connectNamespace("my.custom.Namespace", {
- *   endpoint: "...",
- * });
- * ```
- */
-export function connectNamespace(
-  implName: string,
-  properties: Record<string, string>,
-  options?: Partial<ConnectNamespaceOptions>,
-): Promise<Connection>;
-export async function connectNamespace(
-  implName: string,
-  configOrProperties:
-    | DirNamespaceConfig
-    | RestNamespaceConfig
-    | Record<string, string>,
-  options?: Partial<ConnectNamespaceOptions>,
-): Promise<Connection> {
-  let properties: Record<string, string>;
-  if (implName === "dir") {
-    properties = dirConfigToProperties(
-      configOrProperties as DirNamespaceConfig,
-    );
-  } else if (implName === "rest") {
-    properties = restConfigToProperties(
-      configOrProperties as RestNamespaceConfig,
-    );
-  } else {
-    properties = configOrProperties as Record<string, string>;
-  }
-
-  const finalOptions: ConnectNamespaceOptions = (options ??
-    {}) as ConnectNamespaceOptions;
-  finalOptions.storageOptions = cleanseStorageOptions(
-    finalOptions.storageOptions,
-  );
-
-  const nativeConn = await LanceDbConnection.newWithNamespace(
-    implName,
-    properties,
-    finalOptions,
-  );
-  return new LocalConnection(nativeConn);
-}
--- a/nodejs/lancedb/scannable.ts
+++ b/nodejs/lancedb/scannable.ts
@@ -1,274 +0,0 @@
-// SPDX-License-Identifier: Apache-2.0
-// SPDX-FileCopyrightText: Copyright The LanceDB Authors
-
-import {
-  Table as ArrowTable,
-  RecordBatch,
-  RecordBatchReader,
-  Schema,
-} from "apache-arrow";
-import {
-  fromRecordBatchToStreamBuffer,
-  fromTableToBuffer,
-  makeEmptyTable,
-} from "./arrow";
-import { NapiScannable } from "./native.js";
-
-export interface ScannableOptions {
-  /** Hint about the number of rows. Not validated against the stream. */
-  numRows?: number;
-  /**
-   * Whether the source can be scanned more than once. Defaults to `true` for
-   * `fromTable` / `fromFactory` and `false` for `fromIterable` /
-   * `fromRecordBatchReader`.
-   */
-  rescannable?: boolean;
-}
-
-/**
- * A data source that can be scanned as a stream of Arrow `RecordBatch`es.
- *
- * `Scannable` wraps the schema + optional row count + rescannable flag and
- * a callback that yields batches one at a time. It is passed to consumers
- * (e.g. `Table.add`, `createTable`, `mergeInsert` — follow-up work) that
- * need to pull data without materializing the full dataset in JS memory.
- *
- * Batches cross the JS↔Rust boundary as Arrow IPC Stream messages; a fresh
- * writer serializes each batch, and the Rust side decodes it with
- * `arrow_ipc::reader::StreamReader`. One batch is in flight at a time.
- */
-export class Scannable {
-  readonly schema: Schema;
-  readonly numRows: number | null;
-  readonly rescannable: boolean;
-
-  /** @hidden */
-  private readonly native: NapiScannable;
-
-  private constructor(
-    native: NapiScannable,
-    schema: Schema,
-    numRows: number | null,
-    rescannable: boolean,
-  ) {
-    this.native = native;
-    this.schema = schema;
-    this.numRows = numRows;
-    this.rescannable = rescannable;
-  }
-
-  /** @hidden Access the native handle for passing through to Rust consumers. */
-  get inner(): NapiScannable {
-    return this.native;
-  }
-
-  /**
-   * Build a Scannable from an explicit schema and a factory that returns a
-   * fresh batch iterator on each call.
-   *
-   * The factory is invoked once per scan. Each iterator yields
-   * `RecordBatch`es matching the declared schema. Use this when you need
-   * direct control over the pull loop — for example, to wrap a streaming
-   * source whose batches are produced lazily.
-   *
-   * @param schema - The Arrow schema of the produced batches.
-   * @param factory - Called at the start of each scan to produce a batch
-   *   iterator. Must be idempotent when `rescannable` is true.
-   * @param opts - Optional hints. `rescannable` defaults to `true`; set to
-   *   `false` if calling `factory()` twice would not reproduce the same data.
-   */
-  static async fromFactory(
-    schema: Schema,
-    factory: () =>
-      | AsyncIterable<RecordBatch>
-      | Iterable<RecordBatch>
-      | AsyncIterator<RecordBatch>
-      | Iterator<RecordBatch>,
-    opts: ScannableOptions = {},
-  ): Promise<Scannable> {
-    const numRows = opts.numRows ?? null;
-    if (numRows != null && !Number.isInteger(numRows)) {
-      throw new TypeError("numRows must be an integer");
-    }
-    const rescannable = opts.rescannable ?? true;
-
-    let iter: AsyncIterator<RecordBatch> | Iterator<RecordBatch> | null = null;
-    const getNextBatch = async (isStart: boolean): Promise<Buffer | null> => {
-      // `isStart` is true on the first pull of every new scan_as_stream.
-      // Drop any cached iterator so factory() is re-invoked for the next scan
-      if (isStart) {
-        iter = null;
-      }
-      if (iter === null) {
-        iter = normalizeIterator(factory());
-      }
-      const result = await iter.next();
-      if (result.done) {
-        iter = null;
-        return null;
-      }
-      return fromRecordBatchToStreamBuffer(result.value);
-    };
-
-    const schemaBuf = await fromTableToBuffer(makeEmptyTable(schema));
-    const native = new NapiScannable(
-      schemaBuf,
-      numRows,
-      rescannable,
-      getNextBatch,
-    );
-    return new Scannable(native, schema, numRows, rescannable);
-  }
-
-  /**
-   * Build a Scannable from an in-memory Arrow `Table`. Always rescannable;
-   * the table's batches are replayed on each scan.
-   *
-   * The table's row count is authoritative: `opts.numRows` must either be
-   * omitted or equal to `table.numRows`. `opts.rescannable` of `false` is
-   * rejected because in-memory Tables are always rescannable.
-   */
-  static async fromTable(
-    table: ArrowTable,
-    opts: ScannableOptions = {},
-  ): Promise<Scannable> {
-    if (opts.numRows != null && opts.numRows !== table.numRows) {
-      throw new TypeError(
-        `opts.numRows (${opts.numRows}) does not match table.numRows (${table.numRows}). ` +
-          `The table's row count is authoritative; omit numRows or pass the matching value.`,
-      );
-    }
-    if (opts.rescannable === false) {
-      throw new TypeError(
-        `fromTable does not accept rescannable: false. ` +
-          `In-memory Arrow Tables are always rescannable; omit the option or pass true.`,
-      );
-    }
-    return Scannable.fromFactory(table.schema, () => table.batches, {
-      numRows: table.numRows,
-      rescannable: true,
-    });
-  }
-
-  /**
-   * Build a Scannable from an iterable of `RecordBatch`es. `rescannable`
-   * defaults to `false`. Pass an explicit schema so the consumer can
-   * validate before any batch is pulled.
-   *
-   * `opts.rescannable: true` is honest for replayable iterables (Arrays,
-   * Sets, or custom iterables whose `[Symbol.iterator]()` returns a fresh
-   * iterator each call). It is rejected for one-shot iterables (generators,
-   * async generators, or already-an-iterator inputs) because their
-   * `[Symbol.iterator]()` returns the same exhausted object on the second
-   * scan. For replayable sources outside this shape, use
-   * `fromFactory(schema, () => createIter(), { rescannable: true })`.
-   *
-   * Note: when `opts.rescannable` is `true`, the constructor calls
-   * `[Symbol.iterator]()` once on the input to perform the structural check.
-   */
-  static async fromIterable(
-    schema: Schema,
-    iter: AsyncIterable<RecordBatch> | Iterable<RecordBatch>,
-    opts: ScannableOptions = {},
-  ): Promise<Scannable> {
-    if (opts.rescannable === true && isOneShotIterable(iter)) {
-      throw new TypeError(
-        `fromIterable: rescannable: true is not honest for one-shot iterables ` +
-          `(generators, async generators, or iterators where [Symbol.iterator]() ` +
-          `returns the same object). The source would be exhausted after the first scan. ` +
-          `Use fromFactory(schema, () => createIter(), { rescannable: true }) for sources ` +
-          `where each call mints a fresh iterator.`,
-      );
-    }
-    return Scannable.fromFactory(schema, () => iter, {
-      numRows: opts.numRows,
-      rescannable: opts.rescannable ?? false,
-    });
-  }
-
-  /**
-   * Build a Scannable from an Arrow `RecordBatchReader`. A reader can only
-   * be consumed once; `rescannable` defaults to `false`.
-   *
-   * The reader must already be opened (via `.open()`) so its `.schema` is
-   * populated. `RecordBatchReader.from(...)` returns an unopened reader.
-   *
-   * `opts.rescannable: true` is rejected because `RecordBatchReader` is a
-   * self-iterator (its `[Symbol.iterator]()` returns itself), and this
-   * constructor does not call `reader.reset()` between scans, so a second
-   * scan would always see an exhausted reader. For genuinely replayable
-   * sources, use
-   * `fromFactory(schema, () => openReader(), { rescannable: true })`,
-   * which mints a fresh reader on each scan.
-   */
-  static async fromRecordBatchReader(
-    reader: RecordBatchReader,
-    opts: ScannableOptions = {},
-  ): Promise<Scannable> {
-    if (opts.rescannable === true) {
-      throw new TypeError(
-        `fromRecordBatchReader does not accept rescannable: true. ` +
-          `RecordBatchReader is a self-iterator (its [Symbol.iterator]() ` +
-          `returns itself) and would be exhausted after the first scan. ` +
-          `Use fromFactory(schema, () => openReader(), { rescannable: true }) ` +
-          `for sources where each call mints a fresh reader.`,
-      );
-    }
-    return Scannable.fromFactory(reader.schema, () => reader, {
-      numRows: opts.numRows,
-      rescannable: false,
-    });
-  }
-}
-
-function normalizeIterator<T>(
-  source: AsyncIterable<T> | Iterable<T> | AsyncIterator<T> | Iterator<T>,
-): AsyncIterator<T> | Iterator<T> {
-  if (source == null) {
-    throw new TypeError("Scannable factory returned null/undefined");
-  }
-  if (
-    typeof (source as AsyncIterable<T>)[Symbol.asyncIterator] === "function"
-  ) {
-    return (source as AsyncIterable<T>)[Symbol.asyncIterator]();
-  }
-  if (typeof (source as Iterable<T>)[Symbol.iterator] === "function") {
-    return (source as Iterable<T>)[Symbol.iterator]();
-  }
-  // Already an iterator (has `.next`).
-  if (typeof (source as Iterator<T>).next === "function") {
-    return source as Iterator<T>;
-  }
-  throw new TypeError("Scannable factory returned a non-iterable value");
-}
-
-// A "self-iterator" returns the same object from `[Symbol.iterator]()` /
-// `[Symbol.asyncIterator]()`. Generators behave this way, so they exhaust
-// after one pass. Replayable iterables (Array, Set, custom) return a fresh
-// iterator each call. Detection mirrors `normalizeIterator`'s ordering so
-// classification matches scan-time behavior.
-function isOneShotIterable(
-  source: AsyncIterable<unknown> | Iterable<unknown>,
-): boolean {
-  // null/undefined are not one-shot in any meaningful sense; let
-  // `normalizeIterator` raise the actual error at scan time.
-  if (source == null) return false;
-  const ref = source as unknown;
-  if (
-    typeof (source as AsyncIterable<unknown>)[Symbol.asyncIterator] ===
-    "function"
-  ) {
-    const it = (source as AsyncIterable<unknown>)[
-      Symbol.asyncIterator
-    ]() as unknown;
-    return it === ref;
-  }
-  if (typeof (source as Iterable<unknown>)[Symbol.iterator] === "function") {
-    const it = (source as Iterable<unknown>)[Symbol.iterator]() as unknown;
-    return it === ref;
-  }
-  // Already-an-iterator (has `.next` but no `Symbol.iterator`) is by
-  // definition one-shot.
-  if (typeof (source as { next?: unknown }).next === "function") return true;
-  return false;
-}
--- a/nodejs/lancedb/table.ts
+++ b/nodejs/lancedb/table.ts
@@ -285,25 +285,6 @@ export abstract class Table {
   */
  abstract prewarmIndex(name: string): Promise<void>;

-  /**
-   * Prewarm one or more columns of data in the table.
-   *
-   * @param columns The columns to prewarm. If undefined, all columns are prewarmed.
-   *
-   * This will load the column data into the page cache so that future queries that
-   * read those columns avoid the initial cold-start latency.  This call initiates
-   * prewarming and returns once the request is accepted; the warming itself may
-   * continue in the background.  Calling it on already-prewarmed columns is a
-   * no-op on the server.
-   *
-   * Prewarming is generally useful for columns used in filters or projections.
-   * Large columns (e.g. high-dimensional vectors or binary data) may not be
-   * practical to prewarm.
-   *
-   * This feature is currently only supported on remote tables.
-   */
-  abstract prewarmData(columns?: string[]): Promise<void>;
-
  /**
   * Waits for asynchronous indexing to complete on the table.
   *
@@ -729,10 +710,6 @@ export class LocalTable extends Table {
    await this.inner.prewarmIndex(name);
  }

-  async prewarmData(columns?: string[]): Promise<void> {
-    await this.inner.prewarmData(columns);
-  }
-
  async waitForIndex(
    indexNames: string[],
    timeoutSeconds: number,
--- a/nodejs/npm/darwin-arm64/package.json
+++ b/nodejs/npm/darwin-arm64/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@lancedb/lancedb-darwin-arm64",
-	"version": "0.28.0-beta.11",
+	"version": "0.28.0-beta.5",
 	"os": ["darwin"],
 	"cpu": ["arm64"],
 	"main": "lancedb.darwin-arm64.node",
--- a/nodejs/npm/linux-arm64-gnu/package.json
+++ b/nodejs/npm/linux-arm64-gnu/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@lancedb/lancedb-linux-arm64-gnu",
-	"version": "0.28.0-beta.11",
+	"version": "0.28.0-beta.5",
 	"os": ["linux"],
 	"cpu": ["arm64"],
 	"main": "lancedb.linux-arm64-gnu.node",
--- a/nodejs/npm/linux-arm64-musl/package.json
+++ b/nodejs/npm/linux-arm64-musl/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@lancedb/lancedb-linux-arm64-musl",
-	"version": "0.28.0-beta.11",
+	"version": "0.28.0-beta.5",
 	"os": ["linux"],
 	"cpu": ["arm64"],
 	"main": "lancedb.linux-arm64-musl.node",
--- a/nodejs/npm/linux-x64-gnu/package.json
+++ b/nodejs/npm/linux-x64-gnu/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@lancedb/lancedb-linux-x64-gnu",
-	"version": "0.28.0-beta.11",
+	"version": "0.28.0-beta.5",
 	"os": ["linux"],
 	"cpu": ["x64"],
 	"main": "lancedb.linux-x64-gnu.node",
--- a/nodejs/npm/linux-x64-musl/package.json
+++ b/nodejs/npm/linux-x64-musl/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@lancedb/lancedb-linux-x64-musl",
-	"version": "0.28.0-beta.11",
+	"version": "0.28.0-beta.5",
 	"os": ["linux"],
 	"cpu": ["x64"],
 	"main": "lancedb.linux-x64-musl.node",
--- a/nodejs/npm/win32-arm64-msvc/package.json
+++ b/nodejs/npm/win32-arm64-msvc/package.json
@@ -1,6 +1,6 @@
 {
  "name": "@lancedb/lancedb-win32-arm64-msvc",
-  "version": "0.28.0-beta.11",
+  "version": "0.28.0-beta.5",
  "os": [
    "win32"
  ],
--- a/nodejs/npm/win32-x64-msvc/package.json
+++ b/nodejs/npm/win32-x64-msvc/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@lancedb/lancedb-win32-x64-msvc",
-	"version": "0.28.0-beta.11",
+	"version": "0.28.0-beta.5",
 	"os": ["win32"],
 	"cpu": ["x64"],
 	"main": "lancedb.win32-x64-msvc.node",
--- a/nodejs/package-lock.json
+++ b/nodejs/package-lock.json
--- a/nodejs/package.json
+++ b/nodejs/package.json
@@ -11,7 +11,7 @@
    "ann"
  ],
  "private": false,
-  "version": "0.28.0-beta.11",
+  "version": "0.28.0-beta.5",
  "main": "dist/index.js",
  "exports": {
    ".": "./dist/index.js",
@@ -38,15 +38,15 @@
    "url": "https://github.com/lancedb/lancedb"
  },
  "devDependencies": {
-    "@aws-sdk/client-dynamodb": "3.1003.0",
-    "@aws-sdk/client-kms": "3.1003.0",
-    "@aws-sdk/client-s3": "3.1003.0",
+    "@aws-sdk/client-dynamodb": "^3.33.0",
+    "@aws-sdk/client-kms": "^3.33.0",
+    "@aws-sdk/client-s3": "^3.33.0",
    "@biomejs/biome": "^1.7.3",
    "@jest/globals": "^29.7.0",
-    "@napi-rs/cli": "3.5.1",
+    "@napi-rs/cli": "^3.5.1",
    "@types/axios": "^0.14.0",
    "@types/jest": "^29.1.2",
-    "@types/node": "22.7.4",
+    "@types/node": "^22.7.4",
    "@types/tmp": "^0.2.6",
    "apache-arrow-15": "npm:apache-arrow@15.0.0",
    "apache-arrow-16": "npm:apache-arrow@16.0.0",
@@ -57,9 +57,9 @@
    "shx": "^0.3.4",
    "tmp": "^0.2.3",
    "ts-jest": "^29.1.2",
-    "typedoc": "0.26.4",
-    "typedoc-plugin-markdown": "4.2.1",
-    "typescript": "5.5.4",
+    "typedoc": "^0.26.4",
+    "typedoc-plugin-markdown": "^4.2.1",
+    "typescript": "^5.5.4",
    "typescript-eslint": "^7.1.0"
  },
  "ava": {
@@ -68,16 +68,16 @@
  "engines": {
    "node": ">= 18"
  },
-  "packageManager": "pnpm@11.1.1",
  "cpu": ["x64", "arm64"],
  "os": ["darwin", "linux", "win32"],
  "scripts": {
    "artifacts": "napi artifacts",
    "build:debug": "napi build --platform --dts ../lancedb/native.d.ts --js ../lancedb/native.js --output-dir lancedb",
-    "postbuild:debug": "shx mkdir -p dist && shx cp lancedb/*.node dist/ && node -e \"require('fs').writeFileSync('dist/package.json', JSON.stringify({name:'@lancedb/lancedb',type:'commonjs'}))\"",
+    "postbuild:debug": "shx mkdir -p dist && shx cp lancedb/*.node dist/",
    "build:release": "napi build --platform --release --dts ../lancedb/native.d.ts --js ../lancedb/native.js --output-dir dist",
-    "build": "pnpm build:debug && pnpm tsc",
-    "build-release": "pnpm build:release && pnpm tsc",
+    "postbuild:release": "shx mkdir -p dist && shx cp lancedb/*.node dist/",
+    "build": "npm run build:debug && npm run tsc",
+    "build-release": "npm run build:release && npm run tsc",
    "tsc": "tsc -b",
    "posttsc": "shx cp lancedb/native.d.ts dist/native.d.ts",
    "lint-ci": "biome ci .",
@@ -87,7 +87,7 @@
    "lint-fix": "biome check --write . && biome format --write .",
    "prepublishOnly": "napi prepublish -t npm",
    "test": "jest --verbose",
-    "integration": "S3_TEST=1 pnpm test",
+    "integration": "S3_TEST=1 npm run test",
    "universal": "napi universalize",
    "version": "napi version"
  },
@@ -95,8 +95,8 @@
    "reflect-metadata": "^0.2.2"
  },
  "optionalDependencies": {
-    "@huggingface/transformers": "3.0.2",
-    "openai": "4.29.2"
+    "@huggingface/transformers": "^3.0.2",
+    "openai": "^4.29.2"
  },
  "peerDependencies": {
    "apache-arrow": ">=15.0.0 <=18.1.0"
--- a/nodejs/pnpm-lock.yaml
+++ b/nodejs/pnpm-lock.yaml
--- a/nodejs/pnpm-workspace.yaml
+++ b/nodejs/pnpm-workspace.yaml
@@ -1,18 +0,0 @@
-# Flat node_modules layout. The @napi-rs/cli build step fails to locate
-# the cdylib artifact under pnpm's isolated layout; the hoisted linker
-# mirrors npm's structure and unblocks the native build.
-nodeLinker: hoisted
-
-# Block resolution of versions less than 24h old (Shai-Hulud window).
-# This is the pnpm 11 default but pinned here so it's visible to
-# reviewers and survives a future pnpm major flipping the default.
-minimumReleaseAge: 1440
-
-# Fail install if a transitive dep tries to run an unapproved script.
-strictDepBuilds: true
-
-allowBuilds:
-  '@biomejs/biome': true
-  onnxruntime-node: true
-  protobufjs: true
-  sharp: true
--- a/nodejs/src/connection.rs
+++ b/nodejs/src/connection.rs
@@ -8,16 +8,12 @@ use lancedb::database::{CreateTableMode, Database};
 use napi::bindgen_prelude::*;
 use napi_derive::*;

-use crate::ConnectNamespaceOptions;
 use crate::ConnectionOptions;
 use crate::error::NapiErrorExt;
 use crate::header::JsHeaderProvider;
 use crate::table::Table;
-use lancedb::connection::{ConnectBuilder, Connection as LanceDBConnection, connect_namespace};
+use lancedb::connection::{ConnectBuilder, Connection as LanceDBConnection};

-use lance_namespace::models::{
-    CreateNamespaceRequest, DescribeNamespaceRequest, DropNamespaceRequest, ListNamespacesRequest,
-};
 use lancedb::ipc::{ipc_file_to_batches, ipc_file_to_schema};

 #[napi]
@@ -25,29 +21,6 @@ pub struct Connection {
    inner: Option<LanceDBConnection>,
 }

-#[napi(object)]
-pub struct DescribeNamespaceResponse {
-    pub properties: Option<HashMap<String, String>>,
-}
-
-#[napi(object)]
-pub struct ListNamespacesResponse {
-    pub namespaces: Vec<String>,
-    pub page_token: Option<String>,
-}
-
-#[napi(object)]
-pub struct CreateNamespaceResponse {
-    pub properties: Option<HashMap<String, String>>,
-    pub transaction_id: Option<String>,
-}
-
-#[napi(object)]
-pub struct DropNamespaceResponse {
-    pub properties: Option<HashMap<String, String>>,
-    pub transaction_id: Option<Vec<String>>,
-}
-
 impl Connection {
    pub(crate) fn inner_new(inner: LanceDBConnection) -> Self {
        Self { inner: Some(inner) }
@@ -94,12 +67,6 @@ impl Connection {
                builder = builder.storage_option(key, value);
            }
        }
-        if let Some(manifest_enabled) = options.manifest_enabled {
-            builder = builder.manifest_enabled(manifest_enabled);
-        }
-        if let Some(namespace_client_properties) = options.namespace_client_properties {
-            builder = builder.namespace_client_properties(namespace_client_properties);
-        }

        // Create client config, optionally with header provider
        let client_config = options.client_config.unwrap_or_default();
@@ -133,39 +100,6 @@ impl Connection {
        Ok(Self::inner_new(builder.execute().await.default_error()?))
    }

-    /// Create a new Connection instance backed by a namespace implementation.
-    #[napi(factory)]
-    pub async fn new_with_namespace(
-        impl_name: String,
-        properties: HashMap<String, String>,
-        options: ConnectNamespaceOptions,
-    ) -> napi::Result<Self> {
-        if impl_name.is_empty() {
-            return Err(napi::Error::from_reason(
-                "implName must be a non-empty string",
-            ));
-        }
-
-        let mut builder = connect_namespace(&impl_name, properties);
-        if let Some(interval) = options.read_consistency_interval {
-            builder =
-                builder.read_consistency_interval(std::time::Duration::from_secs_f64(interval));
-        }
-        if let Some(storage_options) = options.storage_options {
-            for (key, value) in storage_options {
-                builder = builder.storage_option(key, value);
-            }
-        }
-        if let Some(namespace_client_properties) = options.namespace_client_properties {
-            builder = builder.namespace_client_properties(namespace_client_properties);
-        }
-        if let Some(session) = options.session {
-            builder = builder.session(session.inner.clone());
-        }
-
-        Ok(Self::inner_new(builder.execute().await.default_error()?))
-    }
-
    #[napi]
    pub fn display(&self) -> napi::Result<String> {
        Ok(self.get_inner()?.to_string())
@@ -328,149 +262,9 @@ impl Connection {
            .default_error()
    }

-    #[napi(catch_unwind)]
-    pub async fn rename_table(
-        &self,
-        old_name: String,
-        new_name: String,
-        namespace_path: Option<Vec<String>>,
-    ) -> napi::Result<()> {
-        let ns = namespace_path.unwrap_or_default();
-        self.get_inner()?
-            .rename_table(&old_name, &new_name, &ns, &ns)
-            .await
-            .default_error()
-    }
-
    #[napi(catch_unwind)]
    pub async fn drop_all_tables(&self, namespace_path: Option<Vec<String>>) -> napi::Result<()> {
        let ns = namespace_path.unwrap_or_default();
        self.get_inner()?.drop_all_tables(&ns).await.default_error()
    }
-
-    #[napi(catch_unwind)]
-    /// Describe a namespace and return its properties.
-    pub async fn describe_namespace(
-        &self,
-        namespace_path: Vec<String>,
-    ) -> napi::Result<DescribeNamespaceResponse> {
-        let req = DescribeNamespaceRequest {
-            id: Some(namespace_path),
-            ..Default::default()
-        };
-        let resp = self
-            .get_inner()?
-            .describe_namespace(req)
-            .await
-            .default_error()?;
-        Ok(DescribeNamespaceResponse {
-            properties: resp.properties,
-        })
-    }
-
-    #[napi(catch_unwind)]
-    /// List child namespaces under the given namespace path
-    pub async fn list_namespaces(
-        &self,
-        namespace_path: Option<Vec<String>>,
-        page_token: Option<String>,
-        limit: Option<u32>,
-    ) -> napi::Result<ListNamespacesResponse> {
-        let req = ListNamespacesRequest {
-            id: namespace_path,
-            page_token,
-            limit: limit.map(|l| l as i32),
-            ..Default::default()
-        };
-        let resp = self
-            .get_inner()?
-            .list_namespaces(req)
-            .await
-            .default_error()?;
-        Ok(ListNamespacesResponse {
-            namespaces: resp.namespaces,
-            page_token: resp.page_token,
-        })
-    }
-
-    #[napi(catch_unwind)]
-    /// Create a new namespace with optional properties.
-    pub async fn create_namespace(
-        &self,
-        namespace_path: Vec<String>,
-        mode: Option<String>,
-        properties: Option<HashMap<String, String>>,
-    ) -> napi::Result<CreateNamespaceResponse> {
-        let mode_str = mode
-            .map(|m| match m.to_lowercase().as_str() {
-                "create" => Ok("Create".to_string()),
-                "exist_ok" => Ok("ExistOk".to_string()),
-                "overwrite" => Ok("Overwrite".to_string()),
-                _ => Err(napi::Error::from_reason(format!(
-                    "Invalid mode '{}': expected one of 'create', 'exist_ok', 'overwrite'",
-                    m
-                ))),
-            })
-            .transpose()?;
-        let req = CreateNamespaceRequest {
-            id: Some(namespace_path),
-            mode: mode_str,
-            properties,
-            ..Default::default()
-        };
-        let resp = self
-            .get_inner()?
-            .create_namespace(req)
-            .await
-            .default_error()?;
-        Ok(CreateNamespaceResponse {
-            properties: resp.properties,
-            transaction_id: resp.transaction_id,
-        })
-    }
-
-    #[napi(catch_unwind)]
-    /// Drop a namespace.
-    pub async fn drop_namespace(
-        &self,
-        namespace_path: Vec<String>,
-        mode: Option<String>,
-        behavior: Option<String>,
-    ) -> napi::Result<DropNamespaceResponse> {
-        let mode_str = mode
-            .map(|m| match m.to_lowercase().as_str() {
-                "skip" => Ok("Skip".to_string()),
-                "fail" => Ok("Fail".to_string()),
-                _ => Err(napi::Error::from_reason(format!(
-                    "Invalid mode '{}': expected one of 'skip', 'fail'",
-                    m
-                ))),
-            })
-            .transpose()?;
-        let behavior_str = behavior
-            .map(|b| match b.to_lowercase().as_str() {
-                "restrict" => Ok("Restrict".to_string()),
-                "cascade" => Ok("Cascade".to_string()),
-                _ => Err(napi::Error::from_reason(format!(
-                    "Invalid behavior '{}': expected one of 'restrict', 'cascade'",
-                    b
-                ))),
-            })
-            .transpose()?;
-        let req = DropNamespaceRequest {
-            id: Some(namespace_path),
-            mode: mode_str,
-            behavior: behavior_str,
-            ..Default::default()
-        };
-        let resp = self
-            .get_inner()?
-            .drop_namespace(req)
-            .await
-            .default_error()?;
-        Ok(DropNamespaceResponse {
-            properties: resp.properties,
-            transaction_id: resp.transaction_id,
-        })
-    }
 }
--- a/nodejs/src/lib.rs
+++ b/nodejs/src/lib.rs
@@ -16,7 +16,6 @@ pub mod permutation;
 mod query;
 pub mod remote;
 mod rerankers;
-mod scannable;
 mod session;
 mod table;
 mod util;
@@ -36,15 +35,8 @@ pub struct ConnectionOptions {
    pub read_consistency_interval: Option<f64>,
    /// (For LanceDB OSS only): configuration for object storage.
    ///
-    /// The available options are described at https://docs.lancedb.com/storage/
+    /// The available options are described at https://lancedb.com/docs/storage/
    pub storage_options: Option<HashMap<String, String>>,
-    /// (For LanceDB OSS only): use directory namespace manifests as the source
-    /// of truth for table metadata. Existing directory-listed root tables are
-    /// migrated into the manifest on access.
-    pub manifest_enabled: Option<bool>,
-    /// (For LanceDB OSS only): extra properties for the backing namespace
-    /// client used by manifest-enabled native connections.
-    pub namespace_client_properties: Option<HashMap<String, String>>,
    /// (For LanceDB OSS only): the session to use for this connection. Holds
    /// shared caches and other session-specific state.
    pub session: Option<session::Session>,
@@ -68,26 +60,6 @@ pub struct OpenTableOptions {
    pub storage_options: Option<HashMap<String, String>>,
 }

-#[napi(object)]
-#[derive(Debug)]
-pub struct ConnectNamespaceOptions {
-    /// The interval, in seconds, at which to check for updates to the table
-    /// from other processes. If None, then consistency is not checked. For
-    /// performance reasons, this is the default. For strong consistency, set
-    /// this to zero seconds. Then every read will check for updates from other
-    /// processes. As a compromise, you can set this to a non-zero value for
-    /// eventual consistency.
-    pub read_consistency_interval: Option<f64>,
-    /// Configuration for object storage. The available options are described
-    /// at https://docs.lancedb.com/storage/
-    pub storage_options: Option<HashMap<String, String>>,
-    /// Extra properties for the backing namespace client.
-    pub namespace_client_properties: Option<HashMap<String, String>>,
-    /// The session to use for this connection. Holds shared caches and other
-    /// session-specific state.
-    pub session: Option<session::Session>,
-}
-
 #[napi_derive::module_init]
 fn init() {
    let env = Env::new()
--- a/nodejs/src/rerankers.rs
+++ b/nodejs/src/rerankers.rs
@@ -18,7 +18,6 @@ type RerankHybridFn = ThreadsafeFunction<
    RerankHybridCallbackArgs,
    Status,
    false,
-    true,
 >;

 /// Reranker implementation that "wraps" a NodeJS Reranker implementation.
@@ -33,10 +32,7 @@ impl Reranker {
    pub fn new(
        rerank_hybrid: Function<RerankHybridCallbackArgs, Promise<Buffer>>,
    ) -> napi::Result<Self> {
-        let rerank_hybrid = rerank_hybrid
-            .build_threadsafe_function()
-            .weak::<true>()
-            .build()?;
+        let rerank_hybrid = rerank_hybrid.build_threadsafe_function().build()?;
        Ok(Self { rerank_hybrid })
    }
 }
--- a/nodejs/src/scannable.rs
+++ b/nodejs/src/scannable.rs
@@ -1,253 +0,0 @@
-// SPDX-License-Identifier: Apache-2.0
-// SPDX-FileCopyrightText: Copyright The LanceDB Authors
-
-//! NodeJS binding for the [`lancedb::data::scannable::Scannable`] trait.
-//!
-//! The JS side supplies a `getNextBatch(isStart)` callback that returns the
-//! next Arrow `RecordBatch` encoded as a self-contained Arrow IPC Stream
-//! message (schema message + record batch message + EOS marker) wrapped in a
-//! `Buffer`, or `null` when the stream is exhausted. The Rust side parses
-//! each buffer with `arrow_ipc::reader::StreamReader`, validates every
-//! standalone batch stream against the declared schema, and yields decoded
-//! `RecordBatch`es as a [`SendableRecordBatchStream`].
-//!
-//! `isStart` is `true` on the first `getNextBatch` call of each new
-//! `scan_as_stream` and `false` thereafter. JS uses it to drop any cached
-//! iterator and re-invoke its factory at scan boundaries, so retries
-//! triggered by mid-stream failures restart at batch 0.
-
-use std::io::Cursor;
-use std::sync::Arc;
-
-use arrow_array::RecordBatch;
-use arrow_ipc::reader::StreamReader;
-use arrow_schema::SchemaRef;
-use futures::stream::once;
-use lancedb::arrow::{SendableRecordBatchStream, SimpleRecordBatchStream};
-use lancedb::data::scannable::Scannable as LanceScannable;
-use lancedb::ipc::ipc_file_to_schema;
-use lancedb::{Error, Result as LanceResult};
-use napi::bindgen_prelude::*;
-use napi::threadsafe_function::ThreadsafeFunction;
-use napi_derive::napi;
-
-/// Threadsafe handle to the JS `getNextBatch` callback. The callback takes a
-/// single boolean `isStart` (`true` on the first call of each new scan) and
-/// returns a Promise that resolves to a `Buffer` containing one IPC Stream
-/// message, or `null` at end-of-stream.
-type GetNextBatchFn = ThreadsafeFunction<bool, Promise<Option<Buffer>>, bool, Status, false>;
-
-/// A Rust-side view of a JS-constructed `Scannable`.
-///
-/// Held in JS as the return value of the `Scannable` class constructor. When
-/// passed to a consumer that accepts `impl lancedb::data::scannable::Scannable`,
-/// the consumer invokes `scan_as_stream()` to pull batches through the JS
-/// callback.
-#[napi]
-pub struct NapiScannable {
-    schema: SchemaRef,
-    num_rows: Option<usize>,
-    rescannable: bool,
-    // `ThreadsafeFunction` is not `Clone`; wrap in `Arc` so the stream
-    // returned by `scan_as_stream` can own a handle independent of `self`.
-    get_next_batch: Arc<GetNextBatchFn>,
-    // Tracks whether a scan has already started; used to enforce one-shot
-    // semantics on non-rescannable sources.
-    scanned: bool,
-}
-
-#[napi]
-impl NapiScannable {
-    /// Construct a new `NapiScannable`.
-    ///
-    /// - `schema_buf` — Arrow IPC File buffer carrying only the schema (no batches).
-    /// - `num_rows` — optional row count hint; not validated against the stream.
-    /// - `rescannable` — whether `get_next_batch` may be re-driven after the
-    ///   scan completes.
-    /// - `get_next_batch` -- JS callback that yields the next batch as an Arrow
-    ///   IPC Stream message wrapped in a `Buffer`, or `null` at EOF. The
-    ///   `isStart` argument is `true` on the first call of each new scan;
-    ///   JS uses it to discard any cached iterator before pulling.
-    #[napi(constructor)]
-    pub fn new(
-        schema_buf: Buffer,
-        num_rows: Option<i64>,
-        rescannable: bool,
-        get_next_batch: Function<bool, Promise<Option<Buffer>>>,
-    ) -> napi::Result<Self> {
-        let schema = ipc_file_to_schema(schema_buf.to_vec())
-            .map_err(|e| napi::Error::from_reason(format!("Invalid schema buffer: {}", e)))?;
-        let num_rows = num_rows
-            .map(|n| {
-                usize::try_from(n)
-                    .map_err(|_| napi::Error::from_reason("num_rows must be non-negative"))
-            })
-            .transpose()?;
-        let get_next_batch = Arc::new(get_next_batch.build_threadsafe_function().build()?);
-        Ok(Self {
-            schema,
-            num_rows,
-            rescannable,
-            get_next_batch,
-            scanned: false,
-        })
-    }
-}
-
-impl std::fmt::Debug for NapiScannable {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
-        f.debug_struct("NapiScannable")
-            .field("schema", &self.schema)
-            .field("num_rows", &self.num_rows)
-            .field("rescannable", &self.rescannable)
-            .finish()
-    }
-}
-
-impl LanceScannable for NapiScannable {
-    fn schema(&self) -> SchemaRef {
-        self.schema.clone()
-    }
-
-    fn scan_as_stream(&mut self) -> SendableRecordBatchStream {
-        let schema = self.schema.clone();
-
-        // One-shot enforcement for non-rescannable sources: return a stream
-        // whose first item is an error.
-        if self.scanned && !self.rescannable {
-            let err_stream = once(async {
-                Err(Error::InvalidInput {
-                    message: "Scannable has already been consumed (non-rescannable source)"
-                        .to_string(),
-                })
-            });
-            return Box::pin(SimpleRecordBatchStream::new(err_stream, schema));
-        }
-        self.scanned = true;
-
-        let tsfn = Arc::clone(&self.get_next_batch);
-        let declared_schema = schema.clone();
-
-        // State threaded through the unfold. `is_first_pull` starts true so
-        // the first call into JS signals a new-scan boundary; JS uses it to
-        // reset any cached iterator before factory()-ing a fresh one.
-        let initial = State {
-            tsfn,
-            batch_index: 0,
-            declared_schema,
-            errored: false,
-            is_first_pull: true,
-        };
-
-        let stream = futures::stream::unfold(initial, |mut state| async move {
-            if state.errored {
-                return None;
-            }
-
-            // Pull the next IPC Stream buffer from JS. `is_first_pull` is
-            // consumed here and cleared so subsequent pulls continue the
-            // same scan rather than restarting it.
-            let is_start = state.is_first_pull;
-            state.is_first_pull = false;
-            let buf = match pull_next(&state.tsfn, is_start).await {
-                Ok(Some(buf)) => buf,
-                Ok(None) => return None,
-                Err(e) => {
-                    state.errored = true;
-                    return Some((Err(e), state));
-                }
-            };
-
-            match decode_one_batch(buf.as_ref(), &state.declared_schema) {
-                Ok(batch) => {
-                    state.batch_index += 1;
-                    Some((Ok(batch), state))
-                }
-                Err(e) => {
-                    let tagged = Error::Runtime {
-                        message: format!(
-                            "[scannable/rust-bridge] failure at batch index {}: {}",
-                            state.batch_index, e
-                        ),
-                    };
-                    state.errored = true;
-                    Some((Err(tagged), state))
-                }
-            }
-        });
-
-        Box::pin(SimpleRecordBatchStream::new(stream, schema))
-    }
-
-    fn num_rows(&self) -> Option<usize> {
-        self.num_rows
-    }
-
-    fn rescannable(&self) -> bool {
-        self.rescannable
-    }
-}
-
-struct State {
-    tsfn: Arc<GetNextBatchFn>,
-    batch_index: usize,
-    declared_schema: SchemaRef,
-    errored: bool,
-    /// True for the very first pull of a new scan. Forwarded to JS so the
-    /// callback can drop any cached iterator and call its factory fresh,
-    /// which makes rescannable sources restart at batch 0 even when the
-    /// previous scan ended mid-stream.
-    is_first_pull: bool,
-}
-
-/// Invoke the JS callback and await its Promise. `is_start` is forwarded to
-/// the JS side as the `isStart` argument so it can reset its iterator at the
-/// scan boundary. Errors on the JS side surface here as rejected promises
-/// and are tunneled back as `lancedb::Error::Runtime`.
-async fn pull_next(tsfn: &GetNextBatchFn, is_start: bool) -> LanceResult<Option<Buffer>> {
-    let promise = tsfn
-        .call_async(is_start)
-        .await
-        .map_err(|e| Error::Runtime {
-            message: format!(
-                "[scannable/js-factory] napi error status={}, reason={}",
-                e.status, e.reason
-            ),
-        })?;
-    promise.await.map_err(|e| Error::Runtime {
-        message: format!(
-            "[scannable/js-iterator] napi error status={}, reason={}",
-            e.status, e.reason
-        ),
-    })
-}
-
-/// Decode one IPC Stream buffer (schema + batch + EOS) into a `RecordBatch`.
-/// Each buffer is a standalone IPC stream, so every decoded stream schema must
-/// match the one declared at construction.
-fn decode_one_batch(buf: &[u8], declared: &SchemaRef) -> LanceResult<RecordBatch> {
-    let reader = StreamReader::try_new(Cursor::new(buf), None).map_err(|e| Error::Runtime {
-        message: format!("failed to open IPC stream reader: {}", e),
-    })?;
-
-    let actual = reader.schema();
-    if actual.as_ref() != declared.as_ref() {
-        return Err(Error::InvalidInput {
-            message: format!(
-                "declared schema does not match stream schema: declared={:?} actual={:?}",
-                declared, actual
-            ),
-        });
-    }
-
-    let mut iter = reader;
-    let batch = iter
-        .next()
-        .ok_or_else(|| Error::Runtime {
-            message: "IPC stream contained schema but no record batch".to_string(),
-        })?
-        .map_err(|e| Error::Runtime {
-            message: format!("failed to decode record batch: {}", e),
-        })?;
-    Ok(batch)
-}
--- a/nodejs/src/table.rs
+++ b/nodejs/src/table.rs
@@ -159,14 +159,6 @@ impl Table {
            .default_error()
    }

-    #[napi(catch_unwind)]
-    pub async fn prewarm_data(&self, columns: Option<Vec<String>>) -> napi::Result<()> {
-        self.inner_ref()?
-            .prewarm_data(columns)
-            .await
-            .default_error()
-    }
-
    #[napi(catch_unwind)]
    pub async fn wait_for_index(&self, index_names: Vec<String>, timeout_s: i64) -> Result<()> {
        let timeout = std::time::Duration::from_secs(timeout_s.try_into().unwrap());
--- a/python/.bumpversion.toml
+++ b/python/.bumpversion.toml
@@ -1,5 +1,5 @@
 [tool.bumpversion]
-current_version = "0.31.0-beta.11"
+current_version = "0.31.0-beta.5"
 parse = """(?x)
    (?P<major>0|[1-9]\\d*)\\.
    (?P<minor>0|[1-9]\\d*)\\.
--- a/python/Cargo.toml
+++ b/python/Cargo.toml
@@ -1,7 +1,6 @@
 [package]
 name = "lancedb-python"
-version = "0.31.0-beta.11"
-publish = false
+version = "0.31.0-beta.5"
 edition.workspace = true
 description = "Python bindings for LanceDB"
 license.workspace = true
@@ -15,19 +14,18 @@ name = "_lancedb"
 crate-type = ["cdylib"]

 [dependencies]
-arrow = { version = "58.0.0", features = ["pyarrow"] }
+arrow = { version = "57.2", features = ["pyarrow"] }
 async-trait = "0.1"
 bytes = "1"
 lancedb = { path = "../rust/lancedb", default-features = false }
-datafusion-common.workspace = true
 lance-core.workspace = true
 lance-namespace.workspace = true
 lance-namespace-impls.workspace = true
 lance-io.workspace = true
 env_logger.workspace = true
 log.workspace = true
-pyo3 = { version = "0.28", features = ["extension-module", "abi3-py39"] }
-pyo3-async-runtimes = { version = "0.28", features = [
+pyo3 = { version = "0.26", features = ["extension-module", "abi3-py39"] }
+pyo3-async-runtimes = { version = "0.26", features = [
    "attributes",
    "tokio-runtime",
 ] }
@@ -36,11 +34,10 @@ futures.workspace = true
 serde = "1"
 serde_json = "1"
 snafu.workspace = true
-tokio = { version = "1.40", features = ["sync", "rt-multi-thread"] }
-libc = "0.2"
+tokio = { version = "1.40", features = ["sync"] }

 [build-dependencies]
-pyo3-build-config = { version = "0.28", features = [
+pyo3-build-config = { version = "0.26", features = [
    "extension-module",
    "abi3-py39",
 ] }
--- a/python/PYTHON_THIRD_PARTY_LICENSES.md
+++ b/python/PYTHON_THIRD_PARTY_LICENSES.md
@@ -183,6 +183,7 @@
 | stack-data                     | 0.6.3           | MIT License                                                                                      | http://github.com/alexmojaki/stack_data                                                           |
 | sympy                          | 1.14.0          | BSD License                                                                                      | https://sympy.org                                                                                 |
 | tabulate                       | 0.9.0           | MIT License                                                                                      | https://github.com/astanin/python-tabulate                                                        |
+| tantivy                        | 0.25.1          | UNKNOWN                                                                                          | UNKNOWN                                                                                           |
 | threadpoolctl                  | 3.6.0           | BSD License                                                                                      | https://github.com/joblib/threadpoolctl                                                           |
 | timm                           | 1.0.24          | Apache Software License                                                                          | https://github.com/huggingface/pytorch-image-models                                               |
 | tinycss2                       | 1.4.0           | BSD License                                                                                      | https://www.courtbouillon.org/tinycss2                                                            |
--- a/python/pyproject.toml
+++ b/python/pyproject.toml
@@ -57,6 +57,7 @@ tests = [
    "duckdb>=0.9.0",
    "pytz>=2023.3",
    "polars>=0.19, <=1.3.0",
+    "tantivy>=0.20.0",
    "pyarrow-stubs>=16.0",
    "pylance>=5.0.0b5",
    "requests>=2.31.0",
--- a/python/python/lancedb/init.py
+++ b/python/python/lancedb/init.py
@@ -7,6 +7,7 @@ import os
 from concurrent.futures import ThreadPoolExecutor
 from datetime import timedelta
 from typing import Dict, Optional, Union, Any, List
+import warnings

 __version__ = importlib.metadata.version("lancedb")

@@ -72,7 +73,6 @@ def connect(
    client_config: Union[ClientConfig, Dict[str, Any], None] = None,
    storage_options: Optional[Dict[str, str]] = None,
    session: Optional[Session] = None,
-    manifest_enabled: bool = False,
    namespace_client_impl: Optional[str] = None,
    namespace_client_properties: Optional[Dict[str, str]] = None,
    namespace_client_pushdown_operations: Optional[List[str]] = None,
@@ -110,11 +110,7 @@ def connect(
        default configuration is used.
    storage_options: dict, optional
        Additional options for the storage backend. See available options at
-        <https://docs.lancedb.com/storage/>
-    manifest_enabled : bool, default False
-        When true for local/native connections, use directory namespace
-        manifests as the source of truth for table metadata. Existing
-        directory-listed root tables are migrated into the manifest on access.
+        <https://lancedb.com/docs/storage/>
    session: Session, optional
        (For LanceDB OSS only)
        A session to use for this connection. Sessions allow you to configure
@@ -162,11 +158,11 @@ def connect(
    conn : DBConnection
        A connection to a LanceDB database.
    """
-    if namespace_client_impl is not None:
-        if namespace_client_properties is None:
+    if namespace_client_impl is not None or namespace_client_properties is not None:
+        if namespace_client_impl is None or namespace_client_properties is None:
            raise ValueError(
-                "namespace_client_properties must be provided when "
-                "namespace_client_impl is set"
+                "Both namespace_client_impl and "
+                "namespace_client_properties must be provided"
            )
        if kwargs:
            raise ValueError(f"Unknown keyword arguments: {kwargs}")
@@ -179,12 +175,6 @@ def connect(
            namespace_client_pushdown_operations=namespace_client_pushdown_operations,
        )

-    if namespace_client_properties is not None and not manifest_enabled:
-        raise ValueError(
-            "namespace_client_impl must be provided when using "
-            "namespace_client_properties unless manifest_enabled=True"
-        )
-
    if namespace_client_pushdown_operations is not None:
        raise ValueError(
            "namespace_client_pushdown_operations is only valid when "
@@ -222,8 +212,6 @@ def connect(
        read_consistency_interval=read_consistency_interval,
        storage_options=storage_options,
        session=session,
-        manifest_enabled=manifest_enabled,
-        namespace_client_properties=namespace_client_properties,
    )


@@ -301,8 +289,6 @@ def deserialize_conn(
            parsed["uri"],
            read_consistency_interval=rci,
            storage_options=storage_options,
-            manifest_enabled=parsed.get("manifest_enabled", False),
-            namespace_client_properties=parsed.get("namespace_client_properties"),
        )
    else:
        raise ValueError(f"Unknown connection_type: {connection_type}")
@@ -318,8 +304,6 @@ async def connect_async(
    client_config: Optional[Union[ClientConfig, Dict[str, Any]]] = None,
    storage_options: Optional[Dict[str, str]] = None,
    session: Optional[Session] = None,
-    manifest_enabled: bool = False,
-    namespace_client_properties: Optional[Dict[str, str]] = None,
 ) -> AsyncConnection:
    """Connect to a LanceDB database.

@@ -352,20 +336,13 @@ async def connect_async(
        default configuration is used.
    storage_options: dict, optional
        Additional options for the storage backend. See available options at
-        <https://docs.lancedb.com/storage/>
+        <https://lancedb.com/docs/storage/>
    session: Session, optional
        (For LanceDB OSS only)
        A session to use for this connection. Sessions allow you to configure
        cache sizes for index and metadata caches, which can significantly
        impact memory use and performance. They can also be re-used across
        multiple connections to share the same cache state.
-    manifest_enabled : bool, default False
-        When true for local/native connections, use directory namespace
-        manifests as the source of truth for table metadata. Existing
-        directory-listed root tables are migrated into the manifest on access.
-    namespace_client_properties : dict, optional
-        Additional directory namespace client properties to use with
-        ``manifest_enabled=True``.

    Examples
    --------
@@ -408,8 +385,6 @@ async def connect_async(
            client_config,
            storage_options,
            session,
-            manifest_enabled,
-            namespace_client_properties,
        )
    )

@@ -437,3 +412,13 @@ __all__ = [
    "Table",
    "__version__",
 ]
+
+
+def __warn_on_fork():
+    """Emit a warning that lance is not fork-safe and suggest using spawn."""
+    message = (
+        "lance is not fork-safe. If you are using multiprocessing, use spawn instead."
+    )
+    warnings.warn(message)
+
+
+if hasattr(os, "register_at_fork"):
+    os.register_at_fork(before=__warn_on_fork)  # type: ignore[attr-defined]
--- a/python/python/lancedb/_lancedb.pyi
+++ b/python/python/lancedb/_lancedb.pyi
@@ -12,7 +12,6 @@ from .index import (
    LabelList,
    HnswPq,
    HnswSq,
-    HnswFlat,
    FTS,
 )
 from lance_namespace import (
@@ -26,7 +25,6 @@ from .remote import ClientConfig

 IvfHnswPq: type[HnswPq] = HnswPq
 IvfHnswSq: type[HnswSq] = HnswSq
-IvfHnswFlat: type[HnswFlat] = HnswFlat

 class PyExpr:
    """A type-safe DataFusion expression node (Rust-side handle)."""
@@ -51,7 +49,7 @@ class PyExpr:
    def to_sql(self) -> str: ...

 def expr_col(name: str) -> PyExpr: ...
-def expr_lit(value: Union[bool, int, float, str, bytes]) -> PyExpr: ...
+def expr_lit(value: Union[bool, int, float, str]) -> PyExpr: ...
 def expr_func(name: str, args: List[PyExpr]) -> PyExpr: ...

 class Session:
@@ -182,7 +180,6 @@ class Table:
            IvfPq,
            HnswPq,
            HnswSq,
-            HnswFlat,
            BTree,
            Bitmap,
            LabelList,
@@ -245,8 +242,6 @@ async def connect(
    client_config: Optional[Union[ClientConfig, Dict[str, Any]]],
    storage_options: Optional[Dict[str, str]],
    session: Optional[Session],
-    manifest_enabled: bool = False,
-    namespace_client_properties: Optional[Dict[str, str]] = None,
 ) -> Connection: ...

 class RecordBatchStream:
@@ -445,7 +440,7 @@ class AsyncPermutationBuilder:
    async def execute(self) -> Table: ...

 def async_permutation_builder(
-    table: Table,
+    table: Table, dest_table_name: str
 ) -> AsyncPermutationBuilder: ...
 def fts_query_to_json(query: Any) -> str: ...

--- a/python/python/lancedb/background_loop.py
+++ b/python/python/lancedb/background_loop.py
@@ -2,9 +2,7 @@
 # SPDX-FileCopyrightText: Copyright The LanceDB Authors

 import asyncio
-import os
 import threading
-import warnings


 class BackgroundEventLoop:
@@ -15,9 +13,6 @@ class BackgroundEventLoop:
    """

    def __init__(self):
-        self._start()
-
-    def _start(self):
        self.loop = asyncio.new_event_loop()
        self.thread = threading.Thread(
            target=self.loop.run_forever,
@@ -36,30 +31,3 @@ class BackgroundEventLoop:


 LOOP = BackgroundEventLoop()
-
-_FORK_WARNED = False
-
-
-def _reset_after_fork():
-    # Threads do not survive fork(), so the asyncio loop in LOOP.thread is
-    # dead in the child. Re-initialize the singleton in place so existing
-    # `from .background_loop import LOOP` references in other modules see
-    # the new state. The Rust-side tokio runtime is reset analogously by a
-    # pthread_atfork hook installed in the _lancedb extension.
-    LOOP._start()
-    global _FORK_WARNED
-    if not _FORK_WARNED:
-        _FORK_WARNED = True
-        warnings.warn(
-            "lancedb fork support is experimental: the internal async "
-            "runtime has been reset in the forked child, but a small chance "
-            "of deadlock remains if other state was mid-operation at fork "
-            "time. The 'forkserver' or 'spawn' multiprocessing start method "
-            "is likely a safer alternative.",
-            RuntimeWarning,
-            stacklevel=2,
-        )
-
-
-if hasattr(os, "register_at_fork"):
-    os.register_at_fork(after_in_child=_reset_after_fork)
--- a/python/python/lancedb/common.py
+++ b/python/python/lancedb/common.py
@@ -96,7 +96,7 @@ def data_to_reader(
            f"Unknown data type {type(data)}. "
            "Supported types: list of dicts, pandas DataFrame, polars DataFrame, "
            "pyarrow Table/RecordBatch, or Pydantic models. "
-            "See https://docs.lancedb.com/tables/ for examples."
+            "See https://lancedb.com/docs/tables/ for examples."
        )


--- a/python/python/lancedb/db.py
+++ b/python/python/lancedb/db.py
@@ -282,7 +282,7 @@ class DBConnection(EnforceOverrides):
            Additional options for the storage backend. Options already set on the
            connection will be inherited by the table, but can be overridden here.
            See available options at
-            <https://docs.lancedb.com/storage/>
+            <https://lancedb.com/docs/storage/>

            To enable stable row IDs (row IDs remain stable after compaction,
            update, delete, and merges), set `new_table_enable_stable_row_ids`
@@ -433,7 +433,7 @@ class DBConnection(EnforceOverrides):
            Additional options for the storage backend. Options already set on the
            connection will be inherited by the table, but can be overridden here.
            See available options at
-            <https://docs.lancedb.com/storage/>
+            <https://lancedb.com/docs/storage/>

        Returns
        -------
@@ -590,13 +590,8 @@ class LanceDBConnection(DBConnection):
        read_consistency_interval: Optional[timedelta] = None,
        storage_options: Optional[Dict[str, str]] = None,
        session: Optional[Session] = None,
-        manifest_enabled: bool = False,
-        namespace_client_properties: Optional[Dict[str, str]] = None,
        _inner: Optional[LanceDbConnection] = None,
    ):
-        self.storage_options = storage_options
-        self._manifest_enabled = manifest_enabled
-        self._namespace_client_properties = namespace_client_properties
        if _inner is not None:
            self._conn = _inner
            self._cached_namespace_client = None
@@ -638,8 +633,6 @@ class LanceDBConnection(DBConnection):
                None,
                storage_options,
                session,
-                manifest_enabled,
-                namespace_client_properties,
            )

        # TODO: It would be nice if we didn't store self.storage_options but it is
@@ -647,6 +640,7 @@ class LanceDBConnection(DBConnection):
        # work because some paths like LanceDBConnection.from_inner will lose the
        # storage_options.  Also, this class really shouldn't be holding any state
        # beyond _conn.
+        self.storage_options = storage_options
        self._conn = AsyncConnection(LOOP.run(do_connect()))
        self._cached_namespace_client: Optional[LanceNamespace] = None

@@ -683,8 +677,6 @@ class LanceDBConnection(DBConnection):
                "connection_type": "local",
                "uri": self.uri,
                "storage_options": self.storage_options,
-                "manifest_enabled": self._manifest_enabled,
-                "namespace_client_properties": self._namespace_client_properties,
                "read_consistency_interval_seconds": (
                    rci.total_seconds() if rci else None
                ),
@@ -1398,7 +1390,6 @@ class AsyncConnection(object):
        namespace_path: Optional[List[str]] = None,
        embedding_functions: Optional[List[EmbeddingFunctionConfig]] = None,
        location: Optional[str] = None,
-        namespace_client: Optional[Any] = None,
    ) -> AsyncTable:
        """Create an [AsyncTable][lancedb.table.AsyncTable] in the database.

@@ -1443,7 +1434,7 @@ class AsyncConnection(object):
            Additional options for the storage backend. Options already set on the
            connection will be inherited by the table, but can be overridden here.
            See available options at
-            <https://docs.lancedb.com/storage/>
+            <https://lancedb.com/docs/storage/>

            To enable stable row IDs (row IDs remain stable after compaction,
            update, delete, and merges), set `new_table_enable_stable_row_ids`
@@ -1596,7 +1587,6 @@ class AsyncConnection(object):
                namespace_path=namespace_path,
                storage_options=storage_options,
                location=location,
-                namespace_client=namespace_client,
            )
        else:
            data = data_to_reader(data, schema)
@@ -1607,7 +1597,6 @@ class AsyncConnection(object):
                namespace_path=namespace_path,
                storage_options=storage_options,
                location=location,
-                namespace_client=namespace_client,
            )

        return AsyncTable(new_table)
@@ -1636,7 +1625,7 @@ class AsyncConnection(object):
            Additional options for the storage backend. Options already set on the
            connection will be inherited by the table, but can be overridden here.
            See available options at
-            <https://docs.lancedb.com/storage/>
+            <https://lancedb.com/docs/storage/>
        index_cache_size: int, default 256
            **Deprecated**: Use session-level cache configuration instead.
            Create a Session with custom cache sizes and pass it to lancedb.connect().
--- a/python/python/lancedb/expr.py
+++ b/python/python/lancedb/expr.py
@@ -63,7 +63,7 @@ def _coerce(value: "ExprLike") -> "Expr":


 # Type alias used in annotations.
-ExprLike = Union["Expr", bool, int, float, str, bytes]
+ExprLike = Union["Expr", bool, int, float, str]


 class Expr:
@@ -261,13 +261,13 @@ def col(name: str) -> Expr:
    return Expr(expr_col(name))


-def lit(value: Union[bool, int, float, str, bytes]) -> Expr:
+def lit(value: Union[bool, int, float, str]) -> Expr:
    """Create a literal (constant) value expression.

    Parameters
    ----------
    value:
-        A Python ``bool``, ``int``, ``float``, ``str``, or ``bytes``.
+        A Python ``bool``, ``int``, ``float``, or ``str``.

    Examples
    --------
--- a/python/python/lancedb/fts.py
+++ b/python/python/lancedb/fts.py
@@ -0,0 +1,201 @@
+# SPDX-License-Identifier: Apache-2.0
+# SPDX-FileCopyrightText: Copyright The LanceDB Authors
+
+"""Full text search index using tantivy-py"""
+
+import os
+from typing import List, Tuple, Optional
+
+import pyarrow as pa
+
+try:
+    import tantivy
+except ImportError:
+    raise ImportError(
+        "Please install tantivy-py `pip install tantivy` to use the full text search feature."  # noqa: E501
+    )
+
+from .table import LanceTable
+
+
+def create_index(
+    index_path: str,
+    text_fields: List[str],
+    ordering_fields: Optional[List[str]] = None,
+    tokenizer_name: str = "default",
+) -> tantivy.Index:
+    """
+    Open a tantivy index at ``index_path`` with the schema used for search.
+
+    The schema holds a stored integer ``doc_id`` field, one stored text field
+    per entry in ``text_fields`` and one fast unsigned field per entry in
+    ``ordering_fields``. No documents are added here.
+
+    Parameters
+    ----------
+    index_path : str
+        Path to the index directory; it is created if it does not exist
+    text_fields : List[str]
+        Names of the text fields to add to the schema
+    ordering_fields : List[str], optional
+        Names of unsigned fields that can be used for ordering at search
+        time. ``None`` is treated the same as an empty list.
+    tokenizer_name : str, default "default"
+        The tokenizer name passed to every text field
+
+    Returns
+    -------
+    index : tantivy.Index
+        The index object (this function does not populate it)
+    """
+    builder = tantivy.SchemaBuilder()
+    # Reserved field; populate_index stores the running row counter in it.
+    builder.add_integer_field("doc_id", stored=True)
+    for text_name in text_fields:
+        builder.add_text_field(text_name, stored=True, tokenizer_name=tokenizer_name)
+    # `or ()` folds the None default (and an empty list) into "nothing to add".
+    for ordering_name in ordering_fields or ():
+        builder.add_unsigned_field(ordering_name, fast=True)
+    schema = builder.build()
+
+    # The directory must exist before the index is opened on it.
+    os.makedirs(index_path, exist_ok=True)
+    return tantivy.Index(schema, path=index_path)
+
+
+def populate_index(
+    index: tantivy.Index,
+    table: LanceTable,
+    fields: List[str],
+    writer_heap_size: Optional[int] = None,
+    ordering_fields: Optional[List[str]] = None,
+) -> int:
+    """
+    Write the rows of a LanceTable into a tantivy index.
+
+    Every row read from the table advances a running counter. A row is only
+    written as a document when at least one of its values is non-null, and
+    the counter value at that point is stored in the document's ``doc_id``.
+
+    Parameters
+    ----------
+    index : tantivy.Index
+        The index object to write into
+    table : LanceTable
+        The table to index
+    fields : List[str]
+        Names of the text fields to index. A dotted name is resolved as a
+        path into struct columns when no top-level field has that name.
+    writer_heap_size : int, optional
+        The writer heap size in bytes; ``None`` or ``0`` selects 1GB
+    ordering_fields : List[str], optional
+        Names of columns whose values are added as unsigned fields.
+        ``None`` is treated as an empty list.
+
+    Returns
+    -------
+    int
+        The number of rows read from the table
+
+    Raises
+    ------
+    TypeError
+        If a field in ``fields`` is neither a string nor a large string
+    """
+    ordering_fields = [] if ordering_fields is None else ordering_fields
+    heap_size = writer_heap_size or 1024 * 1024 * 1024
+
+    # Validate every requested field up front, before any writer is created.
+    nested_names = []
+    for name in fields:
+        try:
+            field = table.schema.field(name)  # raises KeyError if not found
+        except KeyError:
+            # Not a top-level column: treat the name as a dotted struct path.
+            field = resolve_path(table.schema, name)
+            nested_names.append(name)
+
+        is_text = pa.types.is_string(field.type) or pa.types.is_large_string(
+            field.type
+        )
+        if not is_text:
+            raise TypeError(f"Field {name} is not a string type")
+
+    writer = index.writer(heap_size=heap_size)
+    dataset = table.to_lance()
+
+    # Deepest dotted path among the nested fields; 0 when there are none.
+    depth = max((name.count(".") + 1 for name in nested_names), default=0)
+
+    rows_seen = 0
+    for batch in dataset.to_batches(columns=fields + ordering_fields):
+        if depth > 0:
+            # Flatten struct columns so dotted names can be looked up directly.
+            batch = pa.Table.from_batches([batch])
+            for _ in range(depth - 1):
+                batch = batch.flatten()
+        for i in range(batch.num_rows):
+            doc = tantivy.Document()
+            for name in fields:
+                text = batch[name][i].as_py()
+                if text is not None:
+                    doc.add_text(name, text)
+            for name in ordering_fields:
+                number = batch[name][i].as_py()
+                if number is not None:
+                    doc.add_unsigned(name, number)
+            # Rows with no values at all are skipped but still counted.
+            if not doc.is_empty:
+                doc.add_integer("doc_id", rows_seen)
+                writer.add_document(doc)
+            rows_seen += 1
+
+    writer.commit()
+    return rows_seen
+
+
+def resolve_path(schema, field_name: str) -> pa.Field:
+    """
+    Resolve a dotted field path to the field it names
+
+    Parameters
+    ----------
+    schema
+        The schema whose ``field`` lookup resolves the first path segment
+    field_name : str
+        The field path to resolve, with segments separated by "."
+
+    Returns
+    -------
+    pa.Field
+        The field found at the end of the path
+
+    Raises
+    ------
+    KeyError
+        If a segment has to be looked up inside a field that is not a struct
+    """
+    head, *rest = field_name.split(".")
+    current = schema.field(head)
+    for segment in rest:
+        # Only struct fields have children to descend into.
+        if not pa.types.is_struct(current.type):
+            raise KeyError(f"field {field_name} not found in schema {schema}")
+        current = current.type.field(segment)
+    return current
+
+
+def search_index(
+    index: tantivy.Index, query: str, limit: int = 10, ordering_field=None
+) -> Tuple[Tuple[int], Tuple[float]]:
+    """
+    Run a query string against an index and collect ids and scores
+
+    Parameters
+    ----------
+    index : tantivy.Index
+        The index object
+    query : str
+        The query string, parsed with ``index.parse_query``
+    limit : int
+        The maximum number of results to return
+    ordering_field : optional
+        When truthy, passed to the searcher as ``order_by_field``
+
+    Returns
+    -------
+    ids_and_score: tuple[tuple[int], tuple[float]]
+        A tuple of two tuples, the first containing the ``doc_id`` values
+        and the second containing the scores. Both are empty when the
+        search reports a count of zero.
+    """
+    searcher = index.searcher()
+    parsed_query = index.parse_query(query)
+
+    # Only pass order_by_field when an ordering field was actually requested.
+    search_options = {"order_by_field": ordering_field} if ordering_field else {}
+    results = searcher.search(parsed_query, limit, **search_options)
+
+    if results.count == 0:
+        return tuple(), tuple()
+
+    # Each hit is (score, address); pair the stored doc_id with its score.
+    id_score_pairs = [
+        (searcher.doc(doc_address)["doc_id"][0], score)
+        for score, doc_address in results.hits
+    ]
+    # Transpose the list of pairs into (ids, scores).
+    return tuple(zip(*id_score_pairs))
--- a/python/python/lancedb/index.py
+++ b/python/python/lancedb/index.py
@@ -7,7 +7,6 @@ from typing import Literal, Optional
 from ._lancedb import (
    IndexConfig,
 )
-from .types import BaseTokenizerType

 lang_mapping = {
    "ar": "Arabic",
@@ -112,12 +111,8 @@ class FTS:
        - "simple": Splits text by whitespace and punctuation.
        - "whitespace": Split text by whitespace, but not punctuation.
        - "raw": No tokenization. The entire text is treated as a single token.
-        - "ngram": N-gram tokenizer for substring-style matching.
-        - "jieba/*": Jieba tokenizer loaded from Lance's language model home.
-        - "lindera/*": Lindera tokenizer loaded from Lance's language model home.
    language : str, default "English"
-        The language to use for stemming and stop-word removal. This is not the
-        primary way to enable CJK tokenization.
+        The language to use for tokenization.
    max_token_length : int, default 40
        The maximum token length to index. Tokens longer than this length will be
        ignored.
@@ -132,17 +127,10 @@ class FTS:
    ascii_folding : bool, default True
        Whether to fold ASCII characters. This converts accented characters to
        their ASCII equivalent. For example, "café" would be converted to "cafe".
-
-    Notes
-    -----
-    Model-backed tokenizers such as ``jieba/default`` and ``lindera/ipadic``
-    require tokenizer models in Lance's language model home. Set
-    ``LANCE_LANGUAGE_MODEL_HOME`` to override the default platform data
-    directory under ``lance/language_models``.
    """

    with_position: bool = False
-    base_tokenizer: BaseTokenizerType = "simple"
+    base_tokenizer: Literal["simple", "raw", "whitespace"] = "simple"
    language: str = "English"
    max_token_length: Optional[int] = 40
    lower_case: bool = True
@@ -388,98 +376,9 @@ class HnswSq:
    target_partition_size: Optional[int] = None


-@dataclass
-class HnswFlat:
-    """Describe a HNSW-FLAT index configuration.
-
-    HNSW-FLAT stands for Hierarchical Navigable Small World without quantization.
-    It stores raw vectors in the HNSW graph, providing the highest recall among
-    the IVF_HNSW family at the cost of more memory and disk space compared to
-    :class:`HnswSq` or :class:`HnswPq`.
-
-    Parameters
-    ----------
-
-    distance_type: str, default "l2"
-
-        The distance metric used to train the index.
-
-        The following distance types are available:
-
-        "l2" - Euclidean distance. This is a very common distance metric that
-        accounts for both magnitude and direction when determining the distance
-        between vectors. l2 distance has a range of [0, ∞).
-
-        "cosine" - Cosine distance.  Cosine distance is a distance metric
-        calculated from the cosine similarity between two vectors. Cosine
-        similarity is a measure of similarity between two non-zero vectors of an
-        inner product space. It is defined to equal the cosine of the angle
-        between them.  Unlike l2, the cosine distance is not affected by the
-        magnitude of the vectors.  Cosine distance has a range of [0, 2].
-
-        "dot" - Dot product. Dot distance is the dot product of two vectors. Dot
-        distance has a range of (-∞, ∞). If the vectors are normalized (i.e. their
-        l2 norm is 1), then dot distance is equivalent to the cosine distance.
-
-    num_partitions, default sqrt(num_rows)
-
-        The number of IVF partitions to create.
-
-        For HNSW, we recommend a small number of partitions. Setting this to 1
-        works well for most tables. For very large tables, training just one HNSW
-        graph will require too much memory. Each partition becomes its own HNSW
-        graph, so setting this value higher reduces the peak memory use of
-        training.
-
-    max_iterations, default 50
-
-        Max iterations to train kmeans.
-
-        When training an IVF index we use kmeans to calculate the partitions.
-        This parameter controls how many iterations of kmeans to run.
-
-    sample_rate, default 256
-
-        The rate used to calculate the number of training vectors for kmeans.
-
-    m, default 20
-
-        The number of neighbors to select for each vector in the HNSW graph.
-
-        This value controls the tradeoff between search speed and accuracy.
-        The higher the value the more accurate the search but the slower it
-        will be.
-
-    ef_construction, default 300
-
-        The number of candidates to evaluate during the construction of the HNSW
-        graph.
-
-        This value controls the tradeoff between build speed and accuracy.
-        The higher the value the more accurate the build but the slower it will
-        be.  150 to 300 is the typical range. 100 is a minimum for good quality
-        search results. In most cases, there is no benefit to setting this higher
-        than 500.  This value should be set to a value that is not less than `ef`
-        in the search phase.
-
-    target_partition_size, default is 1,048,576
-
-        The target size of each partition.
-    """
-
-    distance_type: Literal["l2", "cosine", "dot"] = "l2"
-    num_partitions: Optional[int] = None
-    max_iterations: int = 50
-    sample_rate: int = 256
-    m: int = 20
-    ef_construction: int = 300
-    target_partition_size: Optional[int] = None
-
-
 # Backwards-compatible aliases
 IvfHnswPq = HnswPq
 IvfHnswSq = HnswSq
-IvfHnswFlat = HnswFlat


@dataclass
@@ -799,13 +698,11 @@ __all__ = [
    "IvfPq",
    "IvfHnswPq",
    "IvfHnswSq",
-    "IvfHnswFlat",
    "IvfSq",
    "IvfRq",
    "IvfFlat",
    "HnswPq",
    "HnswSq",
-    "HnswFlat",
    "IndexConfig",
    "FTS",
    "Bitmap",
--- a/python/python/lancedb/namespace.py
+++ b/python/python/lancedb/namespace.py
@@ -10,6 +10,7 @@ through a namespace abstraction.

 from __future__ import annotations

+import asyncio
 import sys
 from typing import TYPE_CHECKING, Any, Dict, Iterable, List, Optional, Union

@@ -24,24 +25,7 @@ if TYPE_CHECKING:
 from datetime import timedelta
 import pyarrow as pa

-from lance_namespace_urllib3_client.models.json_arrow_data_type import JsonArrowDataType
-from lance_namespace_urllib3_client.models.json_arrow_field import JsonArrowField
-from lance_namespace_urllib3_client.models.json_arrow_schema import JsonArrowSchema
-from lance_namespace_urllib3_client.models.query_table_request import QueryTableRequest
-from lance_namespace_urllib3_client.models.query_table_request_columns import (
-    QueryTableRequestColumns,
-)
-from lance_namespace_urllib3_client.models.query_table_request_full_text_query import (
-    QueryTableRequestFullTextQuery,
-)
-from lance_namespace_urllib3_client.models.query_table_request_vector import (
-    QueryTableRequestVector,
-)
-from lance_namespace_urllib3_client.models.string_fts_query import StringFtsQuery
-from lance_namespace.errors import TableNotFoundError
-from lancedb._lancedb import connect_namespace_client as _connect_namespace_client
-from lancedb.background_loop import LOOP
-from lancedb.db import AsyncConnection, DBConnection
+from lancedb.db import DBConnection, LanceDBConnection
 from lancedb.namespace_utils import (
    _normalize_create_namespace_mode,
    _normalize_drop_namespace_mode,
@@ -56,11 +40,14 @@ from lance_namespace import (
    ListNamespacesResponse,
    ListTablesResponse,
    ListTablesRequest,
+    DescribeTableRequest,
    DescribeNamespaceRequest,
    DropTableRequest,
    ListNamespacesRequest,
    CreateNamespaceRequest,
    DropNamespaceRequest,
+    DeclareTableRequest,
+    CreateTableRequest,
 )
 from lancedb.table import AsyncTable, LanceTable, Table
 from lancedb.util import validate_table_name
@@ -69,6 +56,21 @@ from lancedb.pydantic import LanceModel
 from lancedb.embeddings import EmbeddingFunctionConfig
 from ._lancedb import Session

+from lance_namespace_urllib3_client.models.json_arrow_schema import JsonArrowSchema
+from lance_namespace_urllib3_client.models.json_arrow_field import JsonArrowField
+from lance_namespace_urllib3_client.models.json_arrow_data_type import JsonArrowDataType
+from lance_namespace_urllib3_client.models.query_table_request import QueryTableRequest
+from lance_namespace_urllib3_client.models.query_table_request_vector import (
+    QueryTableRequestVector,
+)
+from lance_namespace_urllib3_client.models.query_table_request_columns import (
+    QueryTableRequestColumns,
+)
+from lance_namespace_urllib3_client.models.query_table_request_full_text_query import (
+    QueryTableRequestFullTextQuery,
+)
+from lance_namespace_urllib3_client.models.string_fts_query import StringFtsQuery
+

 def _query_to_namespace_request(
    table_id: List[str],
@@ -422,23 +424,6 @@ class LanceNamespaceDBConnection(DBConnection):
        )
        self._namespace_client_impl = namespace_client_impl
        self._namespace_client_properties = namespace_client_properties
-        self._inner = AsyncConnection(
-            _connect_namespace_client(
-                namespace_client,
-                read_consistency_interval=(
-                    read_consistency_interval.total_seconds()
-                    if read_consistency_interval is not None
-                    else None
-                ),
-                storage_options=self.storage_options or None,
-                session=session,
-                namespace_client_pushdown_operations=(
-                    list(self._namespace_client_pushdown_operations)
-                ),
-                namespace_client_impl=namespace_client_impl,
-                namespace_client_properties=namespace_client_properties,
-            )
-        )

    @override
    def serialize(self) -> str:
@@ -512,10 +497,13 @@ class LanceNamespaceDBConnection(DBConnection):
        if mode.lower() not in ["create", "overwrite"]:
            raise ValueError("mode must be either 'create' or 'overwrite'")
        validate_table_name(name)
-        async_table = LOOP.run(
-            self._inner.create_table(
-                name,
-                data,
+
+        table_id = namespace_path + [name]
+
+        if "CreateTable" in self._namespace_client_pushdown_operations:
+            return self._create_table_server_side(
+                name=name,
+                data=data,
                schema=schema,
                mode=mode,
                exist_ok=exist_ok,
@@ -525,15 +513,130 @@ class LanceNamespaceDBConnection(DBConnection):
                namespace_path=namespace_path,
                storage_options=storage_options,
            )
+
+        # Local create path: declare_table + local write
+        # Step 1: Get the table location and storage options from namespace
+        # In overwrite mode, if the table exists, use describe_table to get its
+        # existing location. Otherwise, call declare_table to reserve
+        # a new location.
+        location = None
+        namespace_storage_options = None
+        if mode.lower() == "overwrite":
+            # Try to describe the table first to see if it exists
+            try:
+                describe_request = DescribeTableRequest(id=table_id)
+                describe_response = self._namespace_client.describe_table(
+                    describe_request
+                )
+                location = describe_response.location
+                namespace_storage_options = describe_response.storage_options
+            except Exception:
+                # Table doesn't exist, will create a new one below
+                pass
+
+        if location is None:
+            # Table doesn't exist or mode is "create", reserve a new location
+            declare_request = DeclareTableRequest(
+                id=table_id,
+                location=None,
+                properties=self.storage_options if self.storage_options else None,
+            )
+            declare_response = self._namespace_client.declare_table(declare_request)
+
+            if not declare_response.location:
+                raise ValueError(
+                    "Table location is missing from declare_table response"
+                )
+
+            location = declare_response.location
+            namespace_storage_options = declare_response.storage_options
+
+        # Merge storage options: self.storage_options < user options < namespace options
+        merged_storage_options = dict(self.storage_options)
+        if storage_options:
+            merged_storage_options.update(storage_options)
+        if namespace_storage_options:
+            merged_storage_options.update(namespace_storage_options)
+
+        # Step 2: Create table using LanceTable.create with the location
+        # We need a temporary connection for the LanceTable.create method
+        temp_conn = LanceDBConnection(
+            location,  # Use the actual location as the connection URI
+            read_consistency_interval=self.read_consistency_interval,
+            storage_options=merged_storage_options,
+            session=self.session,
        )

-        return LanceTable(
-            self,
+        # Note: storage_options_provider is auto-created in Rust from namespace_client
+        tbl = LanceTable.create(
+            temp_conn,
            name,
+            data,
+            schema,
+            mode=mode,
+            exist_ok=exist_ok,
+            on_bad_vectors=on_bad_vectors,
+            fill_value=fill_value,
+            embedding_functions=embedding_functions,
            namespace_path=namespace_path,
+            storage_options=merged_storage_options,
+            location=location,
            namespace_client=self._namespace_client,
            pushdown_operations=self._namespace_client_pushdown_operations,
-            _async=async_table,
+        )
+
+        return tbl
+
+    def _create_table_server_side(
+        self,
+        name: str,
+        data: Optional[DATA],
+        schema: Optional[Union[pa.Schema, LanceModel]],
+        mode: str,
+        exist_ok: bool,
+        on_bad_vectors: str,
+        fill_value: float,
+        embedding_functions: Optional[List[EmbeddingFunctionConfig]],
+        namespace_path: Optional[List[str]],
+        storage_options: Optional[Dict[str, str]],
+    ) -> Table:
+        """Create a table using server-side namespace.create_table()."""
+        if namespace_path is None:
+            namespace_path = []
+        table_id = namespace_path + [name]
+
+        arrow_ipc_bytes = _data_to_arrow_ipc(
+            data=data,
+            schema=schema,
+            embedding_functions=embedding_functions,
+            on_bad_vectors=on_bad_vectors,
+            fill_value=fill_value,
+        )
+
+        merged = dict(self.storage_options or {})
+        if storage_options:
+            merged.update(storage_options)
+        request = CreateTableRequest(
+            id=table_id,
+            mode=_normalize_create_table_mode(mode),
+            properties=merged or None,
+        )
+
+        try:
+            self._namespace_client.create_table(request, arrow_ipc_bytes)
+        except Exception as e:
+            if exist_ok and "already exists" in str(e).lower():
+                return self.open_table(
+                    name,
+                    namespace_path=namespace_path,
+                    storage_options=storage_options,
+                )
+            raise
+
+        return self.open_table(
+            name,
+            namespace_path=namespace_path,
+            storage_options=storage_options,
        )

    @override
@@ -547,28 +650,30 @@ class LanceNamespaceDBConnection(DBConnection):
    ) -> Table:
        if namespace_path is None:
            namespace_path = []
-        try:
-            async_table = LOOP.run(
-                self._inner.open_table(
-                    name,
-                    namespace_path=namespace_path,
-                    storage_options=storage_options,
-                    index_cache_size=index_cache_size,
-                )
-            )
-        except RuntimeError as e:
-            if "Table not found" in str(e):
-                table_id = namespace_path + [name]
-                raise TableNotFoundError(f"Table not found: {'$'.join(table_id)}")
-            raise
+        table_id = namespace_path + [name]
+        request = DescribeTableRequest(id=table_id)
+        response = self._namespace_client.describe_table(request)

-        return LanceTable(
-            self,
+        # Merge storage options: self.storage_options < user options < namespace options
+        merged_storage_options = dict(self.storage_options)
+        if storage_options:
+            merged_storage_options.update(storage_options)
+        if response.storage_options:
+            merged_storage_options.update(response.storage_options)
+
+        # Pass managed_versioning to avoid redundant describe_table call in Rust.
+        # Convert None to False since we already have the answer from describe_table.
+        managed_versioning = response.managed_versioning is True
+
+        # Note: storage_options_provider is auto-created in Rust from namespace_client
+        return self._lance_table_from_uri(
            name,
+            response.location,
            namespace_path=namespace_path,
+            storage_options=merged_storage_options,
+            index_cache_size=index_cache_size,
            namespace_client=self._namespace_client,
-            pushdown_operations=self._namespace_client_pushdown_operations,
-            _async=async_table,
+            managed_versioning=managed_versioning,
        )

    @override
@@ -792,34 +897,33 @@ class LanceNamespaceDBConnection(DBConnection):
        namespace_client: Optional[Any] = None,
        managed_versioning: Optional[bool] = None,
    ) -> LanceTable:
-        # Open a table directly from the namespace-resolved physical location.
-        #
-        # Open the table through the Rust namespace-backed connection.  The Rust
-        # layer keeps the logical namespace path and namespace client intact.
+        # Open a table directly from a URI using the location parameter
+        # Note: storage_options should already be merged by the caller
+        # Note: storage_options_provider is auto-created in Rust from namespace_client
        if namespace_path is None:
            namespace_path = []
-
-        async_table = LOOP.run(
-            self._inner.open_table(
-                name,
-                namespace_path=namespace_path,
-                storage_options=storage_options,
-                index_cache_size=index_cache_size,
-                location=None,
-                namespace_client=namespace_client,
-                managed_versioning=managed_versioning,
-            )
+        temp_conn = LanceDBConnection(
+            table_uri,  # Use the table location as the connection URI
+            read_consistency_interval=self.read_consistency_interval,
+            storage_options=storage_options if storage_options is not None else {},
+            session=self.session,
        )

-        return LanceTable(
-            self,
+        # Open the table using the temporary connection with the location parameter
+        # Pass namespace_client to enable managed versioning support and auto-create
+        # storage options provider
+        # Pass managed_versioning to avoid redundant describe_table call
+        # Pass pushdown_operations if configured on this connection
+        return LanceTable.open(
+            temp_conn,
            name,
            namespace_path=namespace_path,
+            storage_options=storage_options,
+            index_cache_size=index_cache_size,
            location=table_uri,
            namespace_client=namespace_client,
            managed_versioning=managed_versioning,
            pushdown_operations=self._namespace_client_pushdown_operations,
-            _async=async_table,
        )

    @override
@@ -886,23 +990,6 @@ class AsyncLanceNamespaceDBConnection:
        self._namespace_client_pushdown_operations = set(
            namespace_client_pushdown_operations or []
        )
-        self._inner = AsyncConnection(
-            _connect_namespace_client(
-                namespace_client,
-                read_consistency_interval=(
-                    read_consistency_interval.total_seconds()
-                    if read_consistency_interval is not None
-                    else None
-                ),
-                storage_options=self.storage_options or None,
-                session=session,
-                namespace_client_pushdown_operations=(
-                    list(self._namespace_client_pushdown_operations)
-                ),
-                namespace_client_impl=None,
-                namespace_client_properties=None,
-            )
-        )

    async def table_names(
        self,
@@ -954,16 +1041,148 @@ class AsyncLanceNamespaceDBConnection:
        if mode.lower() not in ["create", "overwrite"]:
            raise ValueError("mode must be either 'create' or 'overwrite'")
        validate_table_name(name)
-        return await self._inner.create_table(
+
+        table_id = namespace_path + [name]
+
+        if "CreateTable" in self._namespace_client_pushdown_operations:
+            return await self._create_table_server_side(
+                name=name,
+                data=data,
+                schema=schema,
+                mode=mode,
+                exist_ok=exist_ok,
+                on_bad_vectors=on_bad_vectors,
+                fill_value=fill_value,
+                embedding_functions=embedding_functions,
+                namespace_path=namespace_path,
+                storage_options=storage_options,
+            )
+
+        # Local create path: declare_table + local write
+        # Step 1: Get the table location and storage options from namespace
+        location = None
+        namespace_storage_options = None
+        if mode.lower() == "overwrite":
+            # Try to describe the table first to see if it exists
+            try:
+                describe_request = DescribeTableRequest(id=table_id)
+                describe_response = self._namespace_client.describe_table(
+                    describe_request
+                )
+                location = describe_response.location
+                namespace_storage_options = describe_response.storage_options
+            except Exception:
+                # Table doesn't exist, will create a new one below
+                pass
+
+        if location is None:
+            # Table doesn't exist or mode is "create", reserve a new location
+            declare_request = DeclareTableRequest(
+                id=table_id,
+                location=None,
+                properties=self.storage_options if self.storage_options else None,
+            )
+            declare_response = self._namespace_client.declare_table(declare_request)
+
+            if not declare_response.location:
+                raise ValueError(
+                    "Table location is missing from declare_table response"
+                )
+
+            location = declare_response.location
+            namespace_storage_options = declare_response.storage_options
+
+        # Merge storage options: self.storage_options < user options < namespace options
+        merged_storage_options = dict(self.storage_options)
+        if storage_options:
+            merged_storage_options.update(storage_options)
+        if namespace_storage_options:
+            merged_storage_options.update(namespace_storage_options)
+
+        # Step 2: Create table using LanceTable.create with the location
+        # Run the sync operation in a thread
+        def _create_table():
+            temp_conn = LanceDBConnection(
+                location,
+                read_consistency_interval=self.read_consistency_interval,
+                storage_options=merged_storage_options,
+                session=self.session,
+            )
+
+            # storage_options_provider is auto-created in Rust from namespace_client
+            return LanceTable.create(
+                temp_conn,
+                name,
+                data,
+                schema,
+                mode=mode,
+                exist_ok=exist_ok,
+                on_bad_vectors=on_bad_vectors,
+                fill_value=fill_value,
+                embedding_functions=embedding_functions,
+                namespace_path=namespace_path,
+                storage_options=merged_storage_options,
+                location=location,
+                namespace_client=self._namespace_client,
+                pushdown_operations=self._namespace_client_pushdown_operations,
+            )
+
+        lance_table = await asyncio.to_thread(_create_table)
+        # Get the underlying async table from LanceTable
+        return lance_table._table
+
+    async def _create_table_server_side(
+        self,
+        name: str,
+        data: Optional[DATA],
+        schema: Optional[Union[pa.Schema, LanceModel]],
+        mode: str,
+        exist_ok: bool,
+        on_bad_vectors: str,
+        fill_value: float,
+        embedding_functions: Optional[List[EmbeddingFunctionConfig]],
+        namespace_path: Optional[List[str]],
+        storage_options: Optional[Dict[str, str]],
+    ) -> AsyncTable:
+        """Create a table using server-side namespace.create_table()."""
+        if namespace_path is None:
+            namespace_path = []
+        table_id = namespace_path + [name]
+
+        def _prepare_and_create():
+            arrow_ipc_bytes = _data_to_arrow_ipc(
+                data=data,
+                schema=schema,
+                embedding_functions=embedding_functions,
+                on_bad_vectors=on_bad_vectors,
+                fill_value=fill_value,
+            )
+
+            merged = dict(self.storage_options or {})
+            if storage_options:
+                merged.update(storage_options)
+            request = CreateTableRequest(
+                id=table_id,
+                mode=_normalize_create_table_mode(mode),
+                properties=merged or None,
+            )
+
+            self._namespace_client.create_table(request, arrow_ipc_bytes)
+
+        try:
+            await asyncio.to_thread(_prepare_and_create)
+        except Exception as e:
+            if exist_ok and "already exists" in str(e).lower():
+                return await self.open_table(
+                    name,
+                    namespace_path=namespace_path,
+                    storage_options=storage_options,
+                )
+            raise
+
+        return await self.open_table(
            name,
-            data,
-            schema=schema,
-            mode=mode,
-            exist_ok=exist_ok,
-            on_bad_vectors=on_bad_vectors,
-            fill_value=fill_value,
            namespace_path=namespace_path,
-            embedding_functions=embedding_functions,
            storage_options=storage_options,
        )

@@ -978,18 +1197,45 @@ class AsyncLanceNamespaceDBConnection:
        """Open an existing table from the namespace."""
        if namespace_path is None:
            namespace_path = []
-        try:
-            return await self._inner.open_table(
+        table_id = namespace_path + [name]
+        request = DescribeTableRequest(id=table_id)
+        response = self._namespace_client.describe_table(request)
+
+        # Merge storage options: self.storage_options < user options < namespace options
+        merged_storage_options = dict(self.storage_options)
+        if storage_options:
+            merged_storage_options.update(storage_options)
+        if response.storage_options:
+            merged_storage_options.update(response.storage_options)
+
+        # Capture managed_versioning from describe response.
+        # Convert None to False since we already have the answer from describe_table.
+        managed_versioning = response.managed_versioning is True
+
+        # Open table in a thread
+        # Note: storage_options_provider is auto-created in Rust from namespace_client
+        def _open_table():
+            temp_conn = LanceDBConnection(
+                response.location,
+                read_consistency_interval=self.read_consistency_interval,
+                storage_options=merged_storage_options,
+                session=self.session,
+            )
+
+            return LanceTable.open(
+                temp_conn,
                name,
                namespace_path=namespace_path,
-                storage_options=storage_options,
+                storage_options=merged_storage_options,
                index_cache_size=index_cache_size,
+                location=response.location,
+                namespace_client=self._namespace_client,
+                managed_versioning=managed_versioning,
+                pushdown_operations=self._namespace_client_pushdown_operations,
            )
-        except RuntimeError as e:
-            if "Table not found" in str(e):
-                table_id = namespace_path + [name]
-                raise TableNotFoundError(f"Table not found: {'$'.join(table_id)}")
-            raise
+
+        lance_table = await asyncio.to_thread(_open_table)
+        return lance_table._table

    async def drop_table(self, name: str, namespace_path: Optional[List[str]] = None):
        """Drop a table from the namespace."""
--- a/python/python/lancedb/namespace_utils.py
+++ b/python/python/lancedb/namespace_utils.py
@@ -6,44 +6,22 @@
 from typing import Optional


-_CREATE_NAMESPACE_MODES = frozenset({"create", "exist_ok", "overwrite"})
-_DROP_NAMESPACE_MODES = frozenset({"SKIP", "FAIL"})
-_DROP_NAMESPACE_BEHAVIORS = frozenset({"RESTRICT", "CASCADE"})
-
-
 def _normalize_create_namespace_mode(mode: Optional[str]) -> Optional[str]:
    """Normalize create namespace mode to lowercase (API expects lowercase)."""
    if mode is None:
        return None
-    normalized = mode.lower()
-    if normalized not in _CREATE_NAMESPACE_MODES:
-        raise ValueError(
-            f"Invalid create namespace mode {mode!r}: "
-            f"expected one of 'create', 'exist_ok', 'overwrite'"
-        )
-    return normalized
+    return mode.lower()


 def _normalize_drop_namespace_mode(mode: Optional[str]) -> Optional[str]:
    """Normalize drop namespace mode to uppercase (API expects uppercase)."""
    if mode is None:
        return None
-    normalized = mode.upper()
-    if normalized not in _DROP_NAMESPACE_MODES:
-        raise ValueError(
-            f"Invalid drop namespace mode {mode!r}: expected one of 'skip', 'fail'"
-        )
-    return normalized
+    return mode.upper()


 def _normalize_drop_namespace_behavior(behavior: Optional[str]) -> Optional[str]:
    """Normalize drop namespace behavior to uppercase (API expects uppercase)."""
    if behavior is None:
        return None
-    normalized = behavior.upper()
-    if normalized not in _DROP_NAMESPACE_BEHAVIORS:
-        raise ValueError(
-            f"Invalid drop namespace behavior {behavior!r}: "
-            f"expected one of 'restrict', 'cascade'"
-        )
-    return normalized
+    return behavior.upper()
--- a/python/python/lancedb/permutation.py
+++ b/python/python/lancedb/permutation.py
@@ -1,11 +1,10 @@
 # SPDX-License-Identifier: Apache-2.0
 # SPDX-FileCopyrightText: Copyright The LanceDB Authors

-import copy
-import json
-
 from deprecation import deprecated
+from lancedb import AsyncConnection, DBConnection
 import pyarrow as pa
+import json

 from ._lancedb import async_permutation_builder, PermutationReader
 from .table import LanceTable
@@ -37,7 +36,10 @@ class PermutationBuilder:
    be referenced by name in the future.  If names are not provided then they can only
    be referenced by their ordinal index.  There is no requirement to name every split.

-    The permutation is stored in memory and will be lost when the program exits.
+    By default, the permutation will be stored in memory and will be lost when the
+    program exits.  To persist the permutation (for very large datasets or to share
+    the permutation across multiple workers) use the [persist](#persist) method to
+    create a permanent table.
    """

    def __init__(self, table: LanceTable):
@@ -49,6 +51,15 @@ class PermutationBuilder:
        """
        self._async = async_permutation_builder(table)

+    def persist(
+        self, database: Union[DBConnection, AsyncConnection], table_name: str
+    ) -> "PermutationBuilder":
+        """
+        Persist the permutation to the given database.
+        """
+        self._async.persist(database, table_name)
+        return self
+
    def split_random(
        self,
        *,
@@ -369,44 +380,20 @@ class Permutation:

    def __init__(
        self,
-        base_table: LanceTable,
-        permutation_table: Optional[LanceTable],
-        split: int,
+        reader: PermutationReader,
        selection: dict[str, str],
        batch_size: int,
        transform_fn: Callable[pa.RecordBatch, Any],
-        offset: Optional[int] = None,
-        limit: Optional[int] = None,
-        connection_factory: Optional[Callable[[str], LanceTable]] = None,
-        _reader: Optional[PermutationReader] = None,
    ):
        """
        Internal constructor.  Use [from_tables](#from_tables) instead.
        """
-        assert base_table is not None, "base_table is required"
+        assert reader is not None, "reader is required"
        assert selection is not None, "selection is required"
-        self.base_table = base_table
-        self.permutation_table = permutation_table
-        self.split = split
+        self.reader = reader
        self.selection = selection
        self.transform_fn = transform_fn
        self.batch_size = batch_size
-        self.offset = offset
-        self.limit = limit
-        self.connection_factory = connection_factory
-        if _reader is None:
-            _reader = LOOP.run(self._build_reader())
-        self.reader: PermutationReader = _reader
-
-    async def _build_reader(self) -> PermutationReader:
-        reader = await PermutationReader.from_tables(
-            self.base_table, self.permutation_table, self.split
-        )
-        if self.offset is not None:
-            reader = await reader.with_offset(self.offset)
-        if self.limit is not None:
-            reader = await reader.with_limit(self.limit)
-        return reader

    def _with_selection(self, selection: dict[str, str]) -> "Permutation":
        """
@@ -415,97 +402,21 @@ class Permutation:
        Does not validation of the selection and it replaces it entirely.  This is not
        intended for public use.
        """
-        new = copy.copy(self)
-        new.selection = selection
-        return new
+        return Permutation(self.reader, selection, self.batch_size, self.transform_fn)
+
+    def _with_reader(self, reader: PermutationReader) -> "Permutation":
+        """
+        Creates a new permutation with the given reader
+
+        This is an internal method and should not be used directly.
+        """
+        return Permutation(reader, self.selection, self.batch_size, self.transform_fn)

    def with_batch_size(self, batch_size: int) -> "Permutation":
        """
        Creates a new permutation with the given batch size
        """
-        new = copy.copy(self)
-        new.batch_size = batch_size
-        return new
-
-    def with_connection_factory(
-        self, connection_factory: Callable[[str], LanceTable]
-    ) -> "Permutation":
-        """
-        Creates a new permutation that will use ``connection_factory`` to reopen
-        the base table when this permutation is unpickled in a worker process.
-
-        The factory is a callable that takes a single argument — the base table
-        name — and returns a [LanceTable]. It must be picklable; the worker
-        will pickle it via standard ``pickle`` and call it to recover the base
-        table. Picklable callables in practice means top-level (module-level)
-        functions, ``functools.partial`` of such functions, or instances of
-        picklable classes implementing ``__call__``. Lambdas and closures over
-        local variables don't pickle with the default protocol.
-
-        Setting a factory is necessary when the URI alone is not enough to
-        re-open the connection — most importantly for LanceDB Cloud (``db://``)
-        connections, where ``api_key`` and ``region`` aren't recoverable from
-        the connection object after construction.
-
-        For local file or cloud-storage paths the factory is optional: if not
-        set, ``__getstate__`` falls back to capturing
-        ``(uri, storage_options, namespace_path)`` and re-opening via
-        ``lancedb.connect(uri, storage_options=...)``.
-
-        Examples
-        --------
-        Basic native (file-system path), parameterized via ``functools.partial``::
-
-            import functools, lancedb
-            from lancedb.permutation import Permutation
-
-            def open_native_table(uri: str, table_name: str):
-                return lancedb.connect(uri).open_table(table_name)
-
-            factory = functools.partial(open_native_table, "/data/lance_db")
-            permutation = Permutation.identity(
-                factory("training")
-            ).with_connection_factory(factory)
-
-        Native via :func:`lancedb.connect_namespace` (e.g. a directory- or
-        REST-backed namespace client). The factory takes the
-        implementation name and properties dict as partial-bound args so
-        the worker can rebuild the same namespace connection::
-
-            def open_via_namespace(
-                impl: str, properties: dict[str, str], table_name: str,
-            ):
-                return lancedb.connect_namespace(impl, properties).open_table(
-                    table_name,
-                )
-
-            factory = functools.partial(
-                open_via_namespace,
-                "dir",
-                {"root": "/data/lance_db"},
-            )
-
-        LanceDB Cloud, reading credentials from env vars at worker startup
-        so secrets aren't pickled into the dataset::
-
-            import os, lancedb
-
-            def open_remote_table(table_name: str):
-                db = lancedb.connect(
-                    "db://my-database",
-                    api_key=os.environ["LANCEDB_API_KEY"],
-                    region=os.environ.get("LANCEDB_REGION", "us-east-1"),
-                )
-                return db.open_table(table_name)
-
-            permutation = Permutation.identity(
-                open_remote_table("training")
-            ).with_connection_factory(open_remote_table)
-        """
-        assert connection_factory is not None, "connection_factory is required"
-        new = copy.copy(self)
-        new.connection_factory = connection_factory
-        return new
+        return Permutation(self.reader, self.selection, batch_size, self.transform_fn)

    @classmethod
    def identity(cls, table: LanceTable) -> "Permutation":
@@ -578,126 +489,11 @@ class Permutation:
            schema = await reader.output_schema(None)
            initial_selection = {name: name for name in schema.names}
            return cls(
-                base_table,
-                permutation_table,
-                split,
-                initial_selection,
-                DEFAULT_BATCH_SIZE,
-                Transforms.arrow2python,
-                _reader=reader,
+                reader, initial_selection, DEFAULT_BATCH_SIZE, Transforms.arrow2python
            )

        return LOOP.run(do_from_tables())

-    def __getstate__(self) -> dict[str, Any]:
-        """Build a picklable state dict for this permutation.
-
-        The base table is captured either via a user-supplied
-        ``connection_factory`` (see [with_connection_factory]) or, as a
-        fallback, by introspecting ``(uri, storage_options, namespace_path)``
-        on the connection. The permutation table — always an in-memory
-        LanceDB table — is captured as a pyarrow Table (which pickles via
-        Arrow IPC natively). The reader is dropped from the wire format;
-        ``__setstate__`` rebuilds it from the restored tables.
-        """
-        permutation_data: Optional[pa.Table] = None
-        if self.permutation_table is not None:
-            permutation_data = self.permutation_table.to_arrow()
-
-        common = {
-            "base_table_name": self.base_table.name,
-            "permutation_data": permutation_data,
-            "split": self.split,
-            "selection": self.selection,
-            "batch_size": self.batch_size,
-            "transform_fn": self.transform_fn,
-            "offset": self.offset,
-            "limit": self.limit,
-            "connection_factory": self.connection_factory,
-        }
-
-        if self.connection_factory is not None:
-            # The factory carries enough state to recover the base table on
-            # its own; we don't need to capture the URI / storage options /
-            # namespace from the existing connection.
-            return common
-
-        # URI-introspection fallback: only viable for native (OSS) connections
-        # where (uri, storage_options) is enough to reopen. Remote / cloud
-        # connections don't expose recoverable api_key / region — those users
-        # must call with_connection_factory().
-        try:
-            base_uri = self.base_table._conn.uri
-            storage_options = self.base_table._conn.storage_options
-        except AttributeError as e:
-            raise ValueError(
-                "Cannot pickle this Permutation: the base table's connection "
-                "does not expose a uri/storage_options, which usually means it "
-                "is a remote (LanceDB Cloud) connection. Call "
-                "Permutation.with_connection_factory(...) first to provide a "
-                "picklable callable that re-opens the base table from a worker "
-                "process."
-            ) from e
-
-        if base_uri.startswith("memory://"):
-            # In-memory base tables don't exist in any worker process by
-            # default, so dump the entire base table into the pickle. This
-            # can be expensive for large datasets — users with large
-            # in-memory base tables should either persist them or set a
-            # connection_factory.
-            return {
-                **common,
-                "base_table_data": self.base_table.to_arrow(),
-            }
-
-        return {
-            **common,
-            "base_table_uri": base_uri,
-            "base_table_namespace": self.base_table._namespace_path,
-            "base_table_storage_options": storage_options,
-        }
-
-    def __setstate__(self, state: dict[str, Any]) -> None:
-        from . import connect
-
-        connection_factory = state["connection_factory"]
-        if connection_factory is not None:
-            base_table = connection_factory(state["base_table_name"])
-        elif "base_table_data" in state:
-            # In-memory base table inlined into the pickle; rebuild the same
-            # way we rebuild the in-memory permutation table.
-            mem_db = connect("memory://")
-            base_table = mem_db.create_table(
-                state["base_table_name"], state["base_table_data"]
-            )
-        else:
-            base_db = connect(
-                state["base_table_uri"],
-                storage_options=state["base_table_storage_options"],
-            )
-            base_table = base_db.open_table(
-                state["base_table_name"],
-                namespace_path=state["base_table_namespace"] or None,
-            )
-
-        permutation_table: Optional[LanceTable] = None
-        if state["permutation_data"] is not None:
-            mem_db = connect("memory://")
-            permutation_table = mem_db.create_table(
-                "permutation", state["permutation_data"]
-            )
-
-        self.base_table = base_table
-        self.permutation_table = permutation_table
-        self.split = state["split"]
-        self.selection = state["selection"]
-        self.batch_size = state["batch_size"]
-        self.transform_fn = state["transform_fn"]
-        self.offset = state["offset"]
-        self.limit = state["limit"]
-        self.connection_factory = connection_factory
-        self.reader = LOOP.run(self._build_reader())
-
    @property
    def schema(self) -> pa.Schema:
        async def do_output_schema():
@@ -964,9 +760,7 @@ class Permutation:
        for expensive operations such as image decoding.
        """
        assert transform is not None, "transform is required"
-        new = copy.copy(self)
-        new.transform_fn = transform
-        return new
+        return Permutation(self.reader, self.selection, self.batch_size, transform)

    def __getitem__(self, index: int) -> Any:
        """
@@ -1001,10 +795,12 @@ class Permutation:
        """
        Skip the first `skip` rows of the permutation
        """
-        new = copy.copy(self)
-        new.offset = skip
-        new.reader = LOOP.run(new._build_reader())
-        return new
+
+        async def do_with_skip():
+            reader = await self.reader.with_offset(skip)
+            return self._with_reader(reader)
+
+        return LOOP.run(do_with_skip())

    @deprecated(details="Use with_take instead")
    def take(self, limit: int) -> "Permutation":
@@ -1022,10 +818,12 @@ class Permutation:
        """
        Limit the permutation to `limit` rows (following any `skip`)
        """
-        new = copy.copy(self)
-        new.limit = limit
-        new.reader = LOOP.run(new._build_reader())
-        return new
+
+        async def do_with_take():
+            reader = await self.reader.with_limit(limit)
+            return self._with_reader(reader)
+
+        return LOOP.run(do_with_take())

    @deprecated(details="Use with_repeat instead")
    def repeat(self, times: int) -> "Permutation":
--- a/python/python/lancedb/query.py
+++ b/python/python/lancedb/query.py
@@ -25,6 +25,7 @@ import deprecation
 import numpy as np
 import pyarrow as pa
 import pyarrow.compute as pc
+import pyarrow.fs as pa_fs
 import pydantic

 from lancedb.pydantic import PYDANTIC_VERSION
@@ -1525,7 +1526,9 @@ class LanceFtsQueryBuilder(LanceQueryBuilder):
        return self._table._output_schema(self.to_query_object())

    def to_arrow(self, *, timeout: Optional[timedelta] = None) -> pa.Table:
-        self._table._ensure_no_legacy_fts_index()
+        path, fs, exist = self._table._get_fts_index_path()
+        if exist:
+            return self.tantivy_to_arrow()

        query = self._query
        if self._phrase_query:
@@ -1549,6 +1552,90 @@ class LanceFtsQueryBuilder(LanceQueryBuilder):
    ):
        raise NotImplementedError("to_batches on an FTS query")

+    def tantivy_to_arrow(self) -> pa.Table:
+        """Run this full-text query against the Tantivy index of the table.
+
+        The index is opened from the path reported by
+        ``self._table._get_fts_index_path()`` and searched with
+        ``search_index`` from ``lancedb.fts``. The matching rows are then
+        fetched from the Lance dataset, optionally filtered with the
+        ``where`` expression, and optionally reranked.
+
+        Returns
+        -------
+        pa.Table
+            The selected columns of the matching rows plus a ``_score``
+            column, and a ``_rowid`` column (uint64) when row ids were
+            requested. When the search has no hits, an empty table whose
+            only column is ``_score`` (float32) is returned.
+
+        Raises
+        ------
+        ImportError
+            If the ``tantivy`` package cannot be imported.
+        FileNotFoundError
+            If no FTS index exists at the index path.
+        NotImplementedError
+            If the index path is not on a local filesystem.
+        """
+        try:
+            import tantivy
+        except ImportError:
+            raise ImportError(
+                "Please install tantivy-py `pip install tantivy` to use the full text search feature."  # noqa: E501
+            )
+
+        from .fts import search_index
+
+        # get the index path
+        path, fs, exist = self._table._get_fts_index_path()
+
+        # check that the index exists
+        if not exist:
+            raise FileNotFoundError(
+                "Fts index does not exist. "
+                "Please first call table.create_fts_index(['<field_names>']) to "
+                "create the fts index."
+            )
+
+        # Check that we are on local filesystem
+        if not isinstance(fs, pa_fs.LocalFileSystem):
+            raise NotImplementedError(
+                "Tantivy-based full text search "
+                "is only supported on the local filesystem"
+            )
+        # open the index
+        index = tantivy.Index.open(path)
+        # get the scores and doc ids
+        query = self._query
+        if self._phrase_query:
+            # a phrase query is wrapped in double quotes, so any double quotes
+            # already inside the text are swapped for single quotes first
+            query = query.replace('"', "'")
+            query = f'"{query}"'
+        # fall back to 10 results when no limit was set on the builder
+        limit = self._limit if self._limit is not None else 10
+        row_ids, scores = search_index(
+            index, query, limit, ordering_field=self.ordering_field_name
+        )
+        if len(row_ids) == 0:
+            # no hits: return an empty table that only carries the _score column
+            empty_schema = pa.schema([pa.field("_score", pa.float32())])
+            return pa.Table.from_batches([], schema=empty_schema)
+        scores = pa.array(scores)
+        # fetch the matching rows, then attach their scores as a new column
+        output_tbl = self._table.to_lance().take(row_ids, columns=self._columns)
+        output_tbl = output_tbl.append_column("_score", scores)
+        # this needs to match vector search results which are uint64
+        row_ids = pa.array(row_ids, type=pa.uint64())
+
+        if self._where is not None:
+            # tag every row with its position so that the rows surviving the
+            # filter can be mapped back to the matching entries of row_ids
+            tmp_name = "__lancedb__duckdb__indexer__"
+            output_tbl = output_tbl.append_column(
+                tmp_name, pa.array(range(len(output_tbl)))
+            )
+            try:
+                # TODO would be great to have Substrait generate pyarrow compute
+                # expressions or conversely have pyarrow support SQL expressions
+                # using Substrait
+                import duckdb
+
+                # NOTE(review): `output_tbl` in the SQL text is presumably
+                # resolved by DuckDB from the local variable of the same
+                # name -- confirm against the DuckDB Python API docs
+                indexer = duckdb.sql(
+                    f"SELECT {tmp_name} FROM output_tbl WHERE {self._where}"
+                ).to_arrow_table()[tmp_name]
+                output_tbl = output_tbl.take(indexer).drop([tmp_name])
+                row_ids = row_ids.take(indexer)
+
+            except ImportError:
+                # duckdb is not installed: write the rows to a temporary Lance
+                # dataset and let Lance apply the filter instead
+                import tempfile
+
+                import lance
+
+                # TODO Use "memory://" instead once that's supported
+                with tempfile.TemporaryDirectory() as tmp:
+                    ds = lance.write_dataset(output_tbl, tmp)
+                    output_tbl = ds.to_table(filter=self._where)
+                    indexer = output_tbl[tmp_name]
+                    row_ids = row_ids.take(indexer)
+                    output_tbl = output_tbl.drop([tmp_name])
+
+        if self._with_row_id:
+            output_tbl = output_tbl.append_column("_rowid", row_ids)
+
+        if self._reranker is not None:
+            # the reranker receives the original query text, not the quoted
+            # phrase form built above
+            output_tbl = self._reranker.rerank_fts(self._query, output_tbl)
+        return output_tbl
+
    def rerank(self, reranker: Reranker) -> LanceFtsQueryBuilder:
        """Rerank the results using the specified reranker.

@@ -1643,7 +1730,7 @@ class LanceHybridQueryBuilder(LanceQueryBuilder):
    def _validate_query(self, query, vector=None, text=None):
        if query is not None and (vector is not None or text is not None):
            raise ValueError(
-                "You can either provide a string query in search() method "
+                "You can either provide a string query in search() method"
                "or set `vector()` and `text()` explicitly for hybrid search."
                "But not both."
            )
--- a/python/python/lancedb/remote/table.py
+++ b/python/python/lancedb/remote/table.py
@@ -22,7 +22,6 @@ from lancedb.index import (
    FTS,
    BTree,
    Bitmap,
-    HnswFlat,
    HnswSq,
    IvfFlat,
    IvfPq,
@@ -40,7 +39,6 @@ from lancedb.table import _normalize_progress

 from ..query import LanceVectorQueryBuilder, LanceQueryBuilder, LanceTakeQueryBuilder
 from ..table import AsyncTable, IndexStatistics, Query, Table, Tags
-from ..types import BaseTokenizerType


 class RemoteTable(Table):
@@ -169,7 +167,7 @@ class RemoteTable(Table):
        wait_timeout: Optional[timedelta] = None,
        with_position: bool = False,
        # tokenizer configs:
-        base_tokenizer: BaseTokenizerType = "simple",
+        base_tokenizer: str = "simple",
        language: str = "English",
        max_token_length: Optional[int] = 40,
        lower_case: bool = True,
@@ -286,15 +284,13 @@ class RemoteTable(Table):
            )
        elif index_type == "IVF_HNSW_SQ":
            config = HnswSq(distance_type=metric, num_partitions=num_partitions)
-        elif index_type == "IVF_HNSW_FLAT":
-            config = HnswFlat(distance_type=metric, num_partitions=num_partitions)
        elif index_type == "IVF_FLAT":
            config = IvfFlat(distance_type=metric, num_partitions=num_partitions)
        else:
            raise ValueError(
                f"Unknown vector index type: {index_type}. Valid options are"
                " 'IVF_FLAT', 'IVF_PQ', 'IVF_RQ', 'IVF_SQ',"
-                " 'IVF_HNSW_PQ', 'IVF_HNSW_SQ', 'IVF_HNSW_FLAT'"
+                " 'IVF_HNSW_PQ', 'IVF_HNSW_SQ'"
            )

        LOOP.run(
--- a/python/python/lancedb/table.py
+++ b/python/python/lancedb/table.py
@@ -57,7 +57,6 @@ from .index import (
    LabelList,
    HnswPq,
    HnswSq,
-    HnswFlat,
    FTS,
 )
 from .merge import LanceMergeInsertBuilder
@@ -87,59 +86,6 @@ from .util import (
 )
 from .index import lang_mapping

-_MODEL_BACKED_TOKENIZER_PREFIXES = ("jieba", "lindera")
-_MODEL_BACKED_TOKENIZER_ERRORS = (
-    "unknown base tokenizer",
-    "Invalid directory path:",
-    "Failed to load Jieba",
-    "Failed to load tokenizer config",
-    "Failed to initialize default tokenizer",
-)
-
-
-def _add_unique_note(exception: BaseException, note: str) -> None:
-    existing_notes = getattr(exception, "__notes__", ()) or ()
-    message = (
-        exception.args[0]
-        if exception.args and isinstance(exception.args[0], str)
-        else ""
-    )
-    if note not in existing_notes and note not in message:
-        add_note(exception, note)
-
-
-def _is_model_backed_tokenizer(base_tokenizer: str) -> bool:
-    return any(
-        base_tokenizer == prefix or base_tokenizer.startswith(f"{prefix}/")
-        for prefix in _MODEL_BACKED_TOKENIZER_PREFIXES
-    )
-
-
-def _maybe_add_fts_error_note(
-    exception: BaseException, *, base_tokenizer: str, language: Optional[str] = None
-) -> None:
-    message = str(exception)
-    if language is not None and "not support the requested language" in message:
-        supported_langs = ", ".join(lang_mapping.values())
-        _add_unique_note(exception, f"Supported languages: {supported_langs}")
-        return
-
-    if not _is_model_backed_tokenizer(base_tokenizer):
-        return
-
-    if not any(marker in message for marker in _MODEL_BACKED_TOKENIZER_ERRORS):
-        return
-
-    _add_unique_note(
-        exception,
-        "Model-backed tokenizers such as 'jieba/default' and 'lindera/ipadic' "
-        "require tokenizer models in Lance's language model home. Set "
-        "LANCE_LANGUAGE_MODEL_HOME to override the default platform data "
-        "directory under 'lance/language_models'. Expected layouts include "
-        "'<model-home>/jieba/default/...' and "
-        "'<model-home>/lindera/ipadic/...'.",
-    )
-

 if TYPE_CHECKING:
    from .db import LanceDBConnection
@@ -245,7 +191,7 @@ def _into_pyarrow_reader(
            f"Unknown data type {type(data)}. "
            "Supported types: list of dicts, pandas DataFrame, polars DataFrame, "
            "pyarrow Table/RecordBatch, or Pydantic models. "
-            "See https://docs.lancedb.com/tables/ for examples."
+            "See https://lancedb.com/docs/tables/ for examples."
        )


@@ -997,29 +943,29 @@ class Table(ABC):
        Parameters
        ----------
        field_names: str or list of str
-            The name of the field to index. Native FTS indexes can only be
-            created on a single field at a time. To search over multiple text
-            fields, create a separate FTS index for each field.
+            The name(s) of the field(s) to index.
+            If ``use_tantivy`` is False (default), only a single field name
+            (str) is supported. To index multiple fields, create a separate
+            FTS index for each field.
        replace: bool, default False
            If True, replace the existing index if it exists. Note that this is
            not yet an atomic operation; the index will be temporarily
            unavailable while the new index is being created.
        writer_heap_size: int, default 1GB
-            Deprecated legacy Tantivy parameter. Any value other than the
-            default raises an error.
+            Only available with use_tantivy=True
        ordering_field_names:
-            Deprecated legacy Tantivy parameter. Setting this raises an error.
+            A list of fields of unsigned type to index, so that results can
+            optionally be ordered by them at search time.
+            Only available with use_tantivy=True
        tokenizer_name: str, default "default"
-            A compatibility alias for native tokenizer configs. Can be "raw",
-            "default" or the 2 letter language code followed by "_stem". So
-            for english it would be "en_stem". For new native FTS indexes, use
-            ``base_tokenizer`` directly; ``tokenizer_name`` is a legacy
-            compatibility alias and does not expose model-backed tokenizer names
-            such as ``jieba/default`` or ``lindera/ipadic``.
+            The tokenizer to use for the index. Can be "raw", "default" or the 2 letter
+            language code followed by "_stem". So for english it would be "en_stem".
+            For available languages see: https://docs.rs/tantivy/latest/tantivy/tokenizer/enum.Language.html
        use_tantivy: bool, default False
-            Deprecated legacy Tantivy parameter. Setting this to True raises an
-            error.
+            If True, use the legacy full-text search implementation based on tantivy.
+            If False, use the new full-text search implementation based on lance-index.
        with_position: bool, default False
+            Only available with use_tantivy=False
            If False, do not store the positions of the terms in the text.
            This can reduce the size of the index and improve indexing speed.
            But it will raise an exception for phrase queries.
@@ -1029,11 +975,8 @@ class Table(ABC):
            - "whitespace": Split text by whitespace, but not punctuation.
            - "raw": No tokenization. The entire text is treated as a single token.
            - "ngram": N-Gram tokenizer.
-            - "jieba/*": Jieba tokenizer loaded from Lance's language model home.
-            - "lindera/*": Lindera tokenizer loaded from Lance's language model home.
        language : str, default "English"
-            The language to use for stemming and stop-word removal. This is not
-            the primary way to enable CJK tokenization.
+            The language to use for tokenization.
        max_token_length : int, default 40
            The maximum token length to index. Tokens longer than this length will be
            ignored.
@@ -1059,13 +1002,6 @@ class Table(ABC):
            The timeout to wait if indexing is asynchronous.
        name: str, optional
            The name of the index. If not provided, a default name will be generated.
-
-        Notes
-        -----
-        Model-backed tokenizers such as ``jieba/default`` and ``lindera/ipadic``
-        require tokenizer models in Lance's language model home. Set
-        ``LANCE_LANGUAGE_MODEL_HOME`` to override the default platform data
-        directory under ``lance/language_models``.
        """
        raise NotImplementedError

@@ -1810,16 +1746,6 @@ class Table(ABC):
        index_exists = fs.get_file_info(path).type != pa_fs.FileType.NotFound
        return (path, fs, index_exists)

-    def _ensure_no_legacy_fts_index(self):
-        path, _, exists = self._get_fts_index_path()
-        if exists:
-            raise ValueError(
-                "Legacy Tantivy FTS index detected at "
-                f"{path}. Tantivy-based FTS has been removed. "
-                "Delete the legacy index and recreate it with "
-                "table.create_fts_index(...)."
-            )
-
    @abstractmethod
    def uses_v2_manifest_paths(self) -> bool:
        """
@@ -2237,13 +2163,7 @@ class LanceTable(Table):
        index_cache_size: Optional[int] = None,
        num_bits: int = 8,
        index_type: Literal[
-            "IVF_FLAT",
-            "IVF_SQ",
-            "IVF_PQ",
-            "IVF_RQ",
-            "IVF_HNSW_SQ",
-            "IVF_HNSW_PQ",
-            "IVF_HNSW_FLAT",
+            "IVF_FLAT", "IVF_SQ", "IVF_PQ", "IVF_RQ", "IVF_HNSW_SQ", "IVF_HNSW_PQ"
        ] = "IVF_PQ",
        max_iterations: int = 50,
        sample_rate: int = 256,
@@ -2330,16 +2250,6 @@ class LanceTable(Table):
                ef_construction=ef_construction,
                target_partition_size=target_partition_size,
            )
-        elif index_type == "IVF_HNSW_FLAT":
-            config = HnswFlat(
-                distance_type=metric,
-                num_partitions=num_partitions,
-                max_iterations=max_iterations,
-                sample_rate=sample_rate,
-                m=m,
-                ef_construction=ef_construction,
-                target_partition_size=target_partition_size,
-            )
        else:
            raise ValueError(f"Unknown index type {index_type}")

@@ -2495,57 +2405,41 @@ class LanceTable(Table):
        prefix_only: bool = False,
        name: Optional[str] = None,
    ):
-        self._ensure_no_legacy_fts_index()
+        if not use_tantivy:
+            if not isinstance(field_names, str):
+                raise ValueError(
+                    "Native FTS indexes can only be created on a single field "
+                    "at a time. To search over multiple text fields, create a "
+                    "separate FTS index for each field."
+                )

-        if use_tantivy:
-            raise ValueError(
-                "Tantivy-based FTS has been removed. "
-                "Remove use_tantivy and recreate the index with native FTS."
-            )
-        if ordering_field_names is not None:
-            raise ValueError(
-                "ordering_field_names was only supported by the removed "
-                "Tantivy-based FTS implementation."
-            )
-        if writer_heap_size != 1024 * 1024 * 1024:
-            raise ValueError(
-                "writer_heap_size was only supported by the removed "
-                "Tantivy-based FTS implementation."
-            )
-        if not isinstance(field_names, str):
-            raise ValueError(
-                "Native FTS indexes can only be created on a single field "
-                "at a time. To search over multiple text fields, create a "
-                "separate FTS index for each field."
-            )
-        if "." in field_names:
-            raise ValueError(
-                "Native FTS indexes can only be created on top-level fields. "
-                f"Received nested field path: {field_names!r}."
+            if tokenizer_name is None:
+                tokenizer_configs = {
+                    "base_tokenizer": base_tokenizer,
+                    "language": language,
+                    "with_position": with_position,
+                    "max_token_length": max_token_length,
+                    "lower_case": lower_case,
+                    "stem": stem,
+                    "remove_stop_words": remove_stop_words,
+                    "ascii_folding": ascii_folding,
+                    "ngram_min_length": ngram_min_length,
+                    "ngram_max_length": ngram_max_length,
+                    "prefix_only": prefix_only,
+                }
+            else:
+                tokenizer_configs = self.infer_tokenizer_configs(tokenizer_name)
+
+            config = FTS(
+                **tokenizer_configs,
            )

-        if tokenizer_name is None:
-            tokenizer_configs = {
-                "base_tokenizer": base_tokenizer,
-                "language": language,
-                "with_position": with_position,
-                "max_token_length": max_token_length,
-                "lower_case": lower_case,
-                "stem": stem,
-                "remove_stop_words": remove_stop_words,
-                "ascii_folding": ascii_folding,
-                "ngram_min_length": ngram_min_length,
-                "ngram_max_length": ngram_max_length,
-                "prefix_only": prefix_only,
-            }
-        else:
-            tokenizer_configs = self.infer_tokenizer_configs(tokenizer_name)
+            # delete the existing legacy index if it exists
+            if replace:
+                path, fs, exist = self._get_fts_index_path()
+                if exist:
+                    fs.delete_dir(path)

-        config = FTS(
-            **tokenizer_configs,
-        )
-
-        try:
            LOOP.run(
                self._table.create_index(
                    field_names,
@@ -2554,13 +2448,42 @@ class LanceTable(Table):
                    name=name,
                )
            )
-        except (ValueError, RuntimeError) as e:
-            _maybe_add_fts_error_note(
-                e,
-                base_tokenizer=config.base_tokenizer,
-                language=config.language,
+            return
+
+        from .fts import create_index, populate_index
+
+        if isinstance(field_names, str):
+            field_names = [field_names]
+
+        if isinstance(ordering_field_names, str):
+            ordering_field_names = [ordering_field_names]
+
+        path, fs, exist = self._get_fts_index_path()
+        if exist:
+            if not replace:
+                raise ValueError("Index already exists. Use replace=True to overwrite.")
+            fs.delete_dir(path)
+
+        if not isinstance(fs, pa_fs.LocalFileSystem):
+            raise NotImplementedError(
+                "Full-text search is only supported on the local filesystem"
            )
-            raise e
+
+        if tokenizer_name is None:
+            tokenizer_name = "default"
+        index = create_index(
+            path,
+            field_names,
+            ordering_fields=ordering_field_names,
+            tokenizer_name=tokenizer_name,
+        )
+        populate_index(
+            index,
+            self,
+            field_names,
+            ordering_fields=ordering_field_names,
+            writer_heap_size=writer_heap_size,
+        )

    @staticmethod
    def infer_tokenizer_configs(tokenizer_name: str) -> dict:
@@ -3006,7 +2929,6 @@ class LanceTable(Table):
                namespace_path=namespace_path,
                storage_options=storage_options,
                location=location,
-                namespace_client=namespace_client,
            )
        )
        return self
@@ -3890,18 +3812,7 @@ class AsyncTable:
        *,
        replace: Optional[bool] = None,
        config: Optional[
-            Union[
-                IvfFlat,
-                IvfPq,
-                IvfRq,
-                HnswPq,
-                HnswSq,
-                HnswFlat,
-                BTree,
-                Bitmap,
-                LabelList,
-                FTS,
-            ]
+            Union[IvfFlat, IvfPq, IvfRq, HnswPq, HnswSq, BTree, Bitmap, LabelList, FTS]
        ] = None,
        wait_timeout: Optional[timedelta] = None,
        name: Optional[str] = None,
@@ -3948,7 +3859,6 @@ class AsyncTable:
                    IvfRq,
                    HnswPq,
                    HnswSq,
-                    HnswFlat,
                    BTree,
                    Bitmap,
                    LabelList,
@@ -3968,13 +3878,11 @@ class AsyncTable:
                name=name,
                train=train,
            )
-        except (ValueError, RuntimeError) as e:
-            if isinstance(config, FTS):
-                _maybe_add_fts_error_note(
-                    e,
-                    base_tokenizer=config.base_tokenizer,
-                    language=config.language,
-                )
+        except ValueError as e:
+            if "not support the requested language" in str(e):
+                supported_langs = ", ".join(lang_mapping.values())
+                help_msg = f"Supported languages: {supported_langs}"
+                add_note(e, help_msg)
            raise e

    async def drop_index(self, name: str) -> None:
@@ -5119,7 +5027,6 @@ class IndexStatistics:
        "IVF_RQ",
        "IVF_HNSW_SQ",
        "IVF_HNSW_PQ",
-        "IVF_HNSW_FLAT",
        "FTS",
        "BTREE",
        "BITMAP",
--- a/python/python/lancedb/types.py
+++ b/python/python/lancedb/types.py
@@ -24,7 +24,6 @@ VectorIndexType = Literal[
    "IVF_PQ",
    "IVF_HNSW_SQ",
    "IVF_HNSW_PQ",
-    "IVF_HNSW_FLAT",
    "IVF_RQ",
 ]
 ScalarIndexType = Literal["BTREE", "BITMAP", "LABEL_LIST"]
@@ -32,7 +31,6 @@ IndexType = Literal[
    "IVF_PQ",
    "IVF_HNSW_PQ",
    "IVF_HNSW_SQ",
-    "IVF_HNSW_FLAT",
    "IVF_SQ",
    "FTS",
    "BTREE",
@@ -42,5 +40,4 @@ IndexType = Literal[
 ]

 # Tokenizer literals
-BuiltinTokenizerType = Literal["simple", "raw", "whitespace", "ngram"]
-BaseTokenizerType = BuiltinTokenizerType | str
+BaseTokenizerType = Literal["simple", "raw", "whitespace", "ngram"]
--- a/python/python/tests/docs/test_search.py
+++ b/python/python/tests/docs/test_search.py
@@ -180,7 +180,7 @@ def test_fts_fuzzy_query():
        ),
        mode="overwrite",
    )
-    table.create_fts_index("text", replace=True)
+    table.create_fts_index("text", use_tantivy=False, replace=True)

    results = table.search(MatchQuery("foo", "text", fuzziness=1)).to_pandas()
    assert len(results) == 4
@@ -230,7 +230,7 @@ def test_fts_boost_query():
        ),
        mode="overwrite",
    )
-    table.create_fts_index("desc", replace=True)
+    table.create_fts_index("desc", use_tantivy=False, replace=True)

    results = table.search(
        BoostQuery(
@@ -265,7 +265,7 @@ def test_fts_boolean_query(tmp_path):
        ],
        mode="overwrite",
    )
-    table.create_fts_index("text", replace=True)
+    table.create_fts_index("text", use_tantivy=False, replace=True)

    # SHOULD
    results = table.search(
@@ -319,7 +319,9 @@ def test_fts_native():
        ],
    )

-    table.create_fts_index("text")
+    # pass `use_tantivy=False` to use the native Lance FTS index
+    # (`False` is also the documented default value of `use_tantivy`)
+    table.create_fts_index("text", use_tantivy=False)
    table.search("puppy").limit(10).select(["text"]).to_list()
    # [{'text': 'Frodo was a happy puppy', '_score': 0.6931471824645996}]
    # ...
@@ -330,6 +332,7 @@ def test_fts_native():
    # --8<-- [start:fts_config_folding]
    table.create_fts_index(
        "text",
+        use_tantivy=False,
        language="French",
        stem=True,
        ascii_folding=True,
@@ -343,7 +346,7 @@ def test_fts_native():
    table.search("puppy").limit(10).where("text='foo'", prefilter=False).to_list()
    # --8<-- [end:fts_postfiltering]
    # --8<-- [start:fts_with_position]
-    table.create_fts_index("text", with_position=True, replace=True)
+    table.create_fts_index("text", use_tantivy=False, with_position=True, replace=True)
    # --8<-- [end:fts_with_position]
    # --8<-- [start:fts_incremental_index]
    table.add([{"vector": [3.1, 4.1], "text": "Frodo was a happy puppy"}])
--- a/Show More
+++ b/Show More