Compare commits

...

1 Commits

Author SHA1 Message Date
Vlad Lazar
89231e3f99 storcon: squash all migrations into one
Problem

Neon and Hadron deployments have the same database schema, but different
migration histories. Some transactions have different identifiers too.
If we don't do anything about it, then the storage controller would fail
to apply the merged set of transactions.

Summary of Changes

We squash all migrations into a single one. If the schema already
matches, then the new transaction gets applie without doing anything.
For new regions, this migration will bootstrap the database schema.

This should be merged in both neon and hadron codebases.

Note that after deploying this change, the `__diesel_schema_migrations`
table will still contain entries for the old pre-squash transactions.
This is fine because diesel only considers the tranasactions embedded
in the repo for application. Once we are certain that we are not going
to roll back, we can clean up the `__diesel_schema_migrations` tables in
prod, but this is manual and error prone, so I'd skip it.

Rolling back

Rolling back to a previous deployment which embeds the non-squashed
transactions is safe. The old transactions are still present in
`__diesel_schema_migrations` (i.e. considered applied), so no migrations
will be run, so no migrations will be run.

Note that this assumes that all transactions are applied and squashed into
the new migration before deployment.
2025-07-31 13:39:27 +01:00
50 changed files with 122 additions and 160 deletions

View File

@@ -1 +0,0 @@
DROP TABLE tenant_shards;

View File

@@ -1,13 +0,0 @@
CREATE TABLE tenant_shards (
tenant_id VARCHAR NOT NULL,
shard_number INTEGER NOT NULL,
shard_count INTEGER NOT NULL,
PRIMARY KEY(tenant_id, shard_number, shard_count),
shard_stripe_size INTEGER NOT NULL,
generation INTEGER NOT NULL,
generation_pageserver BIGINT NOT NULL,
placement_policy VARCHAR NOT NULL,
splitting SMALLINT NOT NULL,
-- config is JSON encoded, opaque to the database.
config TEXT NOT NULL
);

View File

@@ -1 +0,0 @@
DROP TABLE nodes;

View File

@@ -1,10 +0,0 @@
CREATE TABLE nodes (
node_id BIGINT PRIMARY KEY NOT NULL,
scheduling_policy VARCHAR NOT NULL,
listen_http_addr VARCHAR NOT NULL,
listen_http_port INTEGER NOT NULL,
listen_pg_addr VARCHAR NOT NULL,
listen_pg_port INTEGER NOT NULL
);

View File

@@ -1,2 +0,0 @@
ALTER TABLE tenant_shards ALTER generation SET NOT NULL;
ALTER TABLE tenant_shards ALTER generation_pageserver SET NOT NULL;

View File

@@ -1,4 +0,0 @@
ALTER TABLE tenant_shards ALTER generation DROP NOT NULL;
ALTER TABLE tenant_shards ALTER generation_pageserver DROP NOT NULL;

View File

@@ -1,3 +0,0 @@
UPDATE tenant_shards set placement_policy='{"Double": 1}' where placement_policy='{"Attached": 1}';
UPDATE tenant_shards set placement_policy='"Single"' where placement_policy='{"Attached": 0}';

View File

@@ -1,3 +0,0 @@
UPDATE tenant_shards set placement_policy='{"Attached": 1}' where placement_policy='{"Double": 1}';
UPDATE tenant_shards set placement_policy='{"Attached": 0}' where placement_policy='"Single"';

View File

@@ -1,3 +0,0 @@
-- This file should undo anything in `up.sql`
ALTER TABLE tenant_shards drop scheduling_policy;

View File

@@ -1,2 +0,0 @@
ALTER TABLE tenant_shards add scheduling_policy VARCHAR NOT NULL DEFAULT '"Active"';

View File

@@ -1 +0,0 @@
DROP TABLE metadata_health;

View File

@@ -1,14 +0,0 @@
CREATE TABLE metadata_health (
tenant_id VARCHAR NOT NULL,
shard_number INTEGER NOT NULL,
shard_count INTEGER NOT NULL,
PRIMARY KEY(tenant_id, shard_number, shard_count),
-- Rely on cascade behavior for delete
FOREIGN KEY(tenant_id, shard_number, shard_count) REFERENCES tenant_shards ON DELETE CASCADE,
healthy BOOLEAN NOT NULL DEFAULT TRUE,
last_scrubbed_at TIMESTAMPTZ NOT NULL DEFAULT NOW()
);
INSERT INTO metadata_health(tenant_id, shard_number, shard_count)
SELECT tenant_id, shard_number, shard_count FROM tenant_shards;

View File

@@ -1 +0,0 @@
DROP TABLE controllers;

View File

@@ -1,5 +0,0 @@
CREATE TABLE controllers (
address VARCHAR NOT NULL,
started_at TIMESTAMPTZ NOT NULL,
PRIMARY KEY(address, started_at)
);

View File

@@ -1,2 +0,0 @@
-- This file should undo anything in `up.sql`
DROP TABLE safekeepers;

View File

@@ -1,15 +0,0 @@
-- started out as a copy of cplane schema, removed the unnecessary columns.
CREATE TABLE safekeepers (
-- the surrogate identifier defined by control plane database sequence
id BIGINT PRIMARY KEY,
region_id TEXT NOT NULL,
version BIGINT NOT NULL,
-- the natural id on whatever cloud platform, not needed in storage controller
-- instance_id TEXT UNIQUE NOT NULL,
host TEXT NOT NULL,
port INTEGER NOT NULL,
active BOOLEAN NOT NULL DEFAULT false,
-- projects_count INTEGER NOT NULL DEFAULT 0,
http_port INTEGER NOT NULL,
availability_zone_id TEXT NOT NULL
);

View File

@@ -1,2 +0,0 @@
-- This file should undo anything in `up.sql`
DROP INDEX tenant_shards_tenant_id;

View File

@@ -1,2 +0,0 @@
-- Your SQL goes here
CREATE INDEX tenant_shards_tenant_id ON tenant_shards (tenant_id);

View File

@@ -1 +0,0 @@
ALTER TABLE nodes DROP availability_zone_id;

View File

@@ -1 +0,0 @@
ALTER TABLE nodes ADD availability_zone_id VARCHAR;

View File

@@ -1 +0,0 @@
ALTER TABLE nodes ALTER availability_zone_id DROP NOT NULL;

View File

@@ -1 +0,0 @@
ALTER TABLE nodes ALTER availability_zone_id SET NOT NULL;

View File

@@ -1 +0,0 @@
ALTER TABLE tenant_shards DROP preferred_az_id;

View File

@@ -1 +0,0 @@
ALTER TABLE tenant_shards ADD preferred_az_id VARCHAR;

View File

@@ -1 +0,0 @@
ALTER TABLE safekeepers DROP scheduling_policy;

View File

@@ -1 +0,0 @@
ALTER TABLE safekeepers ADD scheduling_policy VARCHAR NOT NULL DEFAULT 'disabled';

View File

@@ -1,4 +0,0 @@
-- this sadly isn't a "true" revert of the migration, as the column is now at the end of the table.
-- But preserving order is not a trivial operation.
-- https://wiki.postgresql.org/wiki/Alter_column_position
ALTER TABLE safekeepers ADD active BOOLEAN NOT NULL DEFAULT false;

View File

@@ -1 +0,0 @@
ALTER TABLE safekeepers DROP active;

View File

@@ -1,2 +0,0 @@
ALTER TABLE safekeepers ALTER COLUMN scheduling_policy SET DEFAULT 'disabled';
UPDATE safekeepers SET scheduling_policy = 'disabled' WHERE scheduling_policy = 'pause';

View File

@@ -1,2 +0,0 @@
ALTER TABLE safekeepers ALTER COLUMN scheduling_policy SET DEFAULT 'pause';
UPDATE safekeepers SET scheduling_policy = 'pause' WHERE scheduling_policy = 'disabled';

View File

@@ -1 +0,0 @@
ALTER TABLE nodes DROP listen_https_port;

View File

@@ -1 +0,0 @@
ALTER TABLE nodes ADD listen_https_port INTEGER;

View File

@@ -1,2 +0,0 @@
DROP TABLE timelines;
DROP TABLE safekeeper_timeline_pending_ops;

View File

@@ -1,19 +0,0 @@
CREATE TABLE timelines (
tenant_id VARCHAR NOT NULL,
timeline_id VARCHAR NOT NULL,
start_lsn pg_lsn NOT NULL,
generation INTEGER NOT NULL,
sk_set BIGINT[] NOT NULL,
new_sk_set BIGINT[],
cplane_notified_generation INTEGER NOT NULL,
deleted_at timestamptz,
PRIMARY KEY(tenant_id, timeline_id)
);
CREATE TABLE safekeeper_timeline_pending_ops (
sk_id BIGINT NOT NULL,
tenant_id VARCHAR NOT NULL,
timeline_id VARCHAR NOT NULL,
generation INTEGER NOT NULL,
op_kind VARCHAR NOT NULL,
PRIMARY KEY(tenant_id, timeline_id, sk_id)
);

View File

@@ -1 +0,0 @@
ALTER TABLE safekeepers DROP https_port;

View File

@@ -1 +0,0 @@
ALTER TABLE safekeepers ADD https_port INTEGER;

View File

@@ -1 +0,0 @@
DROP TABLE timeline_imports;

View File

@@ -1,6 +0,0 @@
CREATE TABLE timeline_imports (
tenant_id VARCHAR NOT NULL,
timeline_id VARCHAR NOT NULL,
shard_statuses JSONB NOT NULL,
PRIMARY KEY(tenant_id, timeline_id)
);

View File

@@ -1 +0,0 @@
ALTER TABLE nodes DROP COLUMN lifecycle;

View File

@@ -1 +0,0 @@
ALTER TABLE nodes ADD COLUMN lifecycle VARCHAR NOT NULL DEFAULT 'active';

View File

@@ -1 +0,0 @@
ALTER TABLE nodes DROP listen_grpc_addr, listen_grpc_port;

View File

@@ -1 +0,0 @@
ALTER TABLE nodes ADD listen_grpc_addr VARCHAR NULL, ADD listen_grpc_port INTEGER NULL;

View File

@@ -1 +0,0 @@
ALTER TABLE safekeepers ALTER COLUMN scheduling_policy SET DEFAULT 'pause';

View File

@@ -1 +0,0 @@
ALTER TABLE safekeepers ALTER COLUMN scheduling_policy SET DEFAULT 'activating';

View File

@@ -1 +0,0 @@
ALTER TABLE timelines DROP sk_set_notified_generation;

View File

@@ -1 +0,0 @@
ALTER TABLE timelines ADD sk_set_notified_generation INTEGER NOT NULL DEFAULT 1;

View File

@@ -1,2 +0,0 @@
DROP TABLE hadron_safekeepers;
DROP TABLE hadron_timeline_safekeepers;

View File

@@ -1,17 +0,0 @@
-- hadron_safekeepers keep track of all Safe Keeper nodes that exist in the system.
-- Upon startup, each Safe Keeper reaches out to the hadron cluster coordinator to register its node ID and listen addresses.
CREATE TABLE hadron_safekeepers (
sk_node_id BIGINT PRIMARY KEY NOT NULL,
listen_http_addr VARCHAR NOT NULL,
listen_http_port INTEGER NOT NULL,
listen_pg_addr VARCHAR NOT NULL,
listen_pg_port INTEGER NOT NULL
);
CREATE TABLE hadron_timeline_safekeepers (
timeline_id VARCHAR NOT NULL,
sk_node_id BIGINT NOT NULL,
legacy_endpoint_id UUID DEFAULT NULL,
PRIMARY KEY(timeline_id, sk_node_id)
);

View File

@@ -0,0 +1,10 @@
DROP TABLE IF EXISTS timelines CASCADE;
DROP TABLE IF EXISTS timeline_imports CASCADE;
DROP TABLE IF EXISTS tenant_shards CASCADE;
DROP TABLE IF EXISTS safekeepers CASCADE;
DROP TABLE IF EXISTS safekeeper_timeline_pending_ops CASCADE;
DROP TABLE IF EXISTS nodes CASCADE;
DROP TABLE IF EXISTS metadata_health CASCADE;
DROP TABLE IF EXISTS hadron_timeline_safekeepers CASCADE;
DROP TABLE IF EXISTS hadron_safekeepers CASCADE;
DROP TABLE IF EXISTS controllers CASCADE;

View File

@@ -0,0 +1,112 @@
/*
* This migration squashes all previous migrations into a single one.
* It will be applied in two cases:
* 1. Spinning up a new region. There's no previous migrations apart from the diesel setup in this case
* 2. For existing regions.
*
* Hence, this migration does nothing if the schema is already up to date.
*/
CREATE TABLE IF NOT EXISTS controllers (
address character varying NOT NULL,
started_at timestamp with time zone NOT NULL,
PRIMARY KEY(address, started_at)
);
CREATE TABLE IF NOT EXISTS hadron_safekeepers (
sk_node_id bigint PRIMARY KEY NOT NULL,
listen_http_addr character varying NOT NULL,
listen_http_port integer NOT NULL,
listen_pg_addr character varying NOT NULL,
listen_pg_port integer NOT NULL
);
CREATE TABLE IF NOT EXISTS hadron_timeline_safekeepers (
timeline_id character varying NOT NULL,
sk_node_id bigint NOT NULL,
legacy_endpoint_id uuid,
PRIMARY KEY(timeline_id, sk_node_id)
);
CREATE TABLE IF NOT EXISTS tenant_shards (
tenant_id character varying NOT NULL,
shard_number integer NOT NULL,
shard_count integer NOT NULL,
PRIMARY KEY(tenant_id, shard_number, shard_count),
shard_stripe_size integer NOT NULL,
generation integer,
generation_pageserver bigint,
placement_policy character varying NOT NULL,
splitting smallint NOT NULL,
config text NOT NULL,
scheduling_policy character varying DEFAULT '"Active"'::character varying NOT NULL,
preferred_az_id character varying
);
CREATE INDEX IF NOT EXISTS tenant_shards_tenant_id ON tenant_shards USING btree (tenant_id);
CREATE TABLE IF NOT EXISTS metadata_health (
tenant_id character varying NOT NULL,
shard_number integer NOT NULL,
shard_count integer NOT NULL,
PRIMARY KEY(tenant_id, shard_number, shard_count),
-- Rely on cascade behavior for delete
FOREIGN KEY(tenant_id, shard_number, shard_count) REFERENCES tenant_shards ON DELETE CASCADE,
healthy boolean DEFAULT true NOT NULL,
last_scrubbed_at timestamp with time zone DEFAULT now() NOT NULL
);
CREATE TABLE IF NOT EXISTS nodes (
node_id bigint PRIMARY KEY NOT NULL,
scheduling_policy character varying NOT NULL,
listen_http_addr character varying NOT NULL,
listen_http_port integer NOT NULL,
listen_pg_addr character varying NOT NULL,
listen_pg_port integer NOT NULL,
availability_zone_id character varying NOT NULL,
listen_https_port integer,
lifecycle character varying DEFAULT 'active'::character varying NOT NULL,
listen_grpc_addr character varying,
listen_grpc_port integer
);
CREATE TABLE IF NOT EXISTS safekeeper_timeline_pending_ops (
sk_id bigint NOT NULL,
tenant_id character varying NOT NULL,
timeline_id character varying NOT NULL,
generation integer NOT NULL,
op_kind character varying NOT NULL,
PRIMARY KEY(tenant_id, timeline_id, sk_id)
);
CREATE TABLE IF NOT EXISTS safekeepers (
id bigint PRIMARY KEY NOT NULL,
region_id text NOT NULL,
version bigint NOT NULL,
host text NOT NULL,
port integer NOT NULL,
http_port integer NOT NULL,
availability_zone_id text NOT NULL,
scheduling_policy character varying DEFAULT 'activating'::character varying NOT NULL,
https_port integer
);
CREATE TABLE IF NOT EXISTS timeline_imports (
tenant_id character varying NOT NULL,
timeline_id character varying NOT NULL,
shard_statuses jsonb NOT NULL,
PRIMARY KEY(tenant_id, timeline_id)
);
CREATE TABLE IF NOT EXISTS timelines (
tenant_id character varying NOT NULL,
timeline_id character varying NOT NULL,
start_lsn pg_lsn NOT NULL,
generation integer NOT NULL,
sk_set bigint[] NOT NULL,
new_sk_set bigint[],
cplane_notified_generation integer NOT NULL,
deleted_at timestamp with time zone,
sk_set_notified_generation integer DEFAULT 1 NOT NULL,
PRIMARY KEY(tenant_id, timeline_id)
);