mirror of
https://github.com/neondatabase/neon.git
synced 2026-01-08 14:02:55 +00:00
by binding sockets before daemonization. Also use less annoying error reporting by not printing full error messages for connect errors in the first several connection retries. Closes #507.
272 lines
8.1 KiB
Rust
272 lines
8.1 KiB
Rust
use std::io::Write;
|
|
use std::net::TcpStream;
|
|
use std::path::PathBuf;
|
|
use std::process::Command;
|
|
use std::time::Duration;
|
|
use std::{io, thread};
|
|
|
|
use anyhow::{anyhow, bail, Result};
|
|
use nix::sys::signal::{kill, Signal};
|
|
use nix::unistd::Pid;
|
|
use pageserver::http::models::{BranchCreateRequest, TenantCreateRequest};
|
|
use postgres::{Config, NoTls};
|
|
use reqwest::blocking::{Client, RequestBuilder};
|
|
use reqwest::{IntoUrl, Method};
|
|
use zenith_utils::postgres_backend::AuthType;
|
|
use zenith_utils::zid::ZTenantId;
|
|
|
|
use crate::local_env::LocalEnv;
|
|
use crate::read_pidfile;
|
|
use pageserver::branches::BranchInfo;
|
|
use zenith_utils::connstring::connection_address;
|
|
|
|
// Base URL that `PageServerNode::from_env` stores in `http_base_url`; the HTTP
// helper methods append endpoint paths such as "status" or "tenant" to it.
const HTTP_BASE_URL: &str = "http://127.0.0.1:9898/v1";
|
|
|
|
//
|
|
// Control routines for pageserver.
|
|
//
|
|
// Used in CLI and tests.
|
|
//
|
|
#[derive(Debug)]
|
|
pub struct PageServerNode {
|
|
pub kill_on_exit: bool,
|
|
pub pg_connection_config: Config,
|
|
pub env: LocalEnv,
|
|
pub http_client: Client,
|
|
pub http_base_url: String,
|
|
}
|
|
|
|
impl PageServerNode {
|
|
pub fn from_env(env: &LocalEnv) -> PageServerNode {
|
|
let password = if env.auth_type == AuthType::ZenithJWT {
|
|
&env.auth_token
|
|
} else {
|
|
""
|
|
};
|
|
|
|
PageServerNode {
|
|
kill_on_exit: false,
|
|
pg_connection_config: Self::default_config(password), // default
|
|
env: env.clone(),
|
|
http_client: Client::new(),
|
|
http_base_url: HTTP_BASE_URL.to_owned(),
|
|
}
|
|
}
|
|
|
|
fn default_config(password: &str) -> Config {
|
|
format!("postgresql://no_user:{}@localhost:64000/no_db", password)
|
|
.parse()
|
|
.unwrap()
|
|
}
|
|
|
|
pub fn init(&self, create_tenant: Option<&str>, enable_auth: bool) -> Result<()> {
|
|
let mut cmd = Command::new(self.env.pageserver_bin()?);
|
|
let mut args = vec![
|
|
"--init",
|
|
"-D",
|
|
self.env.base_data_dir.to_str().unwrap(),
|
|
"--postgres-distrib",
|
|
self.env.pg_distrib_dir.to_str().unwrap(),
|
|
];
|
|
|
|
if enable_auth {
|
|
args.extend(&["--auth-validation-public-key-path", "auth_public_key.pem"]);
|
|
args.extend(&["--auth-type", "ZenithJWT"]);
|
|
}
|
|
|
|
if let Some(tenantid) = create_tenant {
|
|
args.extend(&["--create-tenant", tenantid])
|
|
}
|
|
|
|
let status = cmd
|
|
.args(args)
|
|
.env_clear()
|
|
.env("RUST_BACKTRACE", "1")
|
|
.status()
|
|
.expect("pageserver init failed");
|
|
|
|
if status.success() {
|
|
Ok(())
|
|
} else {
|
|
Err(anyhow!("pageserver init failed"))
|
|
}
|
|
}
|
|
|
|
pub fn repo_path(&self) -> PathBuf {
|
|
self.env.pageserver_data_dir()
|
|
}
|
|
|
|
pub fn pid_file(&self) -> PathBuf {
|
|
self.repo_path().join("pageserver.pid")
|
|
}
|
|
|
|
pub fn start(&self) -> Result<()> {
|
|
print!(
|
|
"Starting pageserver at '{}' in '{}'",
|
|
connection_address(&self.pg_connection_config),
|
|
self.repo_path().display()
|
|
);
|
|
io::stdout().flush().unwrap();
|
|
|
|
let mut cmd = Command::new(self.env.pageserver_bin()?);
|
|
cmd.args(&["-D", self.repo_path().to_str().unwrap()])
|
|
.arg("-d")
|
|
.env_clear()
|
|
.env("RUST_BACKTRACE", "1");
|
|
|
|
if !cmd.status()?.success() {
|
|
bail!(
|
|
"Pageserver failed to start. See '{}' for details.",
|
|
self.repo_path().join("pageserver.log").display()
|
|
);
|
|
}
|
|
|
|
// It takes a while for the page server to start up. Wait until it is
|
|
// open for business.
|
|
const RETRIES: i8 = 15;
|
|
for retries in 1..RETRIES {
|
|
match self.check_status() {
|
|
Ok(_) => {
|
|
println!("\nPageserver started");
|
|
return Ok(());
|
|
}
|
|
Err(err) => {
|
|
if err.is_connect() && retries < 5 {
|
|
print!(".");
|
|
io::stdout().flush().unwrap();
|
|
} else {
|
|
if retries == 5 {
|
|
print!("\n") // put a line break after dots for second message
|
|
}
|
|
println!(
|
|
"Pageserver not responding yet, err {} retrying ({})...",
|
|
err, retries
|
|
);
|
|
}
|
|
thread::sleep(Duration::from_secs(1));
|
|
}
|
|
}
|
|
}
|
|
bail!("pageserver failed to start in {} seconds", RETRIES);
|
|
}
|
|
|
|
pub fn stop(&self) -> Result<()> {
|
|
let pid = read_pidfile(&self.pid_file())?;
|
|
let pid = Pid::from_raw(pid);
|
|
if kill(pid, Signal::SIGTERM).is_err() {
|
|
bail!("Failed to kill pageserver with pid {}", pid);
|
|
}
|
|
|
|
// wait for pageserver stop
|
|
let address = connection_address(&self.pg_connection_config);
|
|
for _ in 0..5 {
|
|
let stream = TcpStream::connect(&address);
|
|
thread::sleep(Duration::from_secs(1));
|
|
if let Err(_e) = stream {
|
|
println!("Pageserver stopped");
|
|
return Ok(());
|
|
}
|
|
println!("Stopping pageserver on {}", address);
|
|
}
|
|
|
|
bail!("Failed to stop pageserver with pid {}", pid);
|
|
}
|
|
|
|
pub fn page_server_psql(&self, sql: &str) -> Vec<postgres::SimpleQueryMessage> {
|
|
let mut client = self.pg_connection_config.connect(NoTls).unwrap();
|
|
|
|
println!("Pageserver query: '{}'", sql);
|
|
client.simple_query(sql).unwrap()
|
|
}
|
|
|
|
pub fn page_server_psql_client(&self) -> Result<postgres::Client, postgres::Error> {
|
|
self.pg_connection_config.connect(NoTls)
|
|
}
|
|
|
|
fn http_request<U: IntoUrl>(&self, method: Method, url: U) -> RequestBuilder {
|
|
let mut builder = self.http_client.request(method, url);
|
|
if self.env.auth_type == AuthType::ZenithJWT {
|
|
builder = builder.bearer_auth(&self.env.auth_token)
|
|
}
|
|
builder
|
|
}
|
|
|
|
pub fn check_status(&self) -> reqwest::Result<()> {
|
|
self.http_request(Method::GET, format!("{}/{}", self.http_base_url, "status"))
|
|
.send()?
|
|
.error_for_status()?;
|
|
Ok(())
|
|
}
|
|
|
|
pub fn tenant_list(&self) -> reqwest::Result<Vec<String>> {
|
|
Ok(self
|
|
.http_request(Method::GET, format!("{}/{}", self.http_base_url, "tenant"))
|
|
.send()?
|
|
.error_for_status()?
|
|
.json()?)
|
|
}
|
|
|
|
pub fn tenant_create(&self, tenantid: ZTenantId) -> reqwest::Result<()> {
|
|
Ok(self
|
|
.http_request(Method::POST, format!("{}/{}", self.http_base_url, "tenant"))
|
|
.json(&TenantCreateRequest {
|
|
tenant_id: tenantid,
|
|
})
|
|
.send()?
|
|
.error_for_status()?
|
|
.json()?)
|
|
}
|
|
|
|
pub fn branch_list(&self, tenantid: &ZTenantId) -> reqwest::Result<Vec<BranchInfo>> {
|
|
Ok(self
|
|
.http_request(
|
|
Method::GET,
|
|
format!("{}/branch/{}", self.http_base_url, tenantid),
|
|
)
|
|
.send()?
|
|
.error_for_status()?
|
|
.json()?)
|
|
}
|
|
|
|
pub fn branch_create(
|
|
&self,
|
|
branch_name: &str,
|
|
startpoint: &str,
|
|
tenantid: &ZTenantId,
|
|
) -> reqwest::Result<BranchInfo> {
|
|
Ok(self
|
|
.http_request(Method::POST, format!("{}/branch", self.http_base_url))
|
|
.json(&BranchCreateRequest {
|
|
tenant_id: tenantid.to_owned(),
|
|
name: branch_name.to_owned(),
|
|
start_point: startpoint.to_owned(),
|
|
})
|
|
.send()?
|
|
.error_for_status()?
|
|
.json()?)
|
|
}
|
|
|
|
pub fn branch_get_by_name(
|
|
&self,
|
|
tenantid: &ZTenantId,
|
|
branch_name: &str,
|
|
) -> Result<BranchInfo> {
|
|
Ok(self
|
|
.http_request(
|
|
Method::GET,
|
|
format!("{}/branch/{}/{}", self.http_base_url, tenantid, branch_name),
|
|
)
|
|
.send()?
|
|
.error_for_status()?
|
|
.json()?)
|
|
}
|
|
}
|
|
|
|
impl Drop for PageServerNode {
|
|
fn drop(&mut self) {
|
|
if self.kill_on_exit {
|
|
let _ = self.stop();
|
|
}
|
|
}
|
|
}
|