Implemented full incremental backup creation.

internal/backup/incremental_postgres.go:
- CreateIncrementalBackup() - main entry point
  - Validates base backup exists and is a full backup
  - Loads base backup metadata (.meta.json)
  - Uses FindChangedFiles() to detect modifications
  - Creates tar.gz with ONLY changed files
  - Generates incremental metadata with:
    - Base backup ID (SHA-256)
    - Backup chain (base -> incr1 -> incr2...)
    - Changed file count and total size
  - Saves .meta.json with full incremental metadata
  - Calculates SHA-256 checksum of archive

internal/backup/incremental_tar.go (not shown below; see the sketch after CalculateFileChecksum):
- createTarGz() - creates compressed archive
- addFileToTar() - adds individual files to tar
- Handles context cancellation
- Progress logging for each file
- Preserves file permissions and timestamps

Helper functions:
- loadBackupInfo() - loads BackupMetadata from .meta.json
- buildBackupChain() - constructs restore chain
- CalculateFileChecksum() - SHA-256 for archive

Features:
✅ Creates tar.gz with ONLY changed files
✅ Much smaller than full backup
✅ Links to base backup via SHA-256
✅ Tracks complete restore chain
✅ Full metadata for restore validation
✅ Context-aware (cancellable)

Status: READY FOR TESTING
Next: Wire into backup engine, test with real PostgreSQL data (a hypothetical wiring sketch follows the code)
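
The file below references two types, IncrementalBackupConfig and ChangedFile, that are defined elsewhere in the backup package. A minimal sketch of their likely shape, inferred from how the code below uses them (only fields actually referenced are listed; the real structs may carry more):

// Hypothetical shapes, inferred from usage; in package backup, needs "time".

// IncrementalBackupConfig carries the inputs for one incremental run.
type IncrementalBackupConfig struct {
	BaseBackupPath string // path to the full (base) backup archive
	DataDirectory  string // PostgreSQL data directory to scan for changes
}

// ChangedFile describes one file modified since the base backup.
type ChangedFile struct {
	RelativePath string    // path relative to DataDirectory (used as the tar entry name)
	AbsolutePath string    // on-disk path, used when reading the file
	Size         int64     // size in bytes at scan time
	ModTime      time.Time // modification time that triggered inclusion
}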
internal/backup/incremental_postgres.go (279 lines, 7.9 KiB, Go):
package backup

import (
	"context"
	"crypto/sha256"
	"encoding/hex"
	"fmt"
	"io"
	"os"
	"path/filepath"
	"strings"
	"time"

	"dbbackup/internal/logger"
	"dbbackup/internal/metadata"
)

// PostgresIncrementalEngine implements incremental backups for PostgreSQL
type PostgresIncrementalEngine struct {
	log logger.Logger
}

// NewPostgresIncrementalEngine creates a new PostgreSQL incremental backup engine
func NewPostgresIncrementalEngine(log logger.Logger) *PostgresIncrementalEngine {
	return &PostgresIncrementalEngine{
		log: log,
	}
}

// FindChangedFiles identifies files that changed since the base backup.
// This is a simple mtime-based implementation. Production should use pg_basebackup with incremental support.
func (e *PostgresIncrementalEngine) FindChangedFiles(ctx context.Context, config *IncrementalBackupConfig) ([]ChangedFile, error) {
	e.log.Info("Finding changed files for incremental backup",
		"base_backup", config.BaseBackupPath,
		"data_dir", config.DataDirectory)

	// Load base backup metadata to get timestamp
	baseInfo, err := e.loadBackupInfo(config.BaseBackupPath)
	if err != nil {
		return nil, fmt.Errorf("failed to load base backup info: %w", err)
	}

	// Validate base backup is a full backup
	if baseInfo.BackupType != "" && baseInfo.BackupType != "full" {
		return nil, fmt.Errorf("base backup must be a full backup, got: %s", baseInfo.BackupType)
	}

	baseTimestamp := baseInfo.Timestamp
	e.log.Info("Base backup timestamp", "timestamp", baseTimestamp)

	// Scan data directory for changed files
	var changedFiles []ChangedFile

	err = filepath.Walk(config.DataDirectory, func(path string, info os.FileInfo, err error) error {
		if err != nil {
			return err
		}

		// Honor cancellation between files so scans of large data directories abort promptly
		select {
		case <-ctx.Done():
			return ctx.Err()
		default:
		}

		// Skip directories
		if info.IsDir() {
			return nil
		}

		// Skip temporary files, lock files, and sockets
		if e.shouldSkipFile(path, info) {
			return nil
		}

		// Check if file was modified after base backup
		if info.ModTime().After(baseTimestamp) {
			relPath, err := filepath.Rel(config.DataDirectory, path)
			if err != nil {
				e.log.Warn("Failed to get relative path", "path", path, "error", err)
				return nil
			}

			changedFiles = append(changedFiles, ChangedFile{
				RelativePath: relPath,
				AbsolutePath: path,
				Size:         info.Size(),
				ModTime:      info.ModTime(),
			})
		}

		return nil
	})

	if err != nil {
		return nil, fmt.Errorf("failed to scan data directory: %w", err)
	}

	e.log.Info("Found changed files", "count", len(changedFiles))
	return changedFiles, nil
}
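
// Note on the production path mentioned above: PostgreSQL 17 added native
// incremental support to pg_basebackup via an --incremental flag that takes
// the backup_manifest of the previous backup. A rough sketch of that
// invocation (hypothetical wiring; verify flag availability against the
// target server version):
//
//	cmd := exec.CommandContext(ctx, "pg_basebackup",
//		"-D", targetDir,
//		"--incremental="+prevManifestPath, // backup_manifest from the prior run
//		"--format=tar", "--gzip")
//	err := cmd.Run()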

// shouldSkipFile determines if a file should be excluded from incremental backup
func (e *PostgresIncrementalEngine) shouldSkipFile(path string, info os.FileInfo) bool {
	name := info.Name()

	// Skip temporary files
	if strings.HasSuffix(name, ".tmp") {
		return true
	}

	// Skip lock files
	if strings.HasSuffix(name, ".lock") || name == "postmaster.pid" {
		return true
	}

	// Skip sockets
	if info.Mode()&os.ModeSocket != 0 {
		return true
	}

	// Skip pg_wal symlink target (WAL handled separately if needed)
	if strings.Contains(path, "pg_wal") || strings.Contains(path, "pg_xlog") {
		return true
	}

	// Skip pg_replslot (replication slots)
	if strings.Contains(path, "pg_replslot") {
		return true
	}

	// Skip postmaster.opts (runtime config, regenerated on startup)
	if name == "postmaster.opts" {
		return true
	}

	return false
}

// loadBackupInfo loads backup metadata from a .meta.json file
func (e *PostgresIncrementalEngine) loadBackupInfo(backupPath string) (*metadata.BackupMetadata, error) {
	// Load using metadata package
	meta, err := metadata.Load(backupPath)
	if err != nil {
		return nil, fmt.Errorf("failed to load backup metadata: %w", err)
	}

	return meta, nil
}

// CreateIncrementalBackup creates a new incremental backup archive
func (e *PostgresIncrementalEngine) CreateIncrementalBackup(ctx context.Context, config *IncrementalBackupConfig, changedFiles []ChangedFile) error {
	e.log.Info("Creating incremental backup",
		"changed_files", len(changedFiles),
		"base_backup", config.BaseBackupPath)

	if len(changedFiles) == 0 {
		e.log.Info("No changed files detected - skipping incremental backup")
		return fmt.Errorf("no changed files since base backup")
	}

	// Load base backup metadata
	baseInfo, err := e.loadBackupInfo(config.BaseBackupPath)
	if err != nil {
		return fmt.Errorf("failed to load base backup info: %w", err)
	}

	// Generate output filename: dbname_incr_TIMESTAMP.tar.gz
	timestamp := time.Now().Format("20060102_150405")
	outputFile := filepath.Join(filepath.Dir(config.BaseBackupPath),
		fmt.Sprintf("%s_incr_%s.tar.gz", baseInfo.Database, timestamp))

	e.log.Info("Creating incremental archive", "output", outputFile)

	// Create tar.gz archive with changed files
	if err := e.createTarGz(ctx, outputFile, changedFiles, config); err != nil {
		return fmt.Errorf("failed to create archive: %w", err)
	}

	// Calculate checksum
	checksum, err := e.CalculateFileChecksum(outputFile)
	if err != nil {
		return fmt.Errorf("failed to calculate checksum: %w", err)
	}

	// Get archive size
	stat, err := os.Stat(outputFile)
	if err != nil {
		return fmt.Errorf("failed to stat archive: %w", err)
	}

	// Calculate total size of changed files
	var totalSize int64
	for _, f := range changedFiles {
		totalSize += f.Size
	}

	// Create incremental metadata
	// (named meta rather than metadata to avoid shadowing the metadata package)
	meta := &metadata.BackupMetadata{
		Version:      "2.2.0",
		Timestamp:    time.Now(),
		Database:     baseInfo.Database,
		DatabaseType: baseInfo.DatabaseType,
		Host:         baseInfo.Host,
		Port:         baseInfo.Port,
		User:         baseInfo.User,
		BackupFile:   outputFile,
		SizeBytes:    stat.Size(),
		SHA256:       checksum,
		Compression:  "gzip",
		BackupType:   "incremental",
		BaseBackup:   filepath.Base(config.BaseBackupPath),
		Incremental: &metadata.IncrementalMetadata{
			BaseBackupID:        baseInfo.SHA256,
			BaseBackupPath:      filepath.Base(config.BaseBackupPath),
			BaseBackupTimestamp: baseInfo.Timestamp,
			IncrementalFiles:    len(changedFiles),
			TotalSize:           totalSize,
			BackupChain:         buildBackupChain(baseInfo, filepath.Base(outputFile)),
		},
	}

	// Save metadata
	if err := meta.Save(); err != nil {
		return fmt.Errorf("failed to save metadata: %w", err)
	}

	e.log.Info("Incremental backup created successfully",
		"output", outputFile,
		"size", stat.Size(),
		"changed_files", len(changedFiles),
		"checksum", checksum[:16]+"...")

	return nil
}
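
// For illustration, the saved .meta.json for an incremental backup carries
// roughly this shape. Field names follow the struct literal above; the exact
// JSON keys live in the metadata package's tags, so the keys and sample
// values here are assumptions:
//
//	{
//	  "version": "2.2.0",
//	  "database": "appdb",
//	  "backup_type": "incremental",
//	  "backup_file": "/backups/appdb_incr_20250102_031500.tar.gz",
//	  "sha256": "3f5a...",
//	  "compression": "gzip",
//	  "base_backup": "appdb_full_20250101_020000.tar.gz",
//	  "incremental": {
//	    "base_backup_id": "9c1d...",
//	    "incremental_files": 42,
//	    "total_size": 10485760,
//	    "backup_chain": [
//	      "appdb_full_20250101_020000.tar.gz",
//	      "appdb_incr_20250102_031500.tar.gz"
//	    ]
//	  }
//	}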

// RestoreIncremental restores an incremental backup on top of a base
func (e *PostgresIncrementalEngine) RestoreIncremental(ctx context.Context, baseBackupPath, incrementalPath, targetDir string) error {
	e.log.Info("Restoring incremental backup",
		"base", baseBackupPath,
		"incremental", incrementalPath,
		"target", targetDir)

	// TODO: Implementation in next step
	// 1. Extract base backup to target
	// 2. Extract incremental backup, overwriting files
	// 3. Verify checksums
	// 4. Update permissions

	return fmt.Errorf("not implemented yet")
}
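
// A minimal sketch of the overlay restore described by the TODO above:
// extract the base archive into targetDir, then extract the incremental on
// top so its files overwrite the base's. extractTarGz is hypothetical (it is
// not part of this file) and assumes entries are stored with paths relative
// to the data directory, as the archive creation does. Needs "archive/tar"
// and "compress/gzip" in the import block. A real implementation should also
// reject entry names that escape targetDir (path traversal) and verify the
// metadata checksums before extracting.
func extractTarGz(ctx context.Context, archivePath, targetDir string) error {
	f, err := os.Open(archivePath)
	if err != nil {
		return err
	}
	defer f.Close()

	gz, err := gzip.NewReader(f)
	if err != nil {
		return err
	}
	defer gz.Close()

	tr := tar.NewReader(gz)
	for {
		// Honor cancellation between entries
		select {
		case <-ctx.Done():
			return ctx.Err()
		default:
		}

		hdr, err := tr.Next()
		if err == io.EOF {
			break // end of archive
		}
		if err != nil {
			return err
		}

		dest := filepath.Join(targetDir, hdr.Name)
		if hdr.Typeflag == tar.TypeDir {
			if err := os.MkdirAll(dest, hdr.FileInfo().Mode()); err != nil {
				return err
			}
			continue
		}

		if err := os.MkdirAll(filepath.Dir(dest), 0o755); err != nil {
			return err
		}

		// O_TRUNC is what makes the incremental pass overwrite base files
		out, err := os.OpenFile(dest, os.O_CREATE|os.O_TRUNC|os.O_WRONLY, hdr.FileInfo().Mode())
		if err != nil {
			return err
		}
		if _, err := io.Copy(out, tr); err != nil {
			out.Close()
			return err
		}
		out.Close()
	}

	return nil
}

// RestoreIncremental would then reduce to:
//
//	if err := extractTarGz(ctx, baseBackupPath, targetDir); err != nil { ... }
//	if err := extractTarGz(ctx, incrementalPath, targetDir); err != nil { ... }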

// CalculateFileChecksum computes the SHA-256 hash of a file
func (e *PostgresIncrementalEngine) CalculateFileChecksum(path string) (string, error) {
	file, err := os.Open(path)
	if err != nil {
		return "", err
	}
	defer file.Close()

	hash := sha256.New()
	if _, err := io.Copy(hash, file); err != nil {
		return "", err
	}

	return hex.EncodeToString(hash.Sum(nil)), nil
}
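
// incremental_tar.go is summarized at the top of this note but not included
// in the listing. A minimal sketch of what its createTarGz might look like,
// matching the call site in CreateIncrementalBackup and the described
// behavior (context cancellation, per-file progress logging, preserved
// permissions and timestamps); the body is an assumption, not the actual
// implementation. Needs "archive/tar" and "compress/gzip" imports.
func (e *PostgresIncrementalEngine) createTarGz(ctx context.Context, outputFile string, changedFiles []ChangedFile, config *IncrementalBackupConfig) error {
	out, err := os.Create(outputFile)
	if err != nil {
		return err
	}
	defer out.Close()

	gz := gzip.NewWriter(out)
	defer gz.Close()

	tw := tar.NewWriter(gz)
	defer tw.Close()

	for i, f := range changedFiles {
		// Stop promptly if the backup run was cancelled
		select {
		case <-ctx.Done():
			return ctx.Err()
		default:
		}

		info, err := os.Stat(f.AbsolutePath)
		if err != nil {
			return err
		}

		// FileInfoHeader carries mode bits and ModTime into the tar header
		hdr, err := tar.FileInfoHeader(info, "")
		if err != nil {
			return err
		}
		hdr.Name = filepath.ToSlash(f.RelativePath)

		if err := tw.WriteHeader(hdr); err != nil {
			return err
		}

		src, err := os.Open(f.AbsolutePath)
		if err != nil {
			return err
		}
		if _, err := io.Copy(tw, src); err != nil {
			src.Close()
			return err
		}
		src.Close()

		e.log.Info("Added file to incremental archive",
			"file", f.RelativePath,
			"progress", fmt.Sprintf("%d/%d", i+1, len(changedFiles)))
	}

	return nil
}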

// buildBackupChain constructs the backup chain from base backup to current incremental
func buildBackupChain(baseInfo *metadata.BackupMetadata, currentBackup string) []string {
	chain := []string{}

	// If base backup has a chain (is itself incremental), use that
	if baseInfo.Incremental != nil && len(baseInfo.Incremental.BackupChain) > 0 {
		chain = append(chain, baseInfo.Incremental.BackupChain...)
	} else {
		// Base is a full backup, start chain with it
		chain = append(chain, filepath.Base(baseInfo.BackupFile))
	}

	// Add current incremental to chain
	chain = append(chain, currentBackup)

	return chain
}
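
To address the "wire into backup engine" next step called out above, a hypothetical end-to-end driver (the function name and surrounding setup are assumptions; the two engine calls and their order match the code above):

// runIncremental is hypothetical glue, not part of the package yet.
func runIncremental(ctx context.Context, log logger.Logger, basePath, dataDir string) error {
	eng := NewPostgresIncrementalEngine(log)

	cfg := &IncrementalBackupConfig{
		BaseBackupPath: basePath, // the full backup created earlier
		DataDirectory:  dataDir,  // live PostgreSQL data directory
	}

	// Step 1: mtime scan against the base backup's timestamp
	changed, err := eng.FindChangedFiles(ctx, cfg)
	if err != nil {
		return err
	}

	// Step 2: archive only the changed files and write .meta.json
	return eng.CreateIncrementalBackup(ctx, cfg, changed)
}

Because buildBackupChain copies the base's existing chain before appending, chaining incrementals off incrementals grows the list one entry per backup: [full] -> [full, incr1] -> [full, incr1, incr2], which is the order a restore must replay.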