feat: v2.0 Sprint 3 - Cloud URI Support & Command Integration (Part 1)

Sprint 3 Implementation - Cloud URI Support:

New Features:
 Cloud URI parser (s3://bucket/path)
 Backup command with --cloud URI flag
 Restore from cloud URIs
 Verify cloud backups
 Cleanup cloud storage with retention policy

New Files:
- internal/cloud/uri.go - Cloud URI parser
- internal/restore/ - Cloud download module
- internal/restore/cloud_download.go - Download & verify helper

Modified Commands:
- cmd/backup.go - Added --cloud s3://bucket/path flag
- cmd/restore.go - Auto-detect & download from cloud URIs
- cmd/verify.go - Verify backups from cloud storage
- cmd/cleanup.go - Apply retention policy to cloud storage

URI Support:
- s3://bucket/path/file.dump - AWS S3
- minio://bucket/path/file.dump - MinIO
- b2://bucket/path/file.dump - Backblaze B2
- gs://bucket/path/file.dump - Google Cloud Storage

Examples:
  # Backup with cloud URI
  dbbackup backup single mydb --cloud s3://my-bucket/backups/

  # Restore from cloud
  dbbackup restore single s3://my-bucket/backups/mydb.dump --confirm

  # Verify cloud backup
  dbbackup verify-backup s3://my-bucket/backups/mydb.dump

  # Cleanup old cloud backups
  dbbackup cleanup s3://my-bucket/backups/ --retention-days 30

Features:
- Automatic download to temp directory
- SHA-256 verification after download
- Automatic temp file cleanup
- Progress tracking for downloads
- Metadata synchronization
- Retention policy for cloud storage

Sprint 3 Part 1 COMPLETE!
This commit is contained in:
2025-11-25 20:30:28 +00:00
parent 20b7f1ec04
commit bdf9af0650
6 changed files with 798 additions and 37 deletions

198
internal/cloud/uri.go Normal file
View File

@@ -0,0 +1,198 @@
package cloud
import (
"fmt"
"net/url"
"path"
"strings"
)
// CloudURI represents a parsed cloud storage URI
type CloudURI struct {
Provider string // "s3", "minio", "azure", "gcs", "b2"
Bucket string // Bucket or container name
Path string // Path within bucket (without leading /)
Region string // Region (optional, extracted from host)
Endpoint string // Custom endpoint (for MinIO, etc)
FullURI string // Original URI string
}
// ParseCloudURI parses a cloud storage URI like s3://bucket/path/file.dump
// Supported formats:
// - s3://bucket/path/file.dump
// - s3://bucket.s3.region.amazonaws.com/path/file.dump
// - minio://bucket/path/file.dump
// - azure://container/path/file.dump
// - gs://bucket/path/file.dump (Google Cloud Storage)
// - b2://bucket/path/file.dump (Backblaze B2)
func ParseCloudURI(uri string) (*CloudURI, error) {
if uri == "" {
return nil, fmt.Errorf("URI cannot be empty")
}
// Parse URL
parsed, err := url.Parse(uri)
if err != nil {
return nil, fmt.Errorf("invalid URI: %w", err)
}
// Extract provider from scheme
provider := strings.ToLower(parsed.Scheme)
if provider == "" {
return nil, fmt.Errorf("URI must have a scheme (e.g., s3://)")
}
// Validate provider
validProviders := map[string]bool{
"s3": true,
"minio": true,
"azure": true,
"gs": true,
"gcs": true,
"b2": true,
}
if !validProviders[provider] {
return nil, fmt.Errorf("unsupported provider: %s (supported: s3, minio, azure, gs, gcs, b2)", provider)
}
// Normalize provider names
if provider == "gcs" {
provider = "gs"
}
// Extract bucket and path
bucket := parsed.Host
if bucket == "" {
return nil, fmt.Errorf("URI must specify a bucket (e.g., s3://bucket/path)")
}
// Extract region from AWS S3 hostname if present
// Format: bucket.s3.region.amazonaws.com or bucket.s3-region.amazonaws.com
var region string
var endpoint string
if strings.Contains(bucket, ".amazonaws.com") {
parts := strings.Split(bucket, ".")
if len(parts) >= 3 {
// Extract bucket name (first part)
bucket = parts[0]
// Extract region if present
// bucket.s3.us-west-2.amazonaws.com -> us-west-2
// bucket.s3-us-west-2.amazonaws.com -> us-west-2
for i, part := range parts {
if part == "s3" && i+1 < len(parts) && parts[i+1] != "amazonaws" {
region = parts[i+1]
break
}
if strings.HasPrefix(part, "s3-") {
region = strings.TrimPrefix(part, "s3-")
break
}
}
}
}
// For MinIO and custom endpoints, preserve the host as endpoint
if provider == "minio" || (provider == "s3" && !strings.Contains(bucket, "amazonaws.com")) {
// If it looks like a custom endpoint (has dots), preserve it
if strings.Contains(bucket, ".") && !strings.Contains(bucket, "amazonaws.com") {
endpoint = bucket
// Try to extract bucket from path
trimmedPath := strings.TrimPrefix(parsed.Path, "/")
pathParts := strings.SplitN(trimmedPath, "/", 2)
if len(pathParts) > 0 && pathParts[0] != "" {
bucket = pathParts[0]
if len(pathParts) > 1 {
parsed.Path = "/" + pathParts[1]
} else {
parsed.Path = "/"
}
}
}
}
// Clean up path (remove leading slash)
filepath := strings.TrimPrefix(parsed.Path, "/")
return &CloudURI{
Provider: provider,
Bucket: bucket,
Path: filepath,
Region: region,
Endpoint: endpoint,
FullURI: uri,
}, nil
}
// IsCloudURI checks if a string looks like a cloud storage URI
func IsCloudURI(s string) bool {
s = strings.ToLower(s)
return strings.HasPrefix(s, "s3://") ||
strings.HasPrefix(s, "minio://") ||
strings.HasPrefix(s, "azure://") ||
strings.HasPrefix(s, "gs://") ||
strings.HasPrefix(s, "gcs://") ||
strings.HasPrefix(s, "b2://")
}
// String returns the string representation of the URI
func (u *CloudURI) String() string {
return u.FullURI
}
// BaseName returns the filename without path
func (u *CloudURI) BaseName() string {
return path.Base(u.Path)
}
// Dir returns the directory path without filename
func (u *CloudURI) Dir() string {
return path.Dir(u.Path)
}
// Join appends path elements to the URI path
func (u *CloudURI) Join(elem ...string) string {
newPath := u.Path
for _, e := range elem {
newPath = path.Join(newPath, e)
}
return fmt.Sprintf("%s://%s/%s", u.Provider, u.Bucket, newPath)
}
// ToConfig converts a CloudURI to a cloud.Config
func (u *CloudURI) ToConfig() *Config {
cfg := &Config{
Provider: u.Provider,
Bucket: u.Bucket,
Prefix: u.Dir(), // Use directory part as prefix
}
// Set region if available
if u.Region != "" {
cfg.Region = u.Region
}
// Set endpoint if available (for MinIO, etc)
if u.Endpoint != "" {
cfg.Endpoint = u.Endpoint
}
// Provider-specific settings
switch u.Provider {
case "minio":
cfg.PathStyle = true
case "b2":
cfg.PathStyle = true
}
return cfg
}
// BuildRemotePath constructs the full remote path for a file
func (u *CloudURI) BuildRemotePath(filename string) string {
if u.Path == "" || u.Path == "." {
return filename
}
return path.Join(u.Path, filename)
}

View File

@@ -0,0 +1,211 @@
package restore
import (
"context"
"crypto/sha256"
"encoding/hex"
"fmt"
"io"
"os"
"path/filepath"
"dbbackup/internal/cloud"
"dbbackup/internal/logger"
"dbbackup/internal/metadata"
)
// CloudDownloader handles downloading backups from cloud storage
type CloudDownloader struct {
backend cloud.Backend
log logger.Logger
}
// NewCloudDownloader creates a new cloud downloader
func NewCloudDownloader(backend cloud.Backend, log logger.Logger) *CloudDownloader {
return &CloudDownloader{
backend: backend,
log: log,
}
}
// DownloadOptions contains options for downloading from cloud
type DownloadOptions struct {
VerifyChecksum bool // Verify SHA-256 checksum after download
KeepLocal bool // Keep downloaded file (don't delete temp)
TempDir string // Temp directory (default: os.TempDir())
}
// DownloadResult contains information about a downloaded backup
type DownloadResult struct {
LocalPath string // Path to downloaded file
RemotePath string // Original remote path
Size int64 // File size in bytes
SHA256 string // SHA-256 checksum (if verified)
MetadataPath string // Path to downloaded metadata (if exists)
IsTempFile bool // Whether the file is in a temp directory
}
// Download downloads a backup from cloud storage
func (d *CloudDownloader) Download(ctx context.Context, remotePath string, opts DownloadOptions) (*DownloadResult, error) {
// Determine temp directory
tempDir := opts.TempDir
if tempDir == "" {
tempDir = os.TempDir()
}
// Create unique temp subdirectory
tempSubDir := filepath.Join(tempDir, fmt.Sprintf("dbbackup-download-%d", os.Getpid()))
if err := os.MkdirAll(tempSubDir, 0755); err != nil {
return nil, fmt.Errorf("failed to create temp directory: %w", err)
}
// Extract filename from remote path
filename := filepath.Base(remotePath)
localPath := filepath.Join(tempSubDir, filename)
d.log.Info("Downloading backup from cloud", "remote", remotePath, "local", localPath)
// Get file size for progress tracking
size, err := d.backend.GetSize(ctx, remotePath)
if err != nil {
d.log.Warn("Could not get remote file size", "error", err)
size = 0 // Continue anyway
}
// Progress callback
var lastPercent int
progressCallback := func(transferred, total int64) {
if total > 0 {
percent := int(float64(transferred) / float64(total) * 100)
if percent != lastPercent && percent%10 == 0 {
d.log.Info("Download progress", "percent", percent, "transferred", cloud.FormatSize(transferred), "total", cloud.FormatSize(total))
lastPercent = percent
}
}
}
// Download file
if err := d.backend.Download(ctx, remotePath, localPath, progressCallback); err != nil {
// Cleanup on failure
os.RemoveAll(tempSubDir)
return nil, fmt.Errorf("download failed: %w", err)
}
result := &DownloadResult{
LocalPath: localPath,
RemotePath: remotePath,
Size: size,
IsTempFile: !opts.KeepLocal,
}
// Try to download metadata file
metaRemotePath := remotePath + ".meta.json"
exists, err := d.backend.Exists(ctx, metaRemotePath)
if err == nil && exists {
metaLocalPath := localPath + ".meta.json"
if err := d.backend.Download(ctx, metaRemotePath, metaLocalPath, nil); err != nil {
d.log.Warn("Failed to download metadata", "error", err)
} else {
result.MetadataPath = metaLocalPath
d.log.Debug("Downloaded metadata", "path", metaLocalPath)
}
}
// Verify checksum if requested
if opts.VerifyChecksum {
d.log.Info("Verifying checksum...")
checksum, err := calculateSHA256(localPath)
if err != nil {
// Cleanup on verification failure
os.RemoveAll(tempSubDir)
return nil, fmt.Errorf("checksum calculation failed: %w", err)
}
result.SHA256 = checksum
// Check against metadata if available
if result.MetadataPath != "" {
meta, err := metadata.Load(result.MetadataPath)
if err != nil {
d.log.Warn("Failed to load metadata for verification", "error", err)
} else if meta.SHA256 != "" && meta.SHA256 != checksum {
// Cleanup on verification failure
os.RemoveAll(tempSubDir)
return nil, fmt.Errorf("checksum mismatch: expected %s, got %s", meta.SHA256, checksum)
} else if meta.SHA256 == checksum {
d.log.Info("Checksum verified successfully", "sha256", checksum)
}
}
}
d.log.Info("Download completed", "path", localPath, "size", cloud.FormatSize(result.Size))
return result, nil
}
// DownloadFromURI downloads a backup using a cloud URI
func (d *CloudDownloader) DownloadFromURI(ctx context.Context, uri string, opts DownloadOptions) (*DownloadResult, error) {
// Parse URI
cloudURI, err := cloud.ParseCloudURI(uri)
if err != nil {
return nil, fmt.Errorf("invalid cloud URI: %w", err)
}
// Download using the path from URI
return d.Download(ctx, cloudURI.Path, opts)
}
// Cleanup removes downloaded temp files
func (r *DownloadResult) Cleanup() error {
if !r.IsTempFile {
return nil // Don't delete non-temp files
}
// Remove the entire temp directory
tempDir := filepath.Dir(r.LocalPath)
if err := os.RemoveAll(tempDir); err != nil {
return fmt.Errorf("failed to cleanup temp files: %w", err)
}
return nil
}
// calculateSHA256 calculates the SHA-256 checksum of a file
func calculateSHA256(filePath string) (string, error) {
file, err := os.Open(filePath)
if err != nil {
return "", err
}
defer file.Close()
hash := sha256.New()
if _, err := io.Copy(hash, file); err != nil {
return "", err
}
return hex.EncodeToString(hash.Sum(nil)), nil
}
// DownloadFromCloudURI is a convenience function to download from a cloud URI
func DownloadFromCloudURI(ctx context.Context, uri string, opts DownloadOptions) (*DownloadResult, error) {
// Parse URI
cloudURI, err := cloud.ParseCloudURI(uri)
if err != nil {
return nil, fmt.Errorf("invalid cloud URI: %w", err)
}
// Create config from URI
cfg := cloudURI.ToConfig()
// Create backend
backend, err := cloud.NewBackend(cfg)
if err != nil {
return nil, fmt.Errorf("failed to create cloud backend: %w", err)
}
// Create downloader
log := logger.New("info", "text")
downloader := NewCloudDownloader(backend, log)
// Download
return downloader.Download(ctx, cloudURI.Path, opts)
}