# Check system logs
# -x adds explanatory catalog text, -e jumps to the most recent entries;
# --since limits output to the last ten minutes.
journalctl -xe --since "10 minutes ago"

# Check system resources
# Memory, disk usage and load average; && stops at the first failing command.
free -h && df -h && uptime

# Check running processes
# Sorted by memory usage, highest first; head keeps the first 20 lines of
# output (the ps header plus the top 19 processes).
ps aux --sort=-%mem | head -n 20
# Check system logs
# -x adds explanatory catalog text, -e jumps to the most recent entries;
# --since limits output to the last ten minutes.
journalctl -xe --since "10 minutes ago"

# Check system resources
# Memory, disk usage and load average; && stops at the first failing command.
free -h && df -h && uptime

# Check running processes
# Sorted by memory usage, highest first; head keeps the first 20 lines of
# output (the ps header plus the top 19 processes).
ps aux --sort=-%mem | head -n 20
# Check system logs
# -x adds explanatory catalog text, -e jumps to the most recent entries;
# --since limits output to the last ten minutes.
journalctl -xe --since "10 minutes ago"

# Check system resources
# Memory, disk usage and load average; && stops at the first failing command.
free -h && df -h && uptime

# Check running processes
# Sorted by memory usage, highest first; head keeps the first 20 lines of
# output (the ps header plus the top 19 processes).
ps aux --sort=-%mem | head -n 20
# Restart the affected service
# NOTE: "your-service" is a placeholder; substitute the real systemd unit name.
systemctl restart your-service

# Check the service logs
# Last 100 journal lines for the unit, printed directly without a pager.
journalctl -u your-service -n 100 --no-pager

# Verify the fix worked
# NOTE: PORT is a placeholder; substitute the port the service listens on.
# curl -I sends a HEAD request and prints only the response headers.
systemctl status your-service
curl -I http://localhost:PORT/health
# Restart the affected service
# NOTE: "your-service" is a placeholder; substitute the real systemd unit name.
systemctl restart your-service

# Check the service logs
# Last 100 journal lines for the unit, printed directly without a pager.
journalctl -u your-service -n 100 --no-pager

# Verify the fix worked
# NOTE: PORT is a placeholder; substitute the port the service listens on.
# curl -I sends a HEAD request and prints only the response headers.
systemctl status your-service
curl -I http://localhost:PORT/health
# Restart the affected service
# NOTE: "your-service" is a placeholder; substitute the real systemd unit name.
systemctl restart your-service

# Check the service logs
# Last 100 journal lines for the unit, printed directly without a pager.
journalctl -u your-service -n 100 --no-pager

# Verify the fix worked
# NOTE: PORT is a placeholder; substitute the port the service listens on.
# curl -I sends a HEAD request and prints only the response headers.
systemctl status your-service
curl -I http://localhost:PORT/health
# Add monitoring
# Add health checks
# Set resource limits
# Configure alerting
# Add monitoring
# Add health checks
# Set resource limits
# Configure alerting
# Add monitoring
# Add health checks
# Set resource limits
# Configure alerting
#
# - Resource exhaustion (memory, disk, CPU)
# - Configuration mismatch
# - Dependency failure
# - Code-level bug