The Refactor That Broke Production (And How Graph Analysis Would Have Prevented It)
John Doe
Last Tuesday, I deployed what looked like a straightforward refactor. Thirty minutes later, our checkout service was returning 500s and our Slack was on fire.
The change? Moving user authentication logic from our monolithic user-service into a new auth-service. Clean separation of concerns. Textbook microservices. What could go wrong?
Everything.
The "Simple" Refactor
We had a classic monolith problem. The user-service handled user profiles, preferences, billing history, AND authentication. It was becoming a maintenance nightmare (you know how this goes).
The plan:
Extract the authentication logic into a new auth-service
Make user-service depend on auth-service for token validation
Keep existing APIs intact with internal service calls
Ship it gradually
Here's what the dependency flow looked like in my head:
Frontend → user-service → auth-service → database
Clean. Linear. Simple.
But distributed systems laugh at your diagrams.
The Hidden Web
The refactor went smoothly. Unit tests passed. Integration tests passed. Code review was uneventful. I deployed to staging and everything worked perfectly.
(This should have been my first red flag. When has anything ever worked perfectly in staging?)
The problem surfaced during user preference updates. Turns out, when a user changed their email, we had this "helpful" audit trail that logged the change:
# In user-service
def update_email(user_id, new_email):
    old_email = get_current_email(user_id)
    update_user_email(user_id, new_email)

    # Log the change with user context
    audit_log.info("Email changed", extra={
        'user_id': user_id,
        'old_email': old_email,
        'new_email': new_email,
        'user_details': get_user_context(user_id)  # <-- the problem
    })
That get_user_context() function seemed innocent. It grabbed user details for audit logs. Made sense.
But look closer:
def get_user_context(user_id):
    user = User.objects.get(id=user_id)
    return {
        'username': user.username,
        'account_type': user.account_type,
        'is_admin': check_admin_status(user_id),  # <-- oh no
        'permissions': get_user_permissions(user_id)
    }
The check_admin_status() call? It hit an internal endpoint to verify admin privileges. And after my refactor, that endpoint lived in... the auth-service.
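To make the callback concrete, here's roughly what check_admin_status() amounted to after the refactor. This is a sketch: the endpoint path and timeout are illustrative, not our exact code.

import requests

def check_admin_status(user_id):
    # user-service calling back into auth-service over HTTP
    resp = requests.get(
        f"http://auth-service/internal/admin-status/{user_id}",
        timeout=2,
    )
    resp.raise_for_status()
    return resp.json()['is_admin']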
So the actual flow was:
user-service → auth-service → user-service (for user context)
Circular dependency. Classic.
Why This Broke Everything
The circular call created a deadlock during high-traffic periods. Here's what happened:
1. User update hits user-service
2. user-service calls auth-service for token validation
3. auth-service processes request, returns success
4. user-service updates database
5. Audit logging triggers get_user_context()
6. get_user_context() calls back to auth-service to check admin status
7. Under load, connection pools exhaust (see the sketch below)
8. Both services start timing out on each other
9. Circuit breakers trip
10. Everything falls over
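You can reproduce the mechanics of steps 7 and 8 in a few lines. This is a toy model, not our production code: two single-worker thread pools stand in for each service's connection pool, and the cross-call leaves each pool stuck waiting on the other.

from concurrent.futures import ThreadPoolExecutor, TimeoutError

user_pool = ThreadPoolExecutor(max_workers=1)  # user-service's only "connection"
auth_pool = ThreadPoolExecutor(max_workers=1)  # auth-service's only "connection"

def get_user_context():
    return {'is_admin': False}

def check_admin_status():
    # auth-service calls back into user-service, whose only worker
    # is still busy handling the original update below
    return user_pool.submit(get_user_context).result(timeout=2)

def update_email():
    # user-service blocks its only worker waiting on auth-service
    return auth_pool.submit(check_admin_status).result(timeout=3)

try:
    user_pool.submit(update_email).result(timeout=5)
except TimeoutError:
    print("Deadlock: each pool is stuck waiting on the other")

With real pool sizes in the dozens, it takes sustained traffic to fill every slot, which is exactly why this never showed up on a quiet staging box.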
The kicker? This only happened during email updates (rare) and only under moderate load (so not in our load tests).
Graph Analysis Would Have Caught This
After the post-mortem (and several strong coffees), I built a dependency analyzer. It maps every HTTP call, database query, and service interaction in our codebase.
Here's the simplified version:
import ast
from pathlib import Path
from urllib.parse import urlparse

import networkx as nx

class ServiceDependencyAnalyzer:
    def __init__(self, services_dir):
        self.graph = nx.DiGraph()
        self.services_dir = Path(services_dir)

    def analyze_service_calls(self, service_name):
        """Extract HTTP calls from a service's codebase"""
        service_path = self.services_dir / service_name
        for py_file in service_path.rglob("*.py"):
            tree = ast.parse(py_file.read_text())
            for node in ast.walk(tree):
                if isinstance(node, ast.Call):
                    call_target = self._extract_service_call(node)
                    if call_target:
                        self.graph.add_edge(service_name, call_target)

    def _extract_service_call(self, node):
        """Parse AST node to identify service calls"""
        # Look for requests.get/post/put/delete with a literal URL
        if (isinstance(node.func, ast.Attribute) and
                node.func.attr in ('get', 'post', 'put', 'delete')):
            if (node.args and isinstance(node.args[0], ast.Constant) and
                    isinstance(node.args[0].value, str)):
                return self._extract_service_from_url(node.args[0].value)
        return None

    def _extract_service_from_url(self, url):
        """Map http://auth-service/... to 'auth-service'"""
        # Our internal URLs use the service name as the hostname
        return urlparse(url).hostname

    def find_cycles(self):
        """Find circular dependencies"""
        # simple_cycles yields nothing when the graph is acyclic
        return list(nx.simple_cycles(self.graph))

    def analyze_impact(self, service_name):
        """Find all services that (transitively) depend on this one"""
        if service_name not in self.graph:
            return []
        # All other nodes that have a path TO this service
        return [node for node in self.graph.nodes()
                if node != service_name
                and nx.has_path(self.graph, node, service_name)]
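Wiring it up takes a few more lines (the services/ directory layout here is ours; adjust to yours):

analyzer = ServiceDependencyAnalyzer("services/")
for service in ("user-service", "auth-service", "billing-service",
                "notification-service", "admin-dashboard"):
    analyzer.analyze_service_calls(service)

print(analyzer.find_cycles())
print(analyzer.analyze_impact("auth-service"))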
Running this on our pre-refactor code would have shown:
Circular dependencies found:
[['user-service', 'auth-service']]
Impact analysis for auth-service changes:
- user-service (direct dependency)
- billing-service (depends on user-service)
- notification-service (depends on user-service)
- admin-dashboard (depends on user-service)
That circular dependency would have been obvious. We could have fixed it before production.
The Real Fix
The solution wasn't just breaking the circle (though we did that). We needed to fundamentally rethink our service boundaries.
Instead of auth-service needing user details, we inverted the dependency:
# New approach: auth-service returns minimal context
def validate_token(token):
    # PyJWT needs the key and allowed algorithms; SECRET_KEY comes from config
    payload = jwt.decode(token, SECRET_KEY, algorithms=["HS256"])
    return {
        'user_id': payload['user_id'],
        'permissions': payload['permissions'],  # Embedded in token
        'expires_at': payload['exp']
    }

# user-service handles its own admin checks
def check_admin_status(user_id):
    user = User.objects.get(id=user_id)
    return user.is_admin  # No service call needed
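For that to work, permissions have to be baked in when the token is minted. The issuing side looks roughly like this; a sketch assuming PyJWT, with an illustrative 15-minute expiry:

import time
import jwt

def issue_token(user, secret_key):
    return jwt.encode(
        {
            'user_id': user.id,
            'permissions': list(user.permissions),  # captured at login
            'exp': int(time.time()) + 900,          # 15 minutes
        },
        secret_key,
        algorithm="HS256",
    )

The trade-off: permission changes only take effect when the token is reissued, so you want the expiry short.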
But the bigger win was making dependency analysis part of our CI pipeline:
# .github/workflows/dependency-check.yml
name: Dependency Analysis

on: [pull_request]

jobs:
  analyze:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v2
      - name: Run dependency analysis
        run: |
          if ! python scripts/analyze_dependencies.py; then
            echo "Circular dependencies detected!"
            exit 1
          fi
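The script itself just walks the services directory and exits nonzero on any cycle. A sketch (the analyzer import path is whatever you named the module above):

# scripts/analyze_dependencies.py
import sys

from analyzer import ServiceDependencyAnalyzer  # hypothetical module name

analyzer = ServiceDependencyAnalyzer("services/")
for service_dir in sorted(analyzer.services_dir.iterdir()):
    if service_dir.is_dir():
        analyzer.analyze_service_calls(service_dir.name)

cycles = analyzer.find_cycles()
if cycles:
    print(f"Circular dependencies found:\n{cycles}")
    sys.exit(1)
print("No circular dependencies found.")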
Now every PR gets checked for circular dependencies. No more surprises in production.
The Numbers
Before the fix:
12-hour outage
$47K in lost revenue (based on our checkout conversion rates)
847 customer support tickets
Team worked until 3 AM
After implementing dependency analysis:
Zero circular dependency incidents in 8 months
23 potential issues caught in PR review
Average resolution time: 15 minutes (vs. 12 hours)
The analysis script takes 3 minutes to run and has saved us from at least two other potential outages.
Actually Learn From This
Don't just read this and nod along. If you're running microservices, you probably have circular dependencies lurking in your codebase right now.
Build the analyzer. Run it on your services. You'll be surprised what you find.
Because the next refactor that looks "simple" might be the one that takes your site down for half a day. And unlike me, you won't have the excuse that nobody warned you.