TinyTorch/tests/integration/test_module_dependencies.py

#!/usr/bin/env python3
"""
Module Dependency Integration Testing
Tests how each module interfaces with modules that came before it
"""

# Module dependency graph for TinyTorch
MODULE_DEPENDENCIES = {
    "01_setup": [],  # No dependencies
    "02_tensor": ["01_setup"],  # Depends on setup
    "03_activations": ["02_tensor"],  # Needs Tensor
    "04_layers": ["02_tensor"],  # Needs Tensor
    "05_dense": ["02_tensor", "04_layers"],  # Needs Tensor and Layer base
    "06_spatial": ["02_tensor", "04_layers"],  # Needs Tensor and Layer base
    "07_attention": ["02_tensor", "04_layers", "05_dense"],  # Needs Tensor, Layer, Dense
    "08_dataloader": ["02_tensor"],  # Needs Tensor
    "09_normalization": ["02_tensor", "04_layers"],  # Needs Tensor and Layer
    "10_autograd": ["02_tensor"],  # Core dependency on Tensor
    "11_optimizers": ["02_tensor", "10_autograd"],  # Needs Tensor and autograd
    "12_training": ["02_tensor", "10_autograd", "11_optimizers"],  # Training loop deps
    "13_regularization": ["02_tensor", "04_layers"],  # Regularization techniques
    "14_kernels": ["02_tensor"],  # Low-level tensor ops
    "15_benchmarking": ["02_tensor"],  # Performance testing
    "16_mlops": ["02_tensor", "12_training"],  # Production deployment
    "17_tinygpt": ["02_tensor", "04_layers", "05_dense", "07_attention", "09_normalization"]  # Full stack
}

def get_module_integration_tests(module_name: str):
    """
    Get integration tests based on module dependencies.
    Returns a list of test functions to run.
    """
    tests = []

    # Get dependencies for this module
    deps = MODULE_DEPENDENCIES.get(module_name, [])

    # Generate tests based on dependencies
    if "02_tensor" in deps:
        tests.append(("test_tensor_integration", test_tensor_integration))

    if "04_layers" in deps:
        tests.append(("test_layer_integration", test_layer_integration))

    if "05_dense" in deps:
        tests.append(("test_dense_integration", test_dense_integration))

    if "10_autograd" in deps:
        tests.append(("test_autograd_integration", test_autograd_integration))

    if "11_optimizers" in deps:
        tests.append(("test_optimizer_integration", test_optimizer_integration))

    # Module-specific integration tests
    if module_name == "05_dense":
        tests.append(("test_dense_with_tensor", test_dense_with_tensor))
        tests.append(("test_dense_with_activations", test_dense_with_activations))
        tests.append(("test_multi_layer_network", test_multi_layer_network))

    elif module_name == "06_spatial":
        tests.append(("test_conv2d_with_tensor", test_conv2d_with_tensor))
        tests.append(("test_pooling_integration", test_pooling_integration))

    elif module_name == "07_attention":
        tests.append(("test_attention_with_dense", test_attention_with_dense))
        tests.append(("test_multihead_integration", test_multihead_integration))

    elif module_name == "12_training":
        tests.append(("test_training_loop_integration", test_training_loop_integration))
        tests.append(("test_loss_backward_integration", test_loss_backward_integration))

    return tests


# Base integration tests that check module interfaces
def test_tensor_integration():
    """Test that Tensor works as expected for dependent modules."""
    from tinytorch.core.tensor import Tensor
    import numpy as np

    # Test tensor creation
    t = Tensor(np.array([1, 2, 3]))
    assert t.shape == (3,), "Tensor shape should work"
    assert t.data is not None, "Tensor should have data"

    # Test tensor operations needed by other modules
    t2 = Tensor(np.array([4, 5, 6]))
    result = t.data + t2.data  # Many modules need element-wise ops
    assert result.shape == (3,), "Element-wise ops should preserve shape"


def test_layer_integration():
    """Test Layer base class interface."""
    from tinytorch.core.layers import Layer

    # Test that Layer exists and has expected interface
    assert hasattr(Layer, 'forward'), "Layer should have forward method"
    assert hasattr(Layer, '__call__'), "Layer should be callable"

    # Test basic layer creation
    layer = Layer()
    assert layer is not None, "Should create Layer instance"


def test_dense_integration():
    """Test Dense layer integration with Tensor."""
    from tinytorch.core.layers import Linear
    from tinytorch.core.tensor import Tensor
    import numpy as np

    # Test Dense with Tensor input
    layer = Linear(10, 5)
    x = Tensor(np.random.randn(32, 10))
    output = layer(x)

    assert output.shape == (32, 5), "Dense should produce correct shape"
    assert isinstance(output, Tensor), "Dense should return Tensor"


def test_dense_with_tensor():
    """Test that Dense properly uses Tensor for weights/bias."""
    from tinytorch.core.layers import Linear
    from tinytorch.core.tensor import Tensor

    layer = Linear(10, 5)

    # Check weights are Tensors
    assert isinstance(layer.weight, Tensor), "Weights should be Tensor"
    assert layer.weight.shape == (10, 5), "Weight shape should match layer dims"
    # Bias may or may not exist depending on implementation
    if hasattr(layer, 'bias') and layer.bias is not None:
    assert isinstance(layer.bias, Tensor), "Bias should be Tensor"


def test_dense_with_activations():
    """Test Dense layer works with activation functions."""
    from tinytorch.core.layers import Linear
    from tinytorch.core.activations import ReLU, Sigmoid
    from tinytorch.core.tensor import Tensor
    import numpy as np

    # Build small network: Dense -> ReLU -> Dense -> Sigmoid
    layer1 = Linear(10, 20)
    relu = ReLU()
    layer2 = Linear(20, 1)
    sigmoid = Sigmoid()

    # Forward pass
    x = Tensor(np.random.randn(16, 10))
    h1 = layer1(x)
    h1_activated = relu(h1)
    output = layer2(h1_activated)
    final = sigmoid(output)

    # Check shapes preserved through network
    assert h1.shape == (16, 20), "First layer output shape"
    assert h1_activated.shape == (16, 20), "ReLU preserves shape"
    assert output.shape == (16, 1), "Second layer output shape"
    assert final.shape == (16, 1), "Sigmoid preserves shape"

    # Check sigmoid output range
    assert np.all(final.data >= 0) and np.all(final.data <= 1), "Sigmoid outputs in [0,1]"


def test_multi_layer_network():
    """Test building multi-layer networks with Dense."""
    from tinytorch.core.layers import Linear
    from tinytorch.core.tensor import Tensor
    import numpy as np

    # Build 3-layer network
    layers = [
        Linear(784, 128),
        Linear(128, 64),
        Linear(64, 10)
    ]

    # Forward pass through all layers
    x = Tensor(np.random.randn(32, 784))

    for i, layer in enumerate(layers):
        x = layer(x)
        if i == 0:
            assert x.shape == (32, 128), f"Layer {i} shape"
        elif i == 1:
            assert x.shape == (32, 64), f"Layer {i} shape"
        elif i == 2:
            assert x.shape == (32, 10), f"Layer {i} shape"

    assert x.shape == (32, 10), "Final output shape should be (32, 10)"


def test_conv2d_with_tensor():
    """Test Conv2d integration with Tensor."""
    from tinytorch.core.spatial import Conv2d
    from tinytorch.core.tensor import Tensor
    import numpy as np

    # Create Conv2d layer
    conv = Conv2d(in_channels=3, out_channels=16, kernel_size=3)

    # Test with image tensor (batch, channels, height, width)
    x = Tensor(np.random.randn(8, 3, 32, 32))
    output = conv(x)

    # Check output shape (with valid padding, output is smaller)
    assert output.shape[0] == 8, "Batch size preserved"
    assert output.shape[1] == 16, "Output channels correct"


def test_pooling_integration():
    """Test pooling layers work with Conv2d output."""
    from tinytorch.core.spatial import Conv2d, MaxPool2d
    from tinytorch.core.tensor import Tensor
    import numpy as np

    conv = Conv2d(3, 32, kernel_size=3, padding=1)
    pool = MaxPool2d(kernel_size=2, stride=2)

    x = Tensor(np.random.randn(4, 3, 28, 28))
    conv_out = conv(x)
    pool_out = pool(conv_out)

    # Pooling should reduce spatial dimensions by half
    assert pool_out.shape[2] == conv_out.shape[2] // 2
    assert pool_out.shape[3] == conv_out.shape[3] // 2


def test_attention_with_dense():
    """Test attention mechanism uses Dense layers."""
    from tinytorch.core.attention import MultiHeadAttention
    from tinytorch.core.tensor import Tensor
    import numpy as np

    attention = MultiHeadAttention(embed_dim=64, num_heads=4)
    x = Tensor(np.random.randn(2, 10, 64))  # (batch, seq_len, embed_dim)

    output = attention(x)
    assert output.shape == x.shape, "Attention preserves shape"


def test_multihead_integration():
    """Test multi-head attention integration."""
    from tinytorch.core.attention import MultiHeadAttention
    from tinytorch.core.tensor import Tensor
    import numpy as np

    mha = MultiHeadAttention(embed_dim=64, num_heads=8)
    x = Tensor(np.random.randn(2, 10, 64))

    output = mha(x)
    assert output.shape == x.shape, "MHA preserves input shape"


def test_autograd_integration():
    """Test autograd system with Tensor."""
    from tinytorch.core.tensor import Tensor
    import numpy as np

    # Test that Tensor works with autograd
    x = Tensor(np.array([[1, 2], [3, 4]]), requires_grad=True)
    assert hasattr(x, 'grad'), "Tensor should have grad attribute"
    assert x.requires_grad == True, "Should track gradients"


def test_optimizer_integration():
    """Test optimizers work with layers."""
    from tinytorch.core.optimizers import SGD
    from tinytorch.core.layers import Linear

    layer = Linear(10, 5)
    params = layer.parameters()
    optimizer = SGD(params, lr=0.01)

    # Test optimizer has params
    assert len(params) > 0, "Layer should have parameters"


def test_training_loop_integration():
    """Test training loop integrates optimizer and autograd."""
    from tinytorch.core.layers import Linear
    from tinytorch.core.optimizers import SGD
    from tinytorch.core.losses import MSELoss
    from tinytorch.core.tensor import Tensor
    import numpy as np

    # Simple model
    model = Linear(10, 1)
    params = model.parameters()
    optimizer = SGD(params, lr=0.01)
    loss_fn = MSELoss()

    # Dummy data
    X = Tensor(np.random.randn(32, 10))
    y = Tensor(np.random.randn(32, 1))

    # One training step
    predictions = model(X)
    loss = loss_fn(predictions, y)

    # Loss should be computed
    assert loss is not None, "Loss should be computed"


def test_loss_backward_integration():
    """Test loss functions integrate with autograd."""
    from tinytorch.core.losses import MSELoss
    from tinytorch.core.tensor import Tensor
    import numpy as np

    loss_fn = MSELoss()

    # Create tensors with gradients
    predictions = Tensor(np.array([1.0, 2.0, 3.0]), requires_grad=True)
    targets = Tensor(np.array([1.5, 2.5, 3.5]))

    loss = loss_fn(predictions, targets)

    # Test backward pass
    if hasattr(loss, 'backward'):
        loss.backward()