sunlabuiuc · Rose-Wei10 · Apr 19, 2026 · Apr 19, 2026 · Apr 20, 2026
diff --git a/docs/api/models.rst b/docs/api/models.rst
@@ -48,6 +48,9 @@ routes each feature type automatically.
    * - :doc:`models/pyhealth.models.GraphCare`
      - You want to augment EHR codes with a medical knowledge graph
      - Combines code sequences with a :class:`~pyhealth.graph.KnowledgeGraph`
+   * - :doc:`models/pyhealth.models.MedFuse`
+     - You want to fuse longitudinal EHR data with medical images (like Chest X-rays)
+     - Implements LSTM-based fusion for paired multimodal medical data.
 
 How BaseModel Works
 --------------------
@@ -183,6 +186,9 @@ API Reference
     models/pyhealth.models.GraphCare
     models/pyhealth.models.MICRON
     models/pyhealth.models.SafeDrug
+    models/pyhealth.models.MedLink
+    models/pyhealth.models.medfuse
+    models/pyhealth.models.MLP
     models/pyhealth.models.MoleRec
     models/pyhealth.models.Deepr
     models/pyhealth.models.EHRMamba

diff --git a/docs/api/models/pyhealth.models.medfuse.rst b/docs/api/models/pyhealth.models.medfuse.rst
@@ -0,0 +1,7 @@
+MedFuse
+=======
+
+.. autoclass:: pyhealth.models.MedFuse
+    :members:
+    :undoc-members:
+    :show-inheritance:
diff --git a/examples/mimic3_mortality_medfuse.py b/examples/mimic3_mortality_medfuse.py
@@ -0,0 +1,57 @@
+import torch
+from pyhealth.datasets import MIMIC3Dataset
+from pyhealth.tasks import MortalityPredictionMIMIC3
+from pyhealth.datasets import split_by_patient, get_dataloader
+from pyhealth.models import MedFuse
+from pyhealth.trainer import Trainer
+
+def run_ablation(hidden_dim):
+    print(f"\n{'='*20}")
+    print(f"RUNNING ABLATION: hidden_dim={hidden_dim}")
+    print(f"{'='*20}")
+
+    # 1. Load Dataset
+    dataset = MIMIC3Dataset(
+        root="https://storage.googleapis.com/pyhealth/Synthetic_MIMIC-III",
+        tables=["DIAGNOSES_ICD", "PROCEDURES_ICD", "PRESCRIPTIONS"],
+        dev=False, # Use the full synthetic dataset to ensure we get mortality cases
+    )
+
+    # 2. Set Task
+    task = MortalityPredictionMIMIC3()
+    samples = dataset.set_task(task)
+
+    # 3. Split by Patient (Standard Tutorial Way)
+    train_dataset, val_dataset, test_dataset = split_by_patient(
+        samples, ratios=[0.7, 0.15, 0.15] # Giving more data to Val/Test
+    )
+
+    # 4. Create Dataloaders
+    train_loader = get_dataloader(train_dataset, batch_size=32, shuffle=True)
+    val_loader = get_dataloader(val_dataset, batch_size=32, shuffle=False)
+    test_loader = get_dataloader(test_dataset, batch_size=32, shuffle=False)
+
+    # 5. Model
+    model = MedFuse(dataset=samples, hidden_dim=hidden_dim)
+
+    # 6. Trainer
+    trainer = Trainer(model=model)
+    trainer.train(
+        train_dataloader=train_loader,
+        val_dataloader=val_loader,
+        epochs=3,
+        monitor="roc_auc",
+    )
+
+    # 7. Evaluate
+    result = trainer.evaluate(test_loader)
+    print(f"Final AUROC for hidden_dim {hidden_dim}: {result['roc_auc']:.4f}")
+    return result['roc_auc']
+
+if __name__ == "__main__":
+    auc_small = run_ablation(64)
+    auc_large = run_ablation(256)
+
+    print("\n--- ABLATION SUMMARY ---")
+    print(f"Hidden Dim 64:  AUROC = {auc_small:.4f}")
+    print(f"Hidden Dim 256: AUROC = {auc_large:.4f}")
diff --git a/pyhealth/models/__init__.py b/pyhealth/models/__init__.py
@@ -45,4 +45,5 @@
 from .sdoh import SdohClassifier
 from .medlink import MedLink
 from .unified_embedding import UnifiedMultimodalEmbeddingModel, SinusoidalTimeEmbedding
-from .califorest import CaliForest
+from .medfuse import MedFuse
+from .califorest import CaliForest
diff --git a/pyhealth/models/medfuse.py b/pyhealth/models/medfuse.py
@@ -0,0 +1,88 @@
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+from pyhealth.models import BaseModel
+
+class MedFuse(BaseModel):
+    """MedFuse model for multimodal healthcare prediction.
+
+    This model implements the fusion logic from the MedMod paper,
+    combining EHR and CXR data.
+
+    Args:
+        dataset (SampleDataset): PyHealth dataset object.
+        hidden_dim (int): The dimension of the hidden layers. Defaults to 128.
+    """
+    def __init__(self, dataset, hidden_dim=128):
+        super(MedFuse, self).__init__(dataset)
+
+        # 1. Determine Input Size
+        feature_key = self.feature_keys[0]
+        processor = dataset.input_processors[feature_key]
+
+        # Check if it's categorical (needs embedding) or already a vector
+        if hasattr(processor, 'vocab_size'):
+            self.input_size = processor.vocab_size() if callable(processor.vocab_size) else processor.vocab_size
+            self.use_embedding = True
+            self.embedding = nn.Embedding(self.input_size + 10, hidden_dim, padding_idx=0)
+            lstm_input_dim = hidden_dim
+        else:
+            # If it's a vector (like the 27 we see in your error)
+            self.input_size = 27 # Force match the 27 from your error log
+            self.use_embedding = False
+            lstm_input_dim = self.input_size
+
+        # 2. EHR Encoder (LSTM)
+        self.ehr_encoder = nn.LSTM(
+            input_size=lstm_input_dim, 
+            hidden_size=hidden_dim, 
+            batch_first=True
+        )
+
+        # 3. Image Encoder (Linear)
+        self.image_encoder = nn.Linear(512, hidden_dim)
+
+        # 4. Fusion Layer
+        self.fc = nn.Linear(hidden_dim * 2, 1)
+
+    def get_loss_function(self):
+        return F.binary_cross_entropy_with_logits
+
+    def forward(self, **kwargs):
+        # 1. Extract EHR
+        ehr_key = self.feature_keys[0]
+        ehr_data = kwargs[ehr_key].float() 
+
+        if self.use_embedding:
+            # Process categorical codes
+            ehr_feat = self.embedding(ehr_data.long())
+            if ehr_feat.dim() == 4: # (batch, visit, code, dim)
+                ehr_feat = torch.mean(ehr_feat, dim=2)
+        else:
+            # Data is already a vector (batch, visit, 27)
+            ehr_feat = ehr_data
+
+        # Ensure 3D for LSTM: (batch, seq, feature)
+        if ehr_feat.dim() == 2:
+            ehr_feat = ehr_feat.unsqueeze(1)
+
+        # 2. Mock CXR
+        if "cxr" in kwargs:
+            cxr_data = kwargs["cxr"].float()
+        else:
+            cxr_data = torch.zeros(ehr_feat.shape[0], 512).to(self.device)
+
+        # 3. Forward Pass
+        _, (hn, _) = self.ehr_encoder(ehr_feat)
+        ehr_out = hn[-1]
+        cxr_out = self.image_encoder(cxr_data)
+
+        fused = torch.cat([ehr_out, cxr_out], dim=-1)
+        logits = self.fc(fused)
+
+        y_true = kwargs[self.label_keys[0]].float().view(-1, 1)
+        return {
+            "loss": self.get_loss_function()(logits, y_true),
+            "y_prob": torch.sigmoid(logits),
+            "y_true": y_true
+        }
diff --git a/tests/test_medfuse.py b/tests/test_medfuse.py
@@ -0,0 +1,95 @@
+import pytest
+import torch
+import torch.nn as nn
+import os
+import shutil
+import tempfile
+from pyhealth.models.medfuse import MedFuse
+
+
+class MockProcessor:
+    def __init__(self, size=174):
+        # satisfy method call: processor.vocab_size()
+        self.vocab_size = lambda: size 
+
+class MockDataset:
+    def __init__(self):
+        # BaseModel expects these exact names to populate feature/label keys
+        self.input_schema = {"conditions": None}
+        self.output_schema = {"label": None}
+
+        # MedFuse __init__ looks here for the vocab size
+        self.input_processors = {"conditions": MockProcessor(174)}
+
+        # Standard metadata
+        self.feature_keys = ["conditions"]
+        self.label_keys = ["label"]
+        self.device = "cpu"
+
+
+@pytest.fixture
+def mock_batch():
+    """Requirement: Uses small synthetic data"""
+    batch_size = 4
+    seq_len = 5
+    return {
+        "conditions": torch.randint(0, 100, (batch_size, seq_len)),
+        "label": torch.randint(0, 2, (batch_size, 1)),
+        "cxr": torch.randn(batch_size, 512)
+    }
+
+
+def test_model_instantiation():
+    """Requirement: Tests instantiation"""
+    ds = MockDataset()
+    model = MedFuse(dataset=ds, hidden_dim=64)
+    assert isinstance(model, nn.Module)
+    assert "conditions" in model.feature_keys
+    assert "label" in model.label_keys
+
+def test_model_forward_and_shapes(mock_batch):
+    """Requirement: Tests forward pass and output shapes"""
+    ds = MockDataset()
+    model = MedFuse(dataset=ds, hidden_dim=64)
+    output = model(**mock_batch)
+
+    assert "loss" in output
+    assert "y_prob" in output
+    # Check shape: (batch_size, 1)
+    assert output["y_prob"].shape == (4, 1)
+
+def test_gradient_computation(mock_batch):
+    """Requirement: Tests gradient computation"""
+    ds = MockDataset()
+    model = MedFuse(dataset=ds, hidden_dim=64)
+    output = model(**mock_batch)
+    loss = output["loss"]
+    loss.backward()
+
+    # Check if gradients flow to the weights
+    assert model.fc.weight.grad is not None
+    assert not torch.isnan(loss)
+
+def test_data_integrity_mock():
+    """Requirement: Tests data integrity"""
+    ds = MockDataset()
+    assert "conditions" in ds.input_schema
+    assert "label" in ds.output_schema
+
+def test_edge_case_missing_cxr(mock_batch):
+    """Requirement: Tests edge cases (missing image modality)"""
+    ds = MockDataset()
+    model = MedFuse(dataset=ds, hidden_dim=64)
+
+    # Test fallback to zero-tensors when CXR is missing
+    del mock_batch["cxr"]
+
+    output = model(**mock_batch)
+    assert output["y_prob"].shape == (4, 1)
+
+def test_cleanup_logic():
+    """Requirement: Uses temporary directories and proper cleanup"""
+    temp_path = tempfile.mkdtemp()
+    assert os.path.exists(temp_path)
+    shutil.rmtree(temp_path)
+    assert not os.path.exists(temp_path)