ez-frcnn.characterize


def characterize.get_subsampled_dataset(full_dataset, num_samples):

Returns a randomly subsampled subset of a given dataset.

Inputs

full_dataset (Dataset): A PyTorch-style dataset to sample from.
num_samples (int): The number of samples to include in the returned subset.

Output

Subset: A torch.utils.data.Subset containing num_samples randomly selected items from the original dataset.

Source code in library/characterize.py
def get_subsampled_dataset(full_dataset, num_samples):
    """
    Returns a randomly subsampled subset of a given dataset.

    Inputs:
        full_dataset (Dataset): A PyTorch-style dataset to sample from.
        num_samples (int): The number of samples to include in the returned subset.

    Output:
        Subset: A torch.utils.data.Subset containing `num_samples` randomly selected items
                from the original dataset.

    """
    indices = np.random.permutation(len(full_dataset))[:num_samples]
    return Subset(full_dataset, indices)
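A minimal usage sketch with a toy dataset (the library.characterize import path follows the "Source code" note above and may differ in your setup):

import torch
from torch.utils.data import TensorDataset

from library.characterize import get_subsampled_dataset  # import path may differ

# Toy dataset: 500 random "images" with dummy integer labels.
full_dataset = TensorDataset(torch.randn(500, 3, 64, 64),
                             torch.zeros(500, dtype=torch.int64))

subset = get_subsampled_dataset(full_dataset, num_samples=100)
print(len(subset))  # 100 randomly selected samples

Sampling is without replacement; if num_samples exceeds the dataset size, the subset simply contains every item in shuffled order.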

def characterize.get_mAP(dataloader, model, device):

Computes the mean Average Precision (mAP) for a given object detection model on a dataset.

Inputs

dataloader (DataLoader): A PyTorch DataLoader providing batches of images and targets.
model (nn.Module): The object detection model to evaluate.
device (torch.device): The device (CPU or GPU) on which to run the model.

Output

dict: A dictionary containing mAP metrics computed by torchmetrics.MeanAveragePrecision().

Source code in library/characterize.py
def get_mAP(dataloader, model, device):
    """
    Computes the mean Average Precision (mAP) for a given object detection model on a dataset.

    Inputs:
        dataloader (DataLoader): A PyTorch DataLoader providing batches of images and targets.
        model (nn.Module): The object detection model to evaluate.
        device (torch.device): The device (CPU or GPU) on which to run the model.

    Output:
        dict: A dictionary containing mAP metrics computed by torchmetrics.MeanAveragePrecision().

    """
    metric = MeanAveragePrecision()
    model.eval()
    model.to(device)
    # Iterate over the DataLoader
    for images, targets in dataloader:
        images = [image.to(device) for image in images]
        targets = [{k: v.to(device) for k, v in t.items()} for t in targets]

        with torch.no_grad():
            outputs = model(images)

        # Prepare predictions and targets for torchmetrics
        preds = []
        for output in outputs:
            preds.append({
                "boxes": output['boxes'].cpu(),
                "scores": output['scores'].cpu(),
                "labels": output['labels'].cpu(),
            })

        tars = []
        for target in targets:
            tars.append({
                "boxes": target['boxes'].cpu(),
                "labels": target['labels'].cpu(),
            })

        # Update the metric with predictions and targets
        metric.update(preds, tars)

    # Compute the final mAP score
    mAP = metric.compute()
    return mAP
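A hedged evaluation sketch, using a toy dataset and an off-the-shelf torchvision detector (ez-frcnn's own create_model would normally supply the model; the import path and ToyDetectionDataset are assumptions for illustration):

import torch
from torch.utils.data import DataLoader, Dataset
from torchvision.models.detection import fasterrcnn_resnet50_fpn

from library.characterize import get_mAP  # import path may differ


class ToyDetectionDataset(Dataset):
    """Hypothetical stand-in: random images, each with one fixed dummy box."""

    def __len__(self):
        return 8

    def __getitem__(self, idx):
        image = torch.rand(3, 128, 128)
        target = {
            "boxes": torch.tensor([[10.0, 10.0, 60.0, 60.0]]),
            "labels": torch.tensor([1]),
        }
        return image, target


def collate_fn(batch):
    # Detection batches are variable-sized, so keep (image, target) pairs as lists.
    return tuple(zip(*batch))


valid_loader = DataLoader(ToyDetectionDataset(), batch_size=4, collate_fn=collate_fn)
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
model = fasterrcnn_resnet50_fpn(weights='DEFAULT')  # any torchvision-style detector works

metrics = get_mAP(valid_loader, model, device)
print(float(metrics['map']), float(metrics['map_50']))  # overall mAP and mAP@IoU=0.5

Each target dict must provide 'boxes' (N x 4) and 'labels' (N,) tensors, matching what the loop above moves to the device and hands to torchmetrics.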

def characterize.run_experiment(full_train_dataset, valid_dataset, num_classes, BATCH_SIZE, NUM_EXPERIMENTS=5, EPOCHS_PER_EXPERIMENT=100, TRIALS_PER_EXPERIMENT=3):

Runs a series of training experiments with increasing amounts of training data to evaluate model performance.

Inputs

full_train_dataset (Dataset): The full training dataset to subsample from.
valid_dataset (Dataset): The validation dataset used to compute validation mAP.
num_classes (int): Number of object classes (including background if applicable).
BATCH_SIZE (int): Batch size used for training and validation.
NUM_EXPERIMENTS (int): Number of increasing training set sizes to evaluate. Default is 5.
EPOCHS_PER_EXPERIMENT (int): Number of training epochs per experiment. Default is 100.
TRIALS_PER_EXPERIMENT (int): Number of trials to average per training size. Default is 3.

Output

list: A list of (num_samples, mean_mAP, std_mAP) tuples, one per training-set size.

Source code in library/characterize.py
def run_experiment(full_train_dataset, valid_dataset, num_classes, BATCH_SIZE, NUM_EXPERIMENTS=5, EPOCHS_PER_EXPERIMENT=100, TRIALS_PER_EXPERIMENT=3):
    """
    Runs a series of training experiments with increasing amounts of training data to evaluate model performance.

    Inputs:
        full_train_dataset (Dataset): The full training dataset to subsample from.
        valid_dataset (Dataset):      The validation dataset used to compute validation mAP.
        num_classes (int):            Number of object classes (including background if applicable).
        BATCH_SIZE (int):             Batch size used for training and validation.
        NUM_EXPERIMENTS (int):        Number of increasing training set sizes to evaluate. Default is 5.
        EPOCHS_PER_EXPERIMENT (int):  Number of training epochs per experiment. Default is 100.
        TRIALS_PER_EXPERIMENT (int):  Number of trials to average per training size. Default is 3.

    Output:
        list: A list of (num_samples, mean_mAP, std_mAP) tuples, one per training-set size.
    """
    # Device configuration
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
    metric = MeanAveragePrecision()  # note: unused here; get_mAP builds its own metric
    # Directory setup for models and plots
    model_dir = 'models/'
    plot_dir = 'plots/'

    # Calculate number of samples for each experiment
    total_samples = len(full_train_dataset)
    split_sizes = np.linspace(0, total_samples, NUM_EXPERIMENTS + 1, dtype=int)[1:]

    results = []

    # Create plot
    plt.figure()
    mean_mAPs = []
    std_mAPs = []

    for num_samples in split_sizes:
        mAPs = []
        for trial in range(TRIALS_PER_EXPERIMENT):
            print(f"\nRunning training with {num_samples} samples, trial {trial + 1}...")

            # Subsample the training dataset
            train_subset = get_subsampled_dataset(full_train_dataset, num_samples)
            train_loader, valid_loader = get_loaders(train_subset, valid_dataset, BATCH_SIZE, collate_fn)

            # Initialize a fresh instance of the model
            model = create_model(num_classes).to(device)

            # Train the model
            train_model_no_val(model, train_loader, valid_loader, device, 'experiment_model', EPOCHS_PER_EXPERIMENT, model_dir, plot_dir, 10, 10)

            # Evaluate the model
            val_mAP = get_mAP(valid_loader, model, device)
            val_mAP = float(val_mAP['map_50'])
            mAPs.append(val_mAP)
            print(f"Trial {trial + 1}: Validation mAP = {val_mAP:.3f}")

        # Compute statistics
        mean_mAP = np.mean(mAPs)
        std_mAP = np.std(mAPs)
        mean_mAPs.append(mean_mAP)
        std_mAPs.append(std_mAP)
        results.append((num_samples, mean_mAP, std_mAP))
        print(f"Finished {num_samples} samples: Mean Validation mAP = {mean_mAP:.3f}, Std Dev = {std_mAP:.3f}")

    # Plotting results
    plt.errorbar(split_sizes, mean_mAPs, yerr=std_mAPs, fmt='-o', capsize=5)
    plt.title('Mean and Standard Deviation of Validation mAP')
    plt.xlabel('Number of Training Samples')
    plt.ylabel('Validation mAP')
    plt.grid(True)
    plt.savefig(f"{plot_dir}/mAP_results.png")
    plt.show()

    return results
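
A sketch of a typical invocation. Here train_dataset, valid_dataset, and NUM_CLASSES are placeholders for your own data pipeline, and the directory setup mirrors the hard-coded model_dir and plot_dir above:

import os

from library.characterize import run_experiment  # import path may differ

# run_experiment writes checkpoints to model_dir ('models/') and the results
# plot to plot_dir ('plots/'), so make sure both directories exist.
os.makedirs('models', exist_ok=True)
os.makedirs('plots', exist_ok=True)

# train_dataset and valid_dataset are placeholders for detection datasets that
# yield (image, target) pairs, as in the get_mAP sketch above; NUM_CLASSES
# should include the background class.
results = run_experiment(
    train_dataset,
    valid_dataset,
    num_classes=NUM_CLASSES,
    BATCH_SIZE=4,
    NUM_EXPERIMENTS=5,
    EPOCHS_PER_EXPERIMENT=100,
    TRIALS_PER_EXPERIMENT=3,
)

# Each entry is (num_samples, mean_mAP, std_mAP) averaged over the trials.
for num_samples, mean_map, std_map in results:
    print(f"{num_samples} samples: mAP@0.5 = {mean_map:.3f} +/- {std_map:.3f}")

Note that the reported values are mAP at IoU 0.5 (map_50), since that is the key get_mAP's result dict is read from inside the experiment loop.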