vgg_predict 🗿

Adapt VGG-Face as the core model to predict human judgments in the face similarity task.

Run this script via the command line interface (CLI) to train the VGG-Face model on human judgments.

What arguments can be passed in CLI?

python -m facesim3d.vgg_predict --help

Functions:

Name	Description
`evaluate_vgg_face_human_judgment_model`	Evaluate the `VGG-Face` model for human similarity judgments.
`main`	Run the main function of `vgg_predict.py`.
`train_vgg_face_human_judgment_model`	Train the `VGG-Face` model for human similarity judgments.

evaluate_vgg_face_human_judgment_model 🗿

evaluate_vgg_face_human_judgment_model(
    model: VGGFaceHumanjudgment,
    data: DataLoader,
    device: str,
    loss_fn: Module | None = None,
    writer: SummaryWriter | None = None,
    global_step: int = 0,
) -> float

Evaluate the VGG-Face model for human similarity judgments.

Source code in code/facesim3d/modeling/VGG/vgg_predict.py

def evaluate_vgg_face_human_judgment_model(
    model: VGGFaceHumanjudgment,
    data: DataLoader,
    device: str,
    loss_fn: torch.nn.Module | None = None,
    writer: SummaryWriter | None = None,
    global_step: int = 0,
) -> float:
    """Evaluate the `VGG-Face` model for human similarity judgments."""
    model.eval()
    correct = 0
    total = 0

    n_print = np.maximum(len(data) // 25, 10)  # print 25 times over dataset
    running_loss = 0.0
    with torch.no_grad():
        for i, data_i in tqdm(
            enumerate(data),
            desc=f"Iterate through {'test' if loss_fn is None else 'val'} samples",
            total=len(data),
            position=0 if loss_fn is None else 2,
            leave=loss_fn is None,
        ):
            x1, x2, x3, y, _ = data_i.values()  # _ = idx
            outputs = model(x1.to(device), x2.to(device), x3.to(device))
            _, predicted = torch.max(outputs.data, 1)

            total += y.size(0)
            correct += (predicted == y.to(device)).sum().item()

            if loss_fn:
                loss = loss_fn(outputs, y.to(device))
                running_loss += loss.item()
            if (i % n_print) == (n_print - 1):
                if loss_fn:
                    msg = f"Step: {i + 1:6d}, Loss: {loss.item():.5f} | running loss: {running_loss / n_print:.5f}"
                    print(msg)
                if writer is not None:
                    if loss_fn:  # currently only for validation set
                        writer.add_scalar(
                            tag=f"loss/{'test' if loss_fn is None else 'val'}",
                            scalar_value=loss.item(),
                            global_step=i + global_step,
                        )
                    writer.add_scalar(
                        tag=f"running_acc/{'test' if loss_fn is None else 'val'}",
                        scalar_value=correct / total,
                        global_step=i + global_step,
                    )

    acc = correct / total
    msg = f"Accuracy of the network on the {'test' if loss_fn is None else 'validation'} set (n={total}): {acc:.2%}"
    print(msg)
    logger.info(msg)

    return acc

main 🗿

main()

Run the main function of vgg_predict.py.

Source code in code/facesim3d/modeling/VGG/vgg_predict.py

def main():
    """Run the main function of `vgg_predict.py`."""
    # Set device
    if FLAGS.device is None:
        device = str(torch.device("cuda:0" if torch.cuda.is_available() else "cpu"))
    else:
        device = FLAGS.device
    cprint(string=f"\nUsing {device = }\n", col="y", ts=True)
    logger.info("Using device: %s", device)

    # Set seed
    if FLAGS.seed is not None:
        torch.manual_seed(FLAGS.seed)
        np.random.seed(FLAGS.seed)

        if device.startswith("cuda"):
            torch.cuda.manual_seed(FLAGS.seed)
            torch.cuda.manual_seed_all(FLAGS.seed)
            torch.backends.cudnn.benchmark = True  # look for optimal algorithms for the given train config
        logger.info("Set seed to %s.", FLAGS.seed)

    # Init model
    if FLAGS.freeze_weights:
        # This uses pre-computed activation maps of the VGGFace model
        vgg_hum = (
            VGGFaceHumanjudgmentFrozenCore(
                decision_block=FLAGS.decision_block,
                last_core_layer=FLAGS.last_core_layer,
                parallel_bridge=FLAGS.parallel_bridge,
                session=FLAGS.session,
            )
            .to(device)
            .float()
        )
    else:
        # Here we train end-to-end from image space to human judgments
        vgg_hum = (
            VGGFaceHumanjudgment(
                decision_block=FLAGS.decision_block,
                freeze_vgg_core=FLAGS.freeze_weights,
                last_core_layer=FLAGS.last_core_layer,
                parallel_bridge=FLAGS.parallel_bridge,
                session=FLAGS.session,
            )
            .to(device)
            .float()
        )

    # Train model to predict human judgment
    cprint(
        string=f"\nTraining & testing ({pd.Timestamp.now().ceil(freq='s')})\n"
        f"\t{vgg_hum.__class__.__name__}:\n"
        f"\t\t▸ '{FLAGS.session}' session\n"
        f"\t\t▸ '{FLAGS.decision_block}' decision block\n"
        f"\t\t▸ {'frozen' if FLAGS.freeze_weights else 'unfrozen'} VGG core\n"
        f"\t\t▸ last core layer: '{FLAGS.last_core_layer}'\n"
        f"\t\t▸ parallel bridge: {FLAGS.parallel_bridge}\n"
        f"\t\t▸ learning rate: {FLAGS.learning_rate}\n"
        f"\t\t▸ exclusive gender trials : {FLAGS.exclusive_gender_trials}\n",
        col="b",
        fm="ul",
    )

    # Prepare data
    train_dl, val_dl, test_dl = prepare_data_for_human_judgment_model(
        session=FLAGS.session,
        frozen_core=FLAGS.freeze_weights,
        data_mode=FLAGS.data_mode,
        last_core_layer=FLAGS.last_core_layer,
        split_ratio=(0.7, 0.15, 0.15),  # keep training set large for testing function
        batch_size=FLAGS.batch_size,
        shuffle=FLAGS.shuffle,
        num_workers=FLAGS.num_workers,
        dtype=torch.float32,
        heads=FLAGS.heads,
        size=FLAGS.n_samples,
        exclusive_gender_trials=FLAGS.exclusive_gender_trials,
    )  # keep size small for testing of implementation
    logger.info("Data is prepared for '%s'", vgg_hum.__class__.__name__)

    # Train & test model
    trained_vgg_hum = train_vgg_face_human_judgment_model(
        model=vgg_hum,
        session=FLAGS.session,
        data_mode=FLAGS.data_mode,
        exclusive_gender_trials=FLAGS.exclusive_gender_trials,
        train_data=train_dl,
        val_data=val_dl,
        test_data=test_dl,
        epochs=FLAGS.epochs,
        learning_rate=FLAGS.learning_rate,
        device=device,
        send_message=FLAGS.notification,
        seed=FLAGS.seed,
    )
    logger.info("Finished training of '%s'.", {trained_vgg_hum.__class__.__name__})
    cprint(string=f"\nI, '{trained_vgg_hum.__class__.__name__}', am trained!\n", col="g", fm="bo")

train_vgg_face_human_judgment_model 🗿

train_vgg_face_human_judgment_model(
    model: (
        VGGFaceHumanjudgment
        | VGGFaceHumanjudgmentFrozenCore
    ),
    session: str,
    data_mode: str,
    exclusive_gender_trials: str | None,
    train_data: DataLoader,
    val_data: DataLoader,
    test_data: DataLoader,
    epochs: int,
    device: str,
    learning_rate: float,
    send_message: bool = False,
    seed: int | None = None,
) -> VGGFaceHumanjudgment

Train the VGG-Face model for human similarity judgments.

Source code in code/facesim3d/modeling/VGG/vgg_predict.py

def train_vgg_face_human_judgment_model(
    model: VGGFaceHumanjudgment | VGGFaceHumanjudgmentFrozenCore,
    session: str,
    data_mode: str,
    exclusive_gender_trials: str | None,
    train_data: DataLoader,
    val_data: DataLoader,
    test_data: DataLoader,
    epochs: int,
    device: str,
    learning_rate: float,
    send_message: bool = False,
    seed: int | None = None,
) -> VGGFaceHumanjudgment:
    """Train the `VGG-Face` model for human similarity judgments."""
    # Check arguments
    exclusive_gender_trials = check_exclusive_gender_trials(exclusive_gender_trials=exclusive_gender_trials)
    # TODO: turn "" into e.g. "full_sample", after running all models, & move previous dirs  # noqa: FIX002
    p_fix = "" if exclusive_gender_trials is None else f"{exclusive_gender_trials}_only_trials"  # path_fix

    # Prepare model
    model_name = f"{datetime.now().strftime('%Y-%m-%d_%H-%M')}_{model.__class__.__name__}"
    model.name = model_name
    save_path = Path(paths.data.models.vggbehave, p_fix, session, f"{model_name}_final.pth")
    save_path_best = Path(str(save_path).replace("_final.pth", "_best.pth"))
    save_path.parent.mkdir(parents=True, exist_ok=True)

    model.train()
    criterion = nn.CrossEntropyLoss()
    optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)
    writer = SummaryWriter(log_dir=str(Path(paths.data.models.vggbehave, p_fix, "runs", session, model_name)))

    # Write an input example and graph to tensorboard
    # writer.add_graph(model=model, input_to_model=(img1.to(device), img2.to(device), img3.to(device)),
    #                  verbose=True)

    n_print = np.maximum(len(train_data) // 5, 2)  # print 5 times per epoch
    val_freq = np.maximum(epochs // 10, 2)
    cprint(string=f"\nStart training of '{model_name}' ...\n", col="b", fm="ul")
    best_acc = 0.0  # for validation set, init
    start_time = pd.Timestamp.now()
    epoch_acc = 0.0  # init
    logger.info("Start training of '%s' ...", model_name)
    for epoch in tqdm(range(epochs), desc="Epochs", total=epochs, position=0):
        running_loss = 0.0  # reset for each epoch
        running_corrects = 0
        for i, data in tqdm(
            enumerate(train_data),
            desc="Iterate through training samples",
            total=len(train_data),
            position=1,
            leave=False,
        ):
            x1, x2, x3, y, _ = data.values()  # _ = idx
            optimizer.zero_grad()
            outputs = model(x1.to(device), x2.to(device), x3.to(device))
            _, predictions = torch.max(outputs, 1)
            loss = criterion(outputs, y.to(device))
            loss.backward()
            optimizer.step()

            running_loss += loss.item() * x1.size(0)  # x1.size(0) == train_data.batch_size
            # multiply by batch size to get the correct loss since average is taken over batch for x-entropy
            running_corrects += torch.sum(predictions == y.data.to(device))  # OR just y
            if (i % n_print) == (n_print - 1):
                # Save (running) loss to file / use the writer
                msg = (
                    f"Epoch: {epoch + 1} | Step: {i + 1:6d} | Current loss: {loss.item():.5f} | "
                    f"Running loss: {running_loss / ((i + 1) * train_data.batch_size):.5f}"
                )
                print(msg, end="\r")
                logger.info(msg)
                writer.add_scalar(tag="loss/train", scalar_value=loss.item(), global_step=i)
                writer.add_scalar(
                    tag="running_acc/train",
                    scalar_value=running_corrects.double() / ((i + 1) * train_data.batch_size),
                    global_step=i * (epoch + 1),
                )

        epoch_loss = running_loss / (len(train_data) * train_data.batch_size)
        # == train_data.sampler.num_samples
        epoch_acc = running_corrects.double() / (len(train_data) * train_data.batch_size)
        cprint(
            string=f"After epoch {epoch + 1}: Training Loss: {epoch_loss:.4f} | Acc: {epoch_acc:.2%}", col="g", ts=True
        )

        if (epoch % val_freq) == (val_freq - 1):
            val_acc = evaluate_vgg_face_human_judgment_model(
                model=model,
                data=val_data,
                device=device,
                loss_fn=criterion,
                writer=writer,
                global_step=i * (epoch + 1),
            )
            model.train()  # switch back to train mode

            if val_acc > best_acc:
                best_acc = val_acc
                torch.save(model.state_dict(), save_path_best)
                cprint(
                    string=f"Saved model with current best val accuracy ({best_acc:.1%}) to '{save_path_best}'",
                    col="b",
                    ts=True,
                )

    cprint("\n" + 2 * "*****_" + " FINISHED TRAINING " + "_*****" * 3 + "\n", col="g", ts=True)

    # Last evaluation of the model on the training and validation set
    accs = {
        "train": epoch_acc.cpu().item(),  # use last epoch's accuracy
        "val": evaluate_vgg_face_human_judgment_model(
            model=model, data=val_data, device=device, loss_fn=criterion, writer=writer
        ),
        "test": evaluate_vgg_face_human_judgment_model(
            model=model, data=test_data, device=device, loss_fn=None, writer=writer
        ),
    }
    for set_name, acc in accs.items():
        msg = f"Final accuracy of the network on the {set_name} set: {acc:.2%}"
        cprint(string=msg, col="g", fm="bo")
        logger.info(msg)

    # Save the final model
    if accs["val"] >= best_acc:
        msg = f"Final model has the best val accuracy ({accs['val']:.1%}) and is saved to '{save_path}'"
        torch.save(model.state_dict(), save_path)
        if save_path_best.exists():
            save_path_best.unlink()
    else:
        msg = (
            f"Final model has not the best val accuracy ({accs['val']:.1%}), hence we keep previous best model "
            f"only and rename it to '{save_path}'"
        )
        if save_path_best.exists():
            save_path_best.rename(save_path)
    cprint(string=msg, col="b", ts=True)
    logger.info(msg)

    # Save model hyperparameters to a table
    hp_tab = get_vgg_performance_table(hp_search=False, exclusive_gender_trials=exclusive_gender_trials)

    n_heads = len(np.unique(train_data.dataset.dataset.session_data.to_numpy().flatten()))
    # Fill in hyperparameters & accuracies
    hp_tab.loc[len(hp_tab), :] = [
        model_name,
        session,
        data_mode.lower(),
        model.freeze_vgg_core,
        model.last_core_layer,
        model.parallel_bridge,
        model.decision_block_mode,
        train_data.batch_size,
        epochs,
        learning_rate,
        seed,
        device,
        n_heads,
        len(train_data),
        len(val_data),
        (pd.Timestamp.now() - start_time).round(freq="s"),
        accs["train"],
        accs["val"],
        accs["test"],
    ]
    # Convert columns to correct types
    hp_tab.time_taken = hp_tab.time_taken.astype(str)  # the writer (below) cannot handle timedelta64
    acc_cols = [c for c in hp_tab.columns if "_acc" in c]
    col_convert = ["bs", "epochs", "seed", "n_train", "n_val"]
    hp_tab[col_convert] = hp_tab[col_convert].astype(int)
    hp_tab[acc_cols] = hp_tab[acc_cols].astype(float).round(3)

    # Also save hyperparameters & accuracies to tensorboard
    writer.add_hparams(
        hparam_dict=hp_tab.loc[len(hp_tab) - 1, hp_tab.columns[:-3]].to_dict(),
        metric_dict=hp_tab.loc[len(hp_tab) - 1, hp_tab.columns[-3:]].to_dict(),
    )

    # Save hp table
    p2_save = (
        paths.data.models.behave.hp_table
        if exclusive_gender_trials is None
        else paths.data.models.behave.hp_table_gender.format(gender=exclusive_gender_trials)
    )
    Path(p2_save).parent.mkdir(parents=True, exist_ok=True)
    hp_tab.to_csv(p2_save, index=False)
    logger.info("Saved hyperparameters & accuracies to '%s'.", p2_save)

    # Close tensorboard writer
    writer.close()

    # Send notification
    if send_message:
        response = send_to_mattermost(
            text=MODEL_MESSAGE.format(
                model_name=model_name, hp=hp_tab.loc[len(hp_tab) - 1].to_markdown()
            ),  # long narrow table (better for Mattermost)
            username=config.PROJECT_NAME,
            incoming_webhook=config.minerva.webhook_in,
            icon_url=config.PROJECT_ICON_URL2,
        )

        if not response.ok:
            msg = f"Could not send message to Mattermost: {response.text}"
            cprint(string=msg, col="r", ts=True)
            logger.error(msg)
    return model