# Copyright (c) 2023, NVIDIA CORPORATION. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import os
from abc import abstractmethod
import torch
from nvflare.apis.signal import Signal
from nvflare.app_opt.pt.fedproxloss import PTFedProxLoss
class PTDittoHelper(object):
def __init__(
self, criterion, model, optimizer, device, app_dir: str, ditto_lambda: float = 0.1, model_epochs: int = 1
):
"""Helper to be used with Ditto components.
Implements the functions used for the algorithm proposed in
Li et al. "Ditto: Fair and Robust Federated Learning Through Personalization"
(https://arxiv.org/abs/2012.04221) using PyTorch.
Args:
criterion: base loss criterion
model: the personalized model of Ditto method
optimizer: training optimizer for personalized model
device: device for personalized model training
app_dir: needed for local personalized model saving
ditto_lambda: lambda weight for Ditto prox loss term when combining with the base loss, defaults to 0.1
model_epochs: training epoch for personalized model, defaults to 1
Returns:
None
"""
self.criterion = criterion
self.model = model
self.optimizer = optimizer
if device is None:
self.device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
else:
self.device = device
self.model_epochs = model_epochs
# initialize Ditto criterion
self.prox_criterion = PTFedProxLoss(mu=ditto_lambda)
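        # (PTFedProxLoss computes a proximal penalty on the distance between the
        # personalized and global model parameters, scaled by mu = ditto_lambda.)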
# check criterion, model, and optimizer type
        if not isinstance(self.criterion, torch.nn.modules.loss._Loss):
            raise ValueError(f"criterion component must be a torch loss, but got: {type(self.criterion)}")
        if not isinstance(self.model, torch.nn.Module):
            raise ValueError(f"model component must be a torch model, but got: {type(self.model)}")
        if not isinstance(self.optimizer, torch.optim.Optimizer):
            raise ValueError(f"optimizer component must be a torch optimizer, but got: {type(self.optimizer)}")
        if not isinstance(self.device, torch.device):
            raise ValueError(f"device component must be a torch device, but got: {type(self.device)}")
# initialize other recording related parameters
self.epoch_global = 0
self.epoch_of_start_time = 0
        self.best_metric: float = 0.0
self.model_file_path = os.path.join(app_dir, "personalized_model.pt")
self.best_model_file_path = os.path.join(app_dir, "best_personalized_model.pt")
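    # Illustrative construction (a sketch, not part of this module; MyNet is a
    # hypothetical torch.nn.Module and app_dir any writable directory):
    #
    #   net = MyNet()
    #   helper = PTDittoHelper(
    #       criterion=torch.nn.CrossEntropyLoss(),
    #       model=net,
    #       optimizer=torch.optim.SGD(net.parameters(), lr=0.01),
    #       device=None,  # auto-selects CUDA when available
    #       app_dir="/tmp/ditto",
    #       ditto_lambda=0.1,
    #       model_epochs=1,
    #   )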
def load_model(self, global_weights):
        # Load the local personalized model from the last round's record if it exists;
        # otherwise initialize from the global model weights for the first round.
if os.path.exists(self.model_file_path):
model_data = torch.load(self.model_file_path)
self.model.load_state_dict(model_data["model"])
self.epoch_of_start_time = model_data["epoch"]
else:
self.model.load_state_dict(global_weights)
self.epoch_of_start_time = 0
if os.path.exists(self.best_model_file_path):
model_data = torch.load(self.best_model_file_path)
self.best_metric = model_data["best_metric"]
def save_model(self, is_best=False):
# save personalized model locally
model_weights = self.model.state_dict()
save_dict = {"model": model_weights, "epoch": self.epoch_global}
if is_best:
save_dict.update({"best_metric": self.best_metric})
torch.save(save_dict, self.best_model_file_path)
else:
torch.save(save_dict, self.model_file_path)
def update_metric_save_model(self, metric):
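        # always record the latest model; additionally update the best checkpoint
        # when the new metric improves on the best seen so far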
self.save_model(is_best=False)
if metric > self.best_metric:
self.best_metric = metric
self.save_model(is_best=True)
    @abstractmethod
    def local_train(self, train_loader, model_global, abort_signal: Signal, writer):
        # Train the personalized model for self.model_epochs epochs and record the curves.
        # This part is task-dependent and needs customization.
        # The basic idea is to train the personalized model with a prox term that
        # penalizes its distance from model_global.
        raise NotImplementedError
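

# ---------------------------------------------------------------------------
# Illustrative sketch (not part of the NVFlare API): one possible task-specific
# implementation of the abstract local_train() above. The subclass name
# SupervisedDittoHelper is hypothetical; the loop assumes a standard supervised
# (inputs, labels) batch format, a SummaryWriter-like `writer`, and that
# model_global already resides on the same device as the personalized model.
# ---------------------------------------------------------------------------
class SupervisedDittoHelper(PTDittoHelper):
    def local_train(self, train_loader, model_global, abort_signal: Signal, writer):
        self.model.train()
        for epoch in range(self.model_epochs):
            self.epoch_global = self.epoch_of_start_time + epoch
            epoch_loss = 0.0
            for inputs, labels in train_loader:
                if abort_signal.triggered:
                    # stop promptly when the job is aborted
                    return
                inputs, labels = inputs.to(self.device), labels.to(self.device)
                self.optimizer.zero_grad()
                outputs = self.model(inputs)
                # base task loss plus the Ditto prox term against the global model
                loss = self.criterion(outputs, labels) + self.prox_criterion(self.model, model_global)
                loss.backward()
                self.optimizer.step()
                epoch_loss += loss.item()
            writer.add_scalar("ditto_personalized_train_loss", epoch_loss / len(train_loader), self.epoch_global)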