From 1bb37595ff0ed772231ca669b55b6581489f807f Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 12:45:18 -0400 Subject: [PATCH 01/29] add FedPFT baseline --- baselines/fedpft/.gitignore | 3 + baselines/fedpft/EXTENDED_README.md | 123 ++++++++++ baselines/fedpft/LICENSE | 202 ++++++++++++++++ baselines/fedpft/README.md | 109 +++++++++ baselines/fedpft/fedpft/__init__.py | 1 + baselines/fedpft/fedpft/client.py | 170 ++++++++++++++ baselines/fedpft/fedpft/conf/base.yaml | 15 ++ .../fedpft/fedpft/conf/client/fedavg.yaml | 2 + .../fedpft/fedpft/conf/client/fedpft.yaml | 2 + .../fedpft/fedpft/conf/dataset/CIFAR100.yaml | 10 + .../fedpft/conf/dataset/Caltech101.yaml | 10 + baselines/fedpft/fedpft/conf/model/clip.yaml | 9 + .../fedpft/fedpft/conf/model/resnet50.yaml | 8 + .../fedpft/fedpft/conf/strategy/fedavg.yaml | 12 + .../fedpft/fedpft/conf/strategy/fedpft.yaml | 22 ++ baselines/fedpft/fedpft/dataset.py | 108 +++++++++ .../fedpft/fedpft/dataset_preparation.py | 1 + baselines/fedpft/fedpft/main.py | 88 +++++++ baselines/fedpft/fedpft/models.py | 221 ++++++++++++++++++ baselines/fedpft/fedpft/server.py | 94 ++++++++ baselines/fedpft/fedpft/strategy.py | 145 ++++++++++++ baselines/fedpft/fedpft/utils.py | 102 ++++++++ baselines/fedpft/pyproject.toml | 143 ++++++++++++ 23 files changed, 1600 insertions(+) create mode 100644 baselines/fedpft/.gitignore create mode 100644 baselines/fedpft/EXTENDED_README.md create mode 100644 baselines/fedpft/LICENSE create mode 100644 baselines/fedpft/README.md create mode 100644 baselines/fedpft/fedpft/__init__.py create mode 100644 baselines/fedpft/fedpft/client.py create mode 100644 baselines/fedpft/fedpft/conf/base.yaml create mode 100644 baselines/fedpft/fedpft/conf/client/fedavg.yaml create mode 100644 baselines/fedpft/fedpft/conf/client/fedpft.yaml create mode 100644 baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml create mode 100644 baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml create mode 100644 
baselines/fedpft/fedpft/conf/model/clip.yaml create mode 100644 baselines/fedpft/fedpft/conf/model/resnet50.yaml create mode 100644 baselines/fedpft/fedpft/conf/strategy/fedavg.yaml create mode 100644 baselines/fedpft/fedpft/conf/strategy/fedpft.yaml create mode 100644 baselines/fedpft/fedpft/dataset.py create mode 100644 baselines/fedpft/fedpft/dataset_preparation.py create mode 100644 baselines/fedpft/fedpft/main.py create mode 100644 baselines/fedpft/fedpft/models.py create mode 100644 baselines/fedpft/fedpft/server.py create mode 100644 baselines/fedpft/fedpft/strategy.py create mode 100644 baselines/fedpft/fedpft/utils.py create mode 100644 baselines/fedpft/pyproject.toml diff --git a/baselines/fedpft/.gitignore b/baselines/fedpft/.gitignore new file mode 100644 index 00000000000..4ab8207aedb --- /dev/null +++ b/baselines/fedpft/.gitignore @@ -0,0 +1,3 @@ +outputs/ +multirun/ +.ruff_cache/ \ No newline at end of file diff --git a/baselines/fedpft/EXTENDED_README.md b/baselines/fedpft/EXTENDED_README.md new file mode 100644 index 00000000000..9c8f5bc72fa --- /dev/null +++ b/baselines/fedpft/EXTENDED_README.md @@ -0,0 +1,123 @@ + +# Extended Readme + +> The baselines are expected to run in a machine running Ubuntu 22.04 + +While `README.md` should include information about the baseline you implement and how to run it, this _extended_ readme provides info on what's the expected directory structure for a new baseline and more generally the instructions to follow before your baseline can be merged into the Flower repository. Please follow closely these instructions. It is likely that you have already completed steps 1-2. + +1. Fork the Flower repository and clone it. +2. Navigate to the `baselines/` directory and from there run: + ```bash + # This will create a new directory with the same structure as this `baseline_template` directory. + ./dev/create-baseline.sh + ``` +3. 
All your code and configs should go into a sub-directory with the same name as the name of your baseline. + * The sub-directory contains a series of Python scripts that you can edit. Please stick to these files and consult with us if you need additional ones. + * There is also a basic config structure in `/conf` ready be parsed by [Hydra](https://hydra.cc/) when executing your `main.py`. +4. Therefore, the directory structure in your baseline should look like: + ```bash + baselines/ + ├── README.md # describes your baseline and everything needed to use it + ├── EXTENDED_README.md # to remove before creating your PR + ├── pyproject.toml # details your Python environment + └── + ├── *.py # several .py files including main.py and __init__.py + └── conf + └── *.yaml # one or more Hydra config files + + ``` +> :warning: Make sure the variable `name` in `pyproject.toml` is set to the name of the sub-directory containing all your code. + +5. Add your dependencies to the `pyproject.toml` (see below a few examples on how to do it). Read more about Poetry below in this `EXTENDED_README.md`. +6. Regularly check that your coding style and the documentation you add follow good coding practices. To test whether your code meets the requirements, please run the following: + ```bash + # After activating your environment and from your baseline's directory + cd .. # to go to the top-level directory of all baselines + ./dev/test-baseline.sh + ./dev/test-baseline-structure.sh + ``` + Both `test-baseline.sh` and `test-baseline-structure.sh` will also be automatically run when you create a PR, and both tests need to pass for the baseline to be merged. + To automatically solve some formatting issues and apply easy fixes, please run the formatting script: + ```bash + # After activating your environment and from your baseline's directory + cd .. # to go to the top-level directory of all baselines + ./dev/format-baseline.sh + ``` +7. 
Ensure that the Python environment for your baseline can be created without errors by simply running `poetry install` and that this is properly described later when you complete the `Environment Setup` section in `README.md`. This is specially important if your environment requires additional steps after doing `poetry install`. +8. Ensure that your baseline runs with default arguments by running `poetry run python -m .main`. Then, describe this and other forms of running your code in the `Running the Experiments` section in `README.md`. +9. Once your code is ready and you have checked: + * that following the instructions in your `README.md` the Python environment can be created correctly + + * that running the code following your instructions can reproduce the experiments in the paper + + , then you just need to create a Pull Request (PR) to kickstart the process of merging your baseline into the Flower repository. + +> Once you are happy to merge your baseline contribution, please delete this `EXTENDED_README.md` file. + + +## About Poetry + +We use Poetry to manage the Python environment for each individual baseline. You can follow the instructions [here](https://python-poetry.org/docs/) to install Poetry in your machine. + + +### Specifying a Python Version (optional) +By default, Poetry will use the Python version in your system. In some settings, you might want to specify a particular version of Python to use inside your Poetry environment. You can do so with [`pyenv`](https://github.com/pyenv/pyenv). Check the documentation for the different ways of installing `pyenv`, but one easy way is using the [automatic installer](https://github.com/pyenv/pyenv-installer): +```bash +curl https://pyenv.run | bash # then, don't forget links to your .bashrc/.zshrc +``` + +You can then install any Python version with `pyenv install ` (e.g. `pyenv install 3.9.17`). 
Then, in order to use that version for your baseline, you'd do the following: + +```bash +# cd to your baseline directory (i.e. where the `pyproject.toml` is) +pyenv local + +# set that version for poetry +poetry env use + +# then you can install your Poetry environment (see the next setp) +``` + +### Installing Your Environment +With the Poetry tool already installed, you can create an environment for this baseline with commands: +```bash +# run this from the same directory as the `pyproject.toml` file is +poetry install +``` + +This will create a basic Python environment with just Flower and additional packages, including those needed for simulation. Next, you should add the dependencies for your code. It is **critical** that you fix the version of the packages you use using a `=` not a `=^`. You can do so via [`poetry add`](https://python-poetry.org/docs/cli/#add). Below are some examples: + +```bash +# For instance, if you want to install tqdm +poetry add tqdm==4.65.0 + +# If you already have a requirements.txt, you can add all those packages (but ensure you have fixed the version) in one go as follows: +poetry add $( cat requirements.txt ) +``` +With each `poetry add` command, the `pyproject.toml` gets automatically updated so you don't need to keep that `requirements.txt` as part of this baseline. + + +More critically however, is adding your ML framework of choice to the list of dependencies. For some frameworks you might be able to do so with the `poetry add` command. Check [the Poetry documentation](https://python-poetry.org/docs/cli/#add) for how to add packages in various ways. 
For instance, let's say you want to use PyTorch: + +```bash +# with plain `pip` you'd run a command such as: +pip install torch==1.13.1+cu117 torchvision==0.14.1+cu117 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu117 + +# to add the same 3 dependencies to your Poetry environment you'd need to add the URL to the wheel that the above pip command auto-resolves for you. +# You can find those wheels in `https://download.pytorch.org/whl/cu117`. Copy the link and paste it after the `poetry add` command. +# For instance to add `torch==1.13.1+cu117` and a x86 Linux system with Python3.8 you'd: +poetry add https://download.pytorch.org/whl/cu117/torch-1.13.1%2Bcu117-cp38-cp38-linux_x86_64.whl +# you'll need to repeat this for both `torchvision` and `torchaudio` +``` +The above is just an example of how you can add these dependencies. Please refer to the Poetry documentation to extra reference. + +If all attempts fail, you can still install packages via standard `pip`. You'd first need to source/activate your Poetry environment. +```bash +# first ensure you have created your environment +# and installed the base packages provided in the template +poetry install + +# then activate it +poetry shell +``` +Now you are inside your environment (pretty much as when you use `virtualenv` or `conda`) so you can install further packages with `pip`. Please note that, unlike with `poetry add`, these extra requirements won't be captured by `pyproject.toml`. Therefore, please ensure that you provide all instructions needed to: (1) create the base environment with Poetry and (2) install any additional dependencies via `pip` when you complete your `README.md`. 
\ No newline at end of file diff --git a/baselines/fedpft/LICENSE b/baselines/fedpft/LICENSE new file mode 100644 index 00000000000..d6456956733 --- /dev/null +++ b/baselines/fedpft/LICENSE @@ -0,0 +1,202 @@ + + Apache License + Version 2.0, January 2004 + http://www.apache.org/licenses/ + + TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + + 1. Definitions. + + "License" shall mean the terms and conditions for use, reproduction, + and distribution as defined by Sections 1 through 9 of this document. + + "Licensor" shall mean the copyright owner or entity authorized by + the copyright owner that is granting the License. + + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. + + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). 
+ + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. 
Grant of Patent License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative 
Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. 
Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. 
+ + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "[]" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. + + Copyright [yyyy] [name of copyright owner] + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md new file mode 100644 index 00000000000..3f045810835 --- /dev/null +++ b/baselines/fedpft/README.md @@ -0,0 +1,109 @@ +--- +title: Parametric Feature Transfer, One-shot Federated Learning with Foundation Models +url: https://arxiv.org/abs/2402.01862 +labels: [foundation-models, pre-trained, one-shot, one-round] # please add between 4 and 10 single-word (maybe two-words) labels (e.g. system heterogeneity, image classification, asynchronous, weight sharing, cross-silo). Do not use "" +dataset: [CIFAR100, Caltech101] # list of datasets you include in your baseline. 
Do not use "" +--- + +# FedPFT: One-shot Federated Learning with Foundation Models + +> Note: If you use this baseline in your work, please remember to cite the original authors of the paper as well as the Flower paper. + +**Paper:** [arxiv.org/abs/2402.01862](https://arxiv.org/abs/2402.01862) + +**Authors:** Mahdi Beitollahi, Alex Bie, Sobhan Hemati, Leo Maxime Brunswic, Xu Li, Xi Chen, Guojun Zhang. + +**Abstract:** In one-shot federated learning (FL), clients collaboratively train a global model in a single round of communication. Existing approaches for one-shot FL enhance communication efficiency at the expense of diminished accuracy. This paper introduces FedPFT (Federated Learning with Parametric Feature Transfer), a methodology that harnesses the transferability of foundation models to enhance both accuracy and communication efficiency in one-shot FL. The approach involves transferring per-client parametric models (specifically, Gaussian mixtures) of features extracted from foundation models. Subsequently, each parametric model is employed to generate synthetic features for training a classifier head. Experimental results on eight datasets demonstrate that FedPFT enhances the communication-accuracy frontier in both centralized and decentralized FL scenarios, as well as across diverse data-heterogeneity settings such as covariate shift and task shift, with improvements of up to 20.6%. Additionally, FedPFT adheres to the data minimization principle of FL, as clients do not send real features. We demonstrate that sending real features is vulnerable to potent reconstruction attacks. Moreover, we show that FedPFT is amenable to formal privacy guarantees via differential privacy, demonstrating favourable privacy-accuracy tradeoffs. 
+ + +## About this baseline + +**What’s implemented:** The code in this directory replicates the centralized experiments in *Parametric Feature Transfer, One-shot Federated Learning with Foundation Models* (Beitollahi et al., 2024), which proposed the FedPFT algorithm, for the CIFAR100 and Caltech101 datasets. Concretely, it replicates the results in Section 5.2. + +**Datasets:** CIFAR100 and Caltech101 from HuggingFace + +**Hardware Setup:** These experiments were run on a desktop machine with 8 CPU threads and an Nvidia 4070 with 8 GB of RAM. + +**Contributors:** Mahdi Beitollahi + + +## Experimental Setup + +**Task:** Image classification + +**Model:** This directory utilizes two pre-trained, frozen models as shown in Table 1 of the paper: +* ResNet50 pre-trained on ImageNet is used for the CIFAR100 dataset (see `models/resnet50`). +* CLIP, ViT-B/32 pre-trained on a web dataset is used for the Caltech101 dataset (see `models/clip_vit`). + +**Dataset:** This baseline includes the CIFAR100 and Caltech101 datasets. By default, each dataset is partitioned into 50 clients following a Dirichlet distribution with $\alpha$=0.1. + +| Dataset | #classes | #partitions | partitioning method | partition settings | +| :------ | :---: | :---: | :---: | :---: | +| CIFAR100 | 100 | 50 | Dirichlet distribution | $\alpha$=0.1 | +| Caltech101 | 101 | 50 | Dirichlet distribution | $\alpha$=0.1 | + +**Training Hyperparameters:** The following table shows the main hyperparameters for this baseline with their default values (i.e. 
the values used if you run `python -m fedpft.main` directly) + +| Description | Default Value | +| ----------- | ----- | +| total clients | 50 | +| clients per round | 50 | +| number of rounds | 1 | +| client resources | {'num_cpus': 2.0, 'num_gpus': 0.0 }| +| data partition | Dirichlet distribution with $\alpha$=0.1 | +| Number of mixtures | 2 | +| Covariance type | spherical | +| tolerance | 1e-12 | +| maximum GMM iterations | 1e3 | + + +## Environment Setup + +To construct the Python environment, simply run: + +```bash +# Set directory to use python 3.10 (install with `pyenv install 3.10.12` if you don't have it) +pyenv local 3.10.12 + +# Tell poetry to use python3.10 +poetry env use 3.10.12 + +# Install +poetry install +``` + + +## Running the Experiments + +To run the FedPFT baseline with CIFAR100, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: + +```bash +python -m fedpft.main # this will run using the default settings in the `conf/base.yaml` + +# you can override settings directly from the command line +python -m fedpft.main dataset=Caltech101 model=clip # will set dataset to Caltech101 and the pre-trained model to Clip-ViT/B32 +``` + +To run using FedAvg: +```bash +# this will use a frozen, pre-trained model and train the classifier head +python -m fedpft.main strategy=fedavg client=fedavg + +``` + + +## Expected Results + + +With the following commands, we run both FedPFT and FedAvg configurations. + +```bash +python -m fedpft.main --multirun dataset=CIFAR100,Caltech101 + +# FedAvg +python -m fedpft.main --multirun strategy=fedavg client=fedavg dataset=CIFAR100,Caltech101 +``` + +The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the `--multirun` commands above. 
+ +![](_static/FedProx_mnist.png) \ No newline at end of file diff --git a/baselines/fedpft/fedpft/__init__.py b/baselines/fedpft/fedpft/__init__.py new file mode 100644 index 00000000000..a5e567b5913 --- /dev/null +++ b/baselines/fedpft/fedpft/__init__.py @@ -0,0 +1 @@ +"""Template baseline package.""" diff --git a/baselines/fedpft/fedpft/client.py b/baselines/fedpft/fedpft/client.py new file mode 100644 index 00000000000..434055808f8 --- /dev/null +++ b/baselines/fedpft/fedpft/client.py @@ -0,0 +1,170 @@ +"""Define your client class and a function to construct such clients. + +Please overwrite `flwr.client.NumPyClient` or `flwr.client.Client` and create a function +to instantiate your client. +""" + +from collections import OrderedDict +from typing import Callable, Dict, List, Tuple + +import flwr as fl +import torch +from flwr.common.typing import NDArrays, Scalar +from hydra.utils import instantiate +from omegaconf import DictConfig +from torch import nn +from torch.utils.data import DataLoader + +from fedpft.models import extract_features, test, train +from fedpft.utils import gmmparam_to_ndarrays, learn_gmm + + +class FedPFTClient(fl.client.NumPyClient): + """Flower FedPFTClient.""" + + def __init__( + self, + trainloader: DataLoader, + testloader: DataLoader, + feature_extractor: torch.nn.Module, + num_classes: int, + device: torch.device, + ) -> None: + """FedPFT client strategy. 
+ + Implementation based on https://arxiv.org/abs/2402.01862 + + Parameters + ---------- + trainloader : DataLoader + Dataset used for learning GMMs + testloader : DataLoader + Dataset used for evaluating `classifier_head` sent from the server + feature_extractor : torch.nn.Module + Model used to extract features of each client + num_classes : int + Number of total classes in the dataset + device : torch.device + Device used to extract features and evaluate `classifier_head` + """ + self.trainloader = trainloader + self.testloader = testloader + self.feature_extractor = feature_extractor + self.classifier_head = nn.Linear( + feature_extractor.hidden_dimension, num_classes + ) + self.device = device + + def get_parameters(self, config) -> NDArrays: + """Return the parameters of the `classifier_head`.""" + return [ + val.cpu().numpy() for _, val in self.classifier_head.state_dict().items() + ] + + def set_parameters(self, parameters: NDArrays) -> None: + """Set the parameters of the `classifier_head`.""" + params_dict = zip(self.classifier_head.state_dict().keys(), parameters) + state_dict = OrderedDict({k: torch.tensor(v) for k, v in params_dict}) + self.classifier_head.load_state_dict(state_dict, strict=True) + + def fit( + self, parameters: NDArrays, config: Dict[str, Scalar] + ) -> Tuple[NDArrays, int, Dict]: + """Fit a GMM on features and return GMM parameters.""" + # Extracting features + features, labels = extract_features( + dataloader=self.trainloader, + feature_extractor=self.feature_extractor, + device=self.device, + ) + + # Learning GMM + gmm_list = learn_gmm( + features=features, + labels=labels, + n_mixtures=int(config["n_mixtures"]), + cov_type=config["cov_type"], + seed=int(config["seed"]), + tol=float(config["tol"]), + max_iter=int(config["max_iter"]), + ) + + # Reshaping GMM parameters into an NDArray + return [array for gmm in gmm_list for array in gmmparam_to_ndarrays(gmm)], 0, {} + + def evaluate( + self, parameters: NDArrays, config: Dict[str, 
Scalar] + ) -> Tuple[float, int, Dict]: + """Evaluate `classifier_head` on the test data.""" + self.set_parameters(parameters) + loss, acc = test( + classifier_head=self.classifier_head, + dataloader=self.testloader, + feature_extractor=self.feature_extractor, + device=self.device, + ) + return loss, len(self.testloader.dataset), {"accuracy": acc} + + +class FedAvgClient(FedPFTClient): + """Flower FedAvgClient.""" + + def fit( + self, parameters: NDArrays, config: Dict[str, Scalar] + ) -> Tuple[NDArrays, int, Dict]: + """Train the classifier head.""" + self.set_parameters(parameters) + + # train classifier head + opt = torch.optim.AdamW( + params=self.classifier_head.parameters(), lr=float(config["lr"]) + ) + train( + classifier_head=self.classifier_head, + dataloader=self.trainloader, + feature_extractor=self.feature_extractor, + device=self.device, + num_epochs=int(config["num_epochs"]), + opt=opt, + ) + return self.get_parameters(config={}), len(self.trainloader.dataset), {} + + +def generate_client_fn( + client_cfg: DictConfig, + trainloaders: List[DataLoader], + testloaders: List[DataLoader], + feature_extractor: torch.nn.Module, + num_classes: int, + device: torch.device, +) -> Callable[[str], fl.client.NumPyClient]: + """Generate the client function that creates the Flower Clients. 
+ + Parameters + ---------- + client_cfg : DictConfig + Type of client + trainloaders : List[DataLoader] + List of train dataloaders for clients + testloaders : List[DataLoader] + List of test dataloaders for clients + feature_extractor : torch.nn.Module + Pre-trained model as the backbone + num_classes : int + Number of classes in the dataset + device : torch.device + Device to load the `feature_extractor` + """ + + def client_fn(cid: str) -> fl.client.NumPyClient: + """Create a FedPFT client.""" + return instantiate( + client_cfg, + trainloader=trainloaders[int(cid)], + testloader=testloaders[int(cid)], + feature_extractor=feature_extractor, + num_classes=num_classes, + device=device, + ) + + return client_fn diff --git a/baselines/fedpft/fedpft/conf/base.yaml b/baselines/fedpft/fedpft/conf/base.yaml new file mode 100644 index 00000000000..ab1477bd696 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/base.yaml @@ -0,0 +1,15 @@ +--- + +num_clients: 2 +dirichlet_alpha: 0.1 +num_rounds: 1 +num_cpus: 1 +num_gpus: 0.1 +batch_size: 64 +device: cuda + +defaults: + - strategy: fedpft + - client: fedpft + - model: resnet50 + - dataset: CIFAR100 diff --git a/baselines/fedpft/fedpft/conf/client/fedavg.yaml b/baselines/fedpft/fedpft/conf/client/fedavg.yaml new file mode 100644 index 00000000000..10fc2b0f922 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/client/fedavg.yaml @@ -0,0 +1,2 @@ +--- +_target_: fedpft.client.FedAvgClient \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/client/fedpft.yaml b/baselines/fedpft/fedpft/conf/client/fedpft.yaml new file mode 100644 index 00000000000..6ef0f175976 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/client/fedpft.yaml @@ -0,0 +1,2 @@ +--- +_target_: fedpft.client.FedPFTClient \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml b/baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml new file mode 100644 index 00000000000..322c2d80c18 --- /dev/null +++ 
b/baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml @@ -0,0 +1,10 @@ +--- +_target_: fedpft.dataset.Dataset +name: cifar100 +dataset: CIFAR100 +num_classes: 100 +image_column_name: img +partition_by: fine_label +num_clients: ${num_clients} +dirichlet_alpha: ${dirichlet_alpha} +batch_size: ${batch_size} \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml b/baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml new file mode 100644 index 00000000000..96dcc50fa8d --- /dev/null +++ b/baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml @@ -0,0 +1,10 @@ +--- +_target_: fedpft.dataset.Dataset +name: caltech101 +dataset: clip-benchmark/wds_vtab-caltech101 +num_classes: 102 +image_column_name: webp +partition_by: cls +num_clients: ${num_clients} +dirichlet_alpha: ${dirichlet_alpha} +batch_size: ${batch_size} \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/model/clip.yaml b/baselines/fedpft/fedpft/conf/model/clip.yaml new file mode 100644 index 00000000000..23d350a2347 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/model/clip.yaml @@ -0,0 +1,9 @@ +feature_extractor: + _target_: fedpft.models.clip_vit + name: openai/clip-vit-base-patch32 +transform: + _target_: fedpft.models.transform + mean: [0.48145466, 0.4578275, 0.40821073] + std: [0.26862954, 0.26130258, 0.27577711] +image_input_size: 224 +hidden_dimension: 768 diff --git a/baselines/fedpft/fedpft/conf/model/resnet50.yaml b/baselines/fedpft/fedpft/conf/model/resnet50.yaml new file mode 100644 index 00000000000..260d9151e68 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/model/resnet50.yaml @@ -0,0 +1,8 @@ +feature_extractor: + _target_: fedpft.models.resnet50 +transform: + _target_: fedpft.models.transform + mean: [0.485, 0.456, 0.406] + std: [0.229, 0.224, 0.225] +image_input_size: 224 +hidden_dimension: 2048 diff --git a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml new file mode 100644 index 
00000000000..3a4e290ced2 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml @@ -0,0 +1,12 @@ +--- +_target_: fedpft.strategy.FedAvg +fraction_fit: 1 +fraction_evaluate: 1 +accept_failures: False +on_fit_config_fn: + _target_: fedpft.server.fedavg_get_on_fit_config_fn + lr: 0.001 + num_epochs: 10 +evaluate_metrics_aggregation_fn: + _target_: fedpft.server.weighted_average + _partial_: true \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml new file mode 100644 index 00000000000..c4982074633 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml @@ -0,0 +1,22 @@ +--- +_target_: fedpft.strategy.FedPFT +fraction_fit: 1 +fraction_evaluate: 1 +accept_failures: False +num_classes: ${dataset.num_classes} +feature_dimension: ${model.hidden_dimension} +device: ${device} +server_batch_size: 32 +num_epochs: 1 +server_opt: + lr: 1e-4 +on_fit_config_fn: + _target_: fedpft.server.fedpft_get_on_fit_config_fn + n_mixtures: 2 + cov_type: spherical + seed: 0 + tol: 1e-12 + max_iter: 10000 +evaluate_metrics_aggregation_fn: + _target_: fedpft.server.weighted_average + _partial_: true diff --git a/baselines/fedpft/fedpft/dataset.py b/baselines/fedpft/fedpft/dataset.py new file mode 100644 index 00000000000..733234074ef --- /dev/null +++ b/baselines/fedpft/fedpft/dataset.py @@ -0,0 +1,108 @@ +"""Dataset creation.""" + +from typing import Callable, Dict + +from flwr_datasets.federated_dataset import FederatedDataset +from flwr_datasets.partitioner import DirichletPartitioner +from torch.utils.data import DataLoader +from torchvision import transforms + + +class Dataset: + """Dataset class.""" + + def __init__( + self, + dataset: str, + num_clients: int, + batch_size: int, + dirichlet_alpha: float, + partition_by: str, + image_column_name: str, + transform: transforms, + image_input_size: int, + seed: int = 0, + split_size: float = 0.8, + **kwargs, + ) -> None: + 
"""Load the dataset and partition it using dirichlet distribution. + + Parameters + ---------- + dataset : str + Name of dataset to be downloaded from HuggingFace. + num_clients: int + Number of clients. + batch_size: int + Batch size of training and testing dataloaders of clients. + dirichlet_alpha: float + Alpha parameter of Dirichlet distribution. + partition_by: str + Label named used for partitioning the dataset. + image_column_name: str + Column name of image in the dataset. + transform: transforms + Transformation of each batch. + image_input_size: int + Input size of pre-trained model. + seed: int, optional + Seed for partitioning the dataset. Default is 0. + split_size: float, optional + The portion of dataset to be used as training and rest as test. + """ + self.dataset = dataset + self.num_clients = num_clients + self.image_input_size = image_input_size + self.transform = transform + self.batch_size = batch_size + self.dirichlet_alpha = dirichlet_alpha + self.partition_by = partition_by + self.seed = seed + self.split_size = split_size + self.image_column_name = image_column_name + + def get_loaders(self): + """Partition the datasets and return a list of dataloaders.""" + partitioner = DirichletPartitioner( + num_partitions=self.num_clients, + partition_by=self.partition_by, + alpha=self.dirichlet_alpha, + min_partition_size=10, + self_balancing=True, + ) + + fds = FederatedDataset( + dataset=self.dataset, partitioners={"train": partitioner} + ) + # Create train/val for each partition and wrap it into DataLoader + trainloaders, testloaders = [], [] + for partition_id in range(self.num_clients): + partition = fds.load_partition(partition_id) + partition = partition.with_transform(self.apply_batch_transforms()) + partition = partition.train_test_split( + train_size=self.split_size, seed=self.seed + ) + trainloaders.append( + DataLoader(partition["train"], batch_size=self.batch_size) + ) + testloaders.append( + DataLoader(partition["test"], 
batch_size=self.batch_size) + ) + + return trainloaders, testloaders + + def apply_batch_transforms(self) -> Callable[[Dict], Dict]: + """Apply batch transforms for each batch.""" + + def batch_transform(batch): + batch_img = [ + self.transform( + img.resize((self.image_input_size, self.image_input_size)) + ) + for img in batch[self.image_column_name] + ] + batch_label = list(batch[self.partition_by]) + + return {"img": batch_img, "label": batch_label} + + return batch_transform diff --git a/baselines/fedpft/fedpft/dataset_preparation.py b/baselines/fedpft/fedpft/dataset_preparation.py new file mode 100644 index 00000000000..83a9c5dd9e2 --- /dev/null +++ b/baselines/fedpft/fedpft/dataset_preparation.py @@ -0,0 +1 @@ +"""Handle the dataset partitioning and (optionally) complex downloads.""" diff --git a/baselines/fedpft/fedpft/main.py b/baselines/fedpft/fedpft/main.py new file mode 100644 index 00000000000..9860b1232bf --- /dev/null +++ b/baselines/fedpft/fedpft/main.py @@ -0,0 +1,88 @@ +"""Run FL with frozen, pre-trained models.""" + +import pickle +from pathlib import Path + +import flwr as fl +import hydra +import torch +from hydra.core.hydra_config import HydraConfig +from hydra.utils import instantiate +from omegaconf import DictConfig, OmegaConf + +from fedpft.client import generate_client_fn + + +@hydra.main(config_path="conf", config_name="base", version_base=None) +def main(cfg: DictConfig) -> None: + """Run federated learning with frozen, pre-trained models. + + Parameters + ---------- + cfg : DictConfig + An omegaconf object that stores the hydra config. 
+ """ + # Print Config + print(OmegaConf.to_yaml(cfg)) + + # Set device + device = torch.device(cfg.device) + + # Prepare dataset + trainloaders, testloaders = instantiate( + cfg.dataset, + transform=cfg.model.transform, + image_input_size=cfg.model.image_input_size, + ).get_loaders() + + # Define clients + client_fn = generate_client_fn( + client_cfg=cfg.client, + trainloaders=trainloaders, + testloaders=testloaders, + feature_extractor=instantiate(cfg.model.feature_extractor), + num_classes=cfg.dataset.num_classes, + device=device, + ) + + # Setup strategy + strategy = instantiate(cfg.strategy) + + # Start simulation + history = fl.simulation.start_simulation( + client_fn=client_fn, + num_clients=cfg.num_clients, + config=fl.server.ServerConfig(num_rounds=cfg.num_rounds), + strategy=strategy, + client_resources={"num_cpus": cfg.num_cpus, "num_gpus": cfg.num_gpus}, + ) + + # Save results + accuracy_per_round = history.metrics_distributed["accuracy"] + print(accuracy_per_round) + save_path = HydraConfig.get().runtime.output_dir + + strategy_name = strategy.__class__.__name__ + + def format_variable(x): + return f"{x!r}" if isinstance(x, bytes) else x + + file_suffix: str = ( + f"_{format_variable(strategy_name)}" + f"_{format_variable(cfg.dataset.name)}" + f"_clients={format_variable(cfg.num_clients)}" + f"_rounds={format_variable(cfg.num_rounds)}" + f"_finalacc={format_variable(accuracy_per_round[-1][1]):.2f}" + ) + filename = "results" + file_suffix + ".pkl" + + print(f">>> Saving {filename}") + results_path = Path(save_path) / filename + results = {"history": history} + + with open(str(results_path), "wb") as hist_file: + pickle.dump(results, hist_file, protocol=pickle.HIGHEST_PROTOCOL) + + +if __name__ == "__main__": + main() diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py new file mode 100644 index 00000000000..0514b2f3283 --- /dev/null +++ b/baselines/fedpft/fedpft/models.py @@ -0,0 +1,221 @@ +"""Models, training and eval 
functions.""" + +import logging +from typing import List, Optional, Tuple + +import numpy as np +import torch +import torch.utils +import torchvision.transforms as transforms +from flwr.common.logger import log +from torch import nn +from torch.utils.data import DataLoader +from torchvision import models +from transformers import CLIPModel + + +def resnet50() -> torch.nn.modules: + """Return ResNet-50 model as feature extractor.""" + resnet50 = models.resnet50(weights=models.ResNet50_Weights.DEFAULT) + + # Remove last layer and flatten outputs + resnet50 = torch.nn.Sequential( + *(list(resnet50.children())[:-1]), torch.nn.Flatten() + ) + + # Set the hidden_dimension + resnet50.hidden_dimension = 2048 + + return resnet50 + + +def clip_vit(name: str) -> torch.nn.modules: + """Return CLIP-ViT as feature extractor. + + Parameters + ---------- + name : str + Name of the CLIP model on transformer library, + e.g. `openai/clip-vit-base-patch32`. + """ + + class ClipVit(nn.Module): + """Wrap outputs to return only pooled outputs.""" + + def __init__(self, vision_model): + super().__init__() + self.vision_model = vision_model + self.hidden_dimension = vision_model.config.hidden_size + + def forward(self, input): + output = self.vision_model(input) + return output[1] # return pooled_output (CLS token) + + vision_model = CLIPModel.from_pretrained(name).vision_model + + return ClipVit(vision_model) + + +def transform(mean: List, std: List) -> transforms.Compose: + """Return `transforms.Compose` function for normalizing images. + + Parameters + ---------- + mean : List + Sequence of means for each channel + std : List + Sequence of standard deviations for each channel. 
+ + Returns + ------- + transforms.Compose + Transform function for normalizing images + """ + tr = transforms.Compose( + [ + transforms.ToTensor(), + transforms.Normalize(mean, std), + ] + ) + return tr + + +def extract_features( + dataloader: DataLoader, feature_extractor: torch.nn.Module, device: torch.device +) -> Tuple[np.array, np.array]: + """Extract features and labels from images using feature extractor. + + Parameters + ---------- + dataloader : DataLoader + Dataloader containing {'img': img, 'label': label} + dicts to be extracted. + feature_extractor : torch.nn.Module + Model for extracting features. + device : torch.device + Device for loading `feature_extractor`. + + Returns + ------- + features : np.array + 2D array containing features extracted from `feature_extractor`. + labels : np.array + 2D array containing labels of `features`. + """ + features, labels = [], [] + for dict in dataloader: + batch_samples = dict["img"].to(device) + batch_label = dict["label"].to(device) + with torch.no_grad(): + feature = feature_extractor(batch_samples) + features.append(feature.cpu().detach().numpy()) + labels.append(batch_label) + + # reshape feauturs and labels into a single numpy array + features = np.concatenate(features, axis=0, dtype=np.float64) + labels = np.concatenate(labels, dtype=int) + + return features, labels + + +def test( + classifier_head: torch.nn.Linear, + dataloader: DataLoader, + feature_extractor: torch.nn.Module, + device: torch.device, +) -> Tuple[float, float]: + """"Evaluates the `classifier_head` on the dataset. + + Parameters + ---------- + classifier_head : torch.nn.Linear + Classifier head model. + dataloader : DataLoader + Dataset used for evaluating `classifier_head` containing + {'img': img, 'label': label} dicts. + feature_extractor : torch.nn.Module + Model used for extracting features from the `dataloader`. + device : torch.device + Device for loading `feature_extractor`. 
+ + Returns + ------- + loss : float + CrossEntropy Loss of `classifier_head` on the dataset. + accuracy : float + Accuracy of `classifier_head` on the dataset. + """ + classifier_head.eval() + feature_extractor.eval() + classifier_head.to(device) + feature_extractor.to(device) + + correct, total, loss = 0, 0, 0 + for dict in dataloader: + samples = dict["img"].to(device) + labels = dict["label"].to(device) + with torch.no_grad(): + feature = feature_extractor(samples) + output = classifier_head(feature) + pred = torch.max(output, 1)[1].data.squeeze() + correct += (pred == labels).sum().item() + total += samples.shape[0] + running_loss = nn.CrossEntropyLoss()(output, labels) + loss += running_loss + + return loss.cpu().item(), correct / total + + +def train( + classifier_head: torch.nn.Linear, + dataloader: DataLoader, + opt: torch.optim.Optimizer, + num_epochs: int, + device: torch.device, + feature_extractor: Optional[torch.nn.Module] = None, + verbose: Optional[bool] = False, +) -> None: + """Trains the `classifier_head`. + + Parameters + ---------- + classifier_head : torch.nn.Linear + Classifier head model. + dataloader : DataLoader + Dataset used for evaluating `classifier_head` + containing {'img': img, 'label': label} dicts. + opt : torch.optim.Optimizer + Optimizer for the `classifier_head`. + num_epochs: int + Number of epochs to train the `classifier_head`. + device : torch.device + Device for loading `feature_extractor`. + feature_extractor : torch.nn.Module, Optional + Model used for extracting features from the `dataloader`, optional. + `verbose` : bool, Optional + Whether or not log the accuracy during the training. Defaults to False. 
+ """ + classifier_head.to(device) + if feature_extractor: + feature_extractor.eval() + feature_extractor.to(device) + + for epoch in range(num_epochs): + correct, total, loss = 0, 0, 0 + for _, dict in enumerate(dataloader): + classifier_head.zero_grad() + samples = dict["img"].to(device) + labels = dict["label"].to(device) + if feature_extractor: + with torch.no_grad(): + samples = feature_extractor(samples) + output = classifier_head(samples) + pred = torch.max(output, 1)[1].data.squeeze() + correct += (pred == labels).sum().item() + total += samples.shape[0] + running_loss = nn.CrossEntropyLoss()(output, labels) + loss += running_loss + running_loss.backward() + opt.step() + if verbose: + log(logging.INFO, f"Epoch:{epoch+1} --- Accuracy: {correct/total}") diff --git a/baselines/fedpft/fedpft/server.py b/baselines/fedpft/fedpft/server.py new file mode 100644 index 00000000000..00d88360e9f --- /dev/null +++ b/baselines/fedpft/fedpft/server.py @@ -0,0 +1,94 @@ +"""Create global evaluation function.""" + +from typing import Callable, Dict, List, Tuple + +from flwr.common import Metrics + + +def fedpft_get_on_fit_config_fn( + n_mixtures: int, cov_type: str, seed: int, tol: float, max_iter: int +) -> Callable[[int], Dict[str, str]]: + """Return a function which returns FedPFT training configurations. 
+ + Parameters + ---------- + n_mixtures : int + Number of mixtures for GMMs + cov_type : str + Type of covariance + seed : int + Seed for learning and sampling from the GMMs + tol : float + Error tolerance for learning GMMs + max_iter : int + Maximum number of iteration for EM algorithm + + Returns + ------- + Callable[[int], Dict[str, str]] + Function to return a config with the `lr` and `num_epochs` + """ + + def fit_config(server_round: int) -> Dict[str, str]: + """Return a configuration for training Gaussian Mixtures.""" + config = { + "n_mixtures": str(n_mixtures), + "cov_type": cov_type, + "seed": str(seed), + "tol": str(tol), + "max_iter": str(max_iter), + } + return config + + return fit_config + + +def fedavg_get_on_fit_config_fn( + lr: float, + num_epochs: int, +) -> Callable[[int], Dict[str, str]]: + """Return a function which returns FedAvg training configurations. + + Parameters + ---------- + lr : float + Client's learning rate + num_epochs : int + Number of epochs for local learning of clients + + Returns + ------- + Callable[[int], Dict[str, str]] + Function to return a config with the `lr` and `num_epochs` + """ + + def fit_config(server_round: int) -> Dict[str, str]: + """Return a configuration number of epochs and learning rate.""" + config = { + "lr": str(lr), + "num_epochs": str(num_epochs), + } + return config + + return fit_config + + +def weighted_average(metrics: List[Tuple[int, Metrics]]) -> Metrics: + """Aggregate with weighted average during evaluation. + + Parameters + ---------- + metrics : List[Tuple[int, Metrics]] + The list of metrics to aggregate. + + Returns + ------- + Metrics + The weighted average metric. 
+ """ + # Multiply accuracy of each client by number of examples used + accuracies = [num_examples * float(m["accuracy"]) for num_examples, m in metrics] + examples = [num_examples for num_examples, _ in metrics] + + # Aggregate and return custom metric (weighted average) + return {"accuracy": int(sum(accuracies)) / int(sum(examples))} diff --git a/baselines/fedpft/fedpft/strategy.py b/baselines/fedpft/fedpft/strategy.py new file mode 100644 index 00000000000..f9546140124 --- /dev/null +++ b/baselines/fedpft/fedpft/strategy.py @@ -0,0 +1,145 @@ +"""FedPFT strategy.""" + +from typing import Dict, List, Optional, Tuple, Union + +import torch +from flwr.common import ( + FitRes, + Parameters, + Scalar, + ndarrays_to_parameters, + parameters_to_ndarrays, +) +from flwr.server.client_proxy import ClientProxy +from flwr.server.strategy import FedAvg +from omegaconf import DictConfig +from sklearn.mixture import GaussianMixture as GMM +from torch.utils.data import DataLoader + +from fedpft.models import train +from fedpft.utils import chunks, ndarrays_to_gmmparam + + +class FedPFT(FedAvg): + """Implementation of FedPFT. + + https://arxiv.org/abs/2402.01862 + Authors: + Mahdi Beitollahi, Alex Bie, Sobhan Hemati, Leo Maxime Brunswic, + Xu Li, Xi Chen, Guojun Zhang. + """ + + def __init__( + self, + *args, + num_classes: int, + feature_dimension: int, + server_opt: DictConfig, + server_batch_size: int, + num_epochs: int, + device: torch.device, + **kwargs, + ) -> None: + """Create FedPFT strategy. + + Parameters + ---------- + num_classes : int + Number of classes in the dataset. + feature_dimension : int + Size of feature embeddings + server_opt : DictConfig + Configuration of server optimizer for training classifier head. + server_batch_size : int + Batch size of synthetic features. + num_epochs : int + Number of epochs to train the classifier head. + + Attributes + ---------- + device : torch.device() + Device to train the classifier head at the server. 
+ """ + super().__init__(*args, **kwargs) + self.num_classes = num_classes + self.feature_dimension = feature_dimension + self.server_opt = server_opt + self.server_batch_size = server_batch_size + self.num_epochs = num_epochs + self.device = device + + def aggregate_fit( + self, + server_round: int, + results: List[Tuple[ClientProxy, FitRes]], + failures: List[Union[Tuple[ClientProxy, FitRes], BaseException]], + ) -> Tuple[Optional[Parameters], Dict[str, Scalar]]: + """Learn a classifier head by generating samples from the GMMs.""" + # Do not aggregate if there are failures. + if not self.accept_failures and failures: + raise Exception("there are failures and failures are not accepted") + + config = self.on_fit_config_fn(server_round) + + # Sample from the GMMs to create synthetic feature dataset + synthetic_features_dataset = [] + for _, fit_res in results: + # Convert byte parameters into ndarrays and GMMParameters + ndarray = parameters_to_ndarrays(fit_res.parameters) + all_gmm_parameters = [ + ndarrays_to_gmmparam(array) for array in chunks(ndarray, 5) + ] + + # Sample from GMM_label pairs to create synthetic features + for gmm_parameter in all_gmm_parameters: + gmm = GMM( + n_components=int(config["n_mixtures"]), + covariance_type=config["cov_type"], + random_state=int(config["seed"]), + tol=float(config["tol"]), + max_iter=int(config["max_iter"]), + ) + # Set values of the GMMs + gmm.means_ = gmm_parameter.means.astype("float32") + gmm.weights_ = gmm_parameter.weights.astype("float32") + gmm.covariances_ = gmm_parameter.covariances.astype("float32") + + # Sample features + syn_features, _ = gmm.sample(gmm_parameter.num_samples) + syn_features = torch.tensor(syn_features, dtype=torch.float32) + gmm_labels = torch.tensor( + [int(gmm_parameter.label)] * int(gmm_parameter.num_samples) + ) + + # Add to train data + synthetic_features_dataset += list(zip(syn_features, gmm_labels)) + + # Train a classifier head + synthetic_features_dataset = [ + {"img": img, 
"label": label} for img, label in synthetic_features_dataset + ] + synthetic_loader = DataLoader( + synthetic_features_dataset, + batch_size=self.server_batch_size, + shuffle=True, + ) + classifier_head = torch.nn.Linear(self.feature_dimension, self.num_classes) + opt = torch.optim.AdamW( + params=classifier_head.parameters(), lr=self.server_opt.lr + ) + + train( + classifier_head=classifier_head, + dataloader=synthetic_loader, + device=self.device, + num_epochs=self.num_epochs, + opt=opt, + verbose=True, + ) + + # Send the classifier head to clients + classifier_ndarray = [ + val.cpu().numpy() for _, val in classifier_head.state_dict().items() + ] + + return ndarrays_to_parameters(classifier_ndarray), {} diff --git a/baselines/fedpft/fedpft/utils.py b/baselines/fedpft/fedpft/utils.py new file mode 100644 index 00000000000..c1a27c14647 --- /dev/null +++ b/baselines/fedpft/fedpft/utils.py @@ -0,0 +1,102 @@ +"""Utility functions.""" + +from dataclasses import dataclass +from typing import List + +import numpy as np +from flwr.common import NDArrays +from sklearn.mixture import GaussianMixture + + +@dataclass +class GMMParameters: + """GMM parameters.""" + + label: int + means: NDArrays + weights: NDArrays + covariances: NDArrays + num_samples: int + + +def gmmparam_to_ndarrays(gmm: GMMParameters) -> NDArrays: + """Convert gmm object to NumPy ndarrays.""" + return [gmm.label, gmm.means, gmm.weights, gmm.covariances, gmm.num_samples] + + +def ndarrays_to_gmmparam(ndarrays: NDArrays) -> GMMParameters: + """Convert NumPy ndarray to GMM object.""" + return GMMParameters( + label=ndarrays[0], + means=ndarrays[1], + weights=ndarrays[2], + covariances=ndarrays[3], + num_samples=ndarrays[4], + ) + + +def learn_gmm( + features: np.array, + labels: np.array, + n_mixtures: int, + cov_type: str, + seed: int, + tol: float = 1e-12, + max_iter: int = 1000, +) -> List[GMMParameters]: + """Learn a list of 16-bits GMMs for each label. 
+ + Parameters + ---------- + features : np.array + A 2-d array with size (n_samples, feature_dimension) containing + extracted features for all the samples. + labels : np.array + An array with size (n_samples) containing labels associated for + each sample in `features`. + n_mixtures : int + Number of mixtures in each Gaussian Mixture. + cov_type : str + Covariance type of Gaussian Mixtures, e.g. spherical. + seed: int + Seed for learning and sampling from Gaussian Mixtures. + tol: float + Tolerance of Gaussian Mixtures. + max_iter: int + Number of maximum iterations to learn the Gaussian Mixtures. + + Returns + ------- + List[GMMParameters] + Returns a list containing the GMMParameters for each class. + """ + gmm_list = [] + for label in np.unique(labels): + cond_features = features[label == labels] + if ( + len(cond_features) > n_mixtures + ): # number of samples should be larger than `n_mixtures`. + gmm = GaussianMixture( + n_components=n_mixtures, + covariance_type=cov_type, + random_state=seed, + tol=tol, + max_iter=max_iter, + ) + gmm.fit(cond_features) + gmm_list.append( + GMMParameters( + label=label, + means=gmm.means_.astype("float16"), + weights=gmm.weights_.astype("float16"), + covariances=gmm.covariances_.astype("float16"), + num_samples=len(cond_features), + ) + ) + return gmm_list + + +def chunks(lst, n): + """Yield successive n-sized chunks from lst.""" + for i in range(0, len(lst), n): + yield lst[i : i + n] diff --git a/baselines/fedpft/pyproject.toml b/baselines/fedpft/pyproject.toml new file mode 100644 index 00000000000..30e47defbda --- /dev/null +++ b/baselines/fedpft/pyproject.toml @@ -0,0 +1,143 @@ +[build-system] +requires = ["poetry-core>=1.4.0"] +build-backend = "poetry.masonry.api" + +[tool.poetry] +name = "fedpft" # <----- Ensure it matches the name of your baseline directory containing all the source code +version = "1.0.0" +description = "Flower Baselines" +license = "Apache-2.0" +authors = ["The Flower Authors "] +readme = 
"README.md" +homepage = "https://flower.ai" +repository = "https://github.com/adap/flower" +documentation = "https://flower.ai" +classifiers = [ + "Development Status :: 3 - Alpha", + "Intended Audience :: Developers", + "Intended Audience :: Science/Research", + "License :: OSI Approved :: Apache Software License", + "Operating System :: MacOS :: MacOS X", + "Operating System :: POSIX :: Linux", + "Programming Language :: Python", + "Programming Language :: Python :: 3", + "Programming Language :: Python :: 3 :: Only", + "Programming Language :: Python :: 3.8", + "Programming Language :: Python :: 3.9", + "Programming Language :: Python :: 3.10", + "Programming Language :: Python :: 3.11", + "Programming Language :: Python :: Implementation :: CPython", + "Topic :: Scientific/Engineering", + "Topic :: Scientific/Engineering :: Artificial Intelligence", + "Topic :: Scientific/Engineering :: Mathematics", + "Topic :: Software Development", + "Topic :: Software Development :: Libraries", + "Topic :: Software Development :: Libraries :: Python Modules", + "Typing :: Typed", +] + +[tool.poetry.dependencies] +python = ">=3.8.15, <3.12.0" # don't change this +flwr = { extras = ["simulation"], version = "1.5.0" } +hydra-core = "1.3.2" # don't change this +torch = {url = "https://download.pytorch.org/whl/cu117/torch-1.13.0%2Bcu117-cp310-cp310-linux_x86_64.whl"} +scikit-learn = "1.2.2" +flwr-datasets = "0.1.0" +torchvision = {url = "https://download.pytorch.org/whl/cu117/torchvision-0.14.0%2Bcu117-cp310-cp310-linux_x86_64.whl"} +transformers = "4.39.3" +datasets = "2.18.0" + +[tool.poetry.dev-dependencies] +isort = "==5.13.2" +black = "==24.2.0" +docformatter = "==1.7.5" +mypy = "==1.4.1" +pylint = "==2.8.2" +flake8 = "==3.9.2" +pytest = "==6.2.4" +pytest-watch = "==4.2.0" +ruff = "==0.0.272" +types-requests = "==2.27.7" + +[tool.isort] +line_length = 88 +indent = " " +multi_line_output = 3 +include_trailing_comma = true +force_grid_wrap = 0 +use_parentheses = true + 
+[tool.black] +line-length = 88 +target-version = ["py38", "py39", "py310", "py311"] + +[tool.pytest.ini_options] +minversion = "6.2" +addopts = "-qq" +testpaths = [ + "flwr_baselines", +] + +[tool.mypy] +ignore_missing_imports = true +strict = false +plugins = "numpy.typing.mypy_plugin" + +[tool.pylint."MESSAGES CONTROL"] +disable = "bad-continuation,duplicate-code,too-few-public-methods,useless-import-alias" +good-names = "i,j,k,_,x,y,X,Y" +signature-mutators = "hydra.main.main" + +[tool.pylint.typecheck] +generated-members = "numpy.*, torch.*, tensorflow.*" + +[[tool.mypy.overrides]] +module = [ + "importlib.metadata.*", + "importlib_metadata.*", +] +follow_imports = "skip" +follow_imports_for_stubs = true +disallow_untyped_calls = false + +[[tool.mypy.overrides]] +module = "torch.*" +follow_imports = "skip" +follow_imports_for_stubs = true + +[tool.docformatter] +wrap-summaries = 88 +wrap-descriptions = 88 + +[tool.ruff] +target-version = "py38" +line-length = 88 +select = ["D", "E", "F", "W", "B", "ISC", "C4"] +fixable = ["D", "E", "F", "W", "B", "ISC", "C4"] +ignore = ["B024", "B027"] +exclude = [ + ".bzr", + ".direnv", + ".eggs", + ".git", + ".hg", + ".mypy_cache", + ".nox", + ".pants.d", + ".pytype", + ".ruff_cache", + ".svn", + ".tox", + ".venv", + "__pypackages__", + "_build", + "buck-out", + "build", + "dist", + "node_modules", + "venv", + "proto", +] + +[tool.ruff.pydocstyle] +convention = "numpy" From 302543c9502e92f6887787e11d782d5b3d1ca1df Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:41:38 -0400 Subject: [PATCH 02/29] fixd model to gpu bug --- baselines/fedpft/fedpft/models.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py index 0514b2f3283..7ebc9beed4a 100644 --- a/baselines/fedpft/fedpft/models.py +++ b/baselines/fedpft/fedpft/models.py @@ -102,6 +102,8 @@ def extract_features( labels : np.array 2D array containing labels of `features`. 
""" + feature_extractor.to(device) + features, labels = [], [] for dict in dataloader: batch_samples = dict["img"].to(device) @@ -109,7 +111,7 @@ def extract_features( with torch.no_grad(): feature = feature_extractor(batch_samples) features.append(feature.cpu().detach().numpy()) - labels.append(batch_label) + labels.append(batch_label.cpu().detach().numpy()) # reshape feauturs and labels into a single numpy array features = np.concatenate(features, axis=0, dtype=np.float64) From 02724f9a600694feb1a62d5913145bc1cfa5a0f4 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:42:26 -0400 Subject: [PATCH 03/29] fixed config --- baselines/fedpft/fedpft/conf/base.yaml | 4 ++-- baselines/fedpft/fedpft/conf/strategy/fedavg.yaml | 2 +- baselines/fedpft/fedpft/conf/strategy/fedpft.yaml | 4 ++-- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/baselines/fedpft/fedpft/conf/base.yaml b/baselines/fedpft/fedpft/conf/base.yaml index ab1477bd696..01b1495c241 100644 --- a/baselines/fedpft/fedpft/conf/base.yaml +++ b/baselines/fedpft/fedpft/conf/base.yaml @@ -1,10 +1,10 @@ --- -num_clients: 2 +num_clients: 50 dirichlet_alpha: 0.1 num_rounds: 1 num_cpus: 1 -num_gpus: 0.1 +num_gpus: 1 batch_size: 64 device: cuda diff --git a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml index 3a4e290ced2..5f9e1d9e777 100644 --- a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml +++ b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml @@ -6,7 +6,7 @@ accept_failures: False on_fit_config_fn: _target_: fedpft.server.fedavg_get_on_fit_config_fn lr: 0.001 - num_epochs: 10 + num_epochs: 1 evaluate_metrics_aggregation_fn: _target_: fedpft.server.weighted_average _partial_: true \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml index c4982074633..5612193071d 100644 --- a/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml +++ 
b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml @@ -7,12 +7,12 @@ num_classes: ${dataset.num_classes} feature_dimension: ${model.hidden_dimension} device: ${device} server_batch_size: 32 -num_epochs: 1 +num_epochs: 50 server_opt: lr: 1e-4 on_fit_config_fn: _target_: fedpft.server.fedpft_get_on_fit_config_fn - n_mixtures: 2 + n_mixtures: 1 cov_type: spherical seed: 0 tol: 1e-12 From a7730cc3a35aab6efc581a1a018ddbcc006a2276 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:43:04 -0400 Subject: [PATCH 04/29] added notebook for visualization --- .../fedpft/docs/viz_and_plot_results.ipynb | 204 ++++++++++++++++++ 1 file changed, 204 insertions(+) create mode 100644 baselines/fedpft/docs/viz_and_plot_results.ipynb diff --git a/baselines/fedpft/docs/viz_and_plot_results.ipynb b/baselines/fedpft/docs/viz_and_plot_results.ipynb new file mode 100644 index 00000000000..866ffb5d8c7 --- /dev/null +++ b/baselines/fedpft/docs/viz_and_plot_results.ipynb @@ -0,0 +1,204 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 2, + "id": "5e0cf2a9-b782-48de-ac45-128726a26e64", + "metadata": {}, + "outputs": [ + { + "ename": "ModuleNotFoundError", + "evalue": "No module named 'matplotlib'", + "output_type": "error", + "traceback": [ + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", + "Cell \u001b[1;32mIn[2], line 7\u001b[0m\n\u001b[0;32m 4\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mos\u001b[39;00m\n\u001b[0;32m 6\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mnumpy\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mnp\u001b[39;00m\n\u001b[1;32m----> 7\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mmatplotlib\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mpyplot\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m 
\u001b[38;5;21;01mplt\u001b[39;00m\n", + "\u001b[1;31mModuleNotFoundError\u001b[0m: No module named 'matplotlib'" + ] + } + ], + "source": [ + "import pickle\n", + "import yaml\n", + "from pathlib import Path\n", + "import os\n", + "\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "7ea3e149-ce6f-4ba0-aa41-e0501a04efe3", + "metadata": {}, + "outputs": [], + "source": [ + "def saveFig(name, fig):\n", + " fig.savefig(\n", + " name,\n", + " dpi=None,\n", + " facecolor=fig.get_facecolor(),\n", + " edgecolor=\"none\",\n", + " orientation=\"portrait\",\n", + " format=\"png\",\n", + " transparent=False,\n", + " bbox_inches=\"tight\",\n", + " pad_inches=0.2,\n", + " metadata=None,\n", + " )" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "id": "4b010856-0d99-4d81-8fb0-7a927f10eeaf", + "metadata": {}, + "outputs": [], + "source": [ + "# Update the path belows to the directories containing the results for FedPFT and FedAvg\n", + "path_fedpft_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n", + "path_fedpft_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-44-20')\n", + "\n", + "path_fedavg_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','18-16-41')\n", + "path_fedavg_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "id": "2e3e165c-1ce6-4efa-a4e1-1372586e436e", + "metadata": {}, + "outputs": [], + "source": [ + "# load results\n", + "def read_accuracies(path_to_pickle):\n", + " for result in list(Path(path_to_pickle).glob(\"*.pkl\")):\n", + " with open(result, \"rb\") as handle:\n", + " data = pickle.load(handle)\n", + "\n", + " accuracies = data['history'].metrics_distributed['accuracy']\n", + " return accuracies\n" + ] + }, + { + "cell_type": "code", + 
"execution_count": 33, + "id": "77b70c73", + "metadata": {}, + "outputs": [], + "source": [ + "fedpft_cifar = read_accuracies(path_fedpft_resutls_cifar100)\n", + "fedpft_caltech = read_accuracies(path_fedpft_resutls_caltech101)\n", + "fedavg_cifar = read_accuracies(path_fedavg_resutls_cifar100)\n", + "fedavg_caltech = read_accuracies(path_fedavg_resutls_caltech101)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "6f4c87ad", + "metadata": {}, + "outputs": [], + "source": [ + "fedavg_cifar = [(1, 0.06924765515865097),\n", + " (2, 0.1315106765116743),\n", + " (3, 0.16773099181800039),\n", + " (4, 0.1946717222111355),\n", + " (5, 0.2171223308720814),\n", + " (6, 0.2375773298742766),\n", + " (7, 0.2597285970864099),\n", + " (8, 0.276092596288166),\n", + " (9, 0.290560766314109),\n", + " (10, 0.3036320095789264),\n", + " (11, 0.3128118140091798),\n", + " (12, 0.3261823987228098),\n", + " (13, 0.33745759329475156),\n", + " (14, 0.3477349830373179),\n", + " (15, 0.35831171422869684),\n", + " (16, 0.36679305527838757),\n", + " (17, 0.37407703053282776),\n", + " (18, 0.3817601277190182),\n", + " (19, 0.38824585910995807),\n", + " (20, 0.3942326880862103)]" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "id": "e1a678de", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "No artists with labels found to put in legend. Note that artists whose label start with an underscore are ignored when legend() is called with no argument.\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "def viz():\n", + " fig, axs = plt.subplots(figsize=(10, 2), nrows=1, ncols=2)\n", + " \n", + " # cifar100 - fedavg\n", + " axs[0].plot([r for r, _ in fedavg_cifar], [a for _, a in fedavg_cifar], label='FedAvg', linewidth=2.0)\n", + " \n", + " axs[0].set_title('CIFAR100 - ResNet50')\n", + " \n", + " for ax in axs:\n", + " ax.set_xticks([1, 5, 10 , 15, 20])\n", + " ax.grid()\n", + " ax.legend(fontsize=14, loc='lower right')\n", + " ax.set_xlabel(\"Round\", fontsize=14)\n", + " ax.set_ylabel(\"Accuracy\", fontsize=14)\n", + "\n", + " return fig\n", + "\n", + "f = viz()\n" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "92460065", + "metadata": {}, + "outputs": [], + "source": [ + "saveFig(\"FedProx_mnist.png\", f)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.11" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} From 056919e1b2bbcc1c07849d256342669e13a524f2 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:43:34 -0400 Subject: [PATCH 05/29] completed readme file --- baselines/fedpft/README.md | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index 3f045810835..3370fd22d8f 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -51,10 +51,10 @@ dataset: [CIFAR100, Caltech101] # list of datasets you include in your baseline. 
| number of rounds | 1 | | client resources | {'num_cpus': 2.0, 'num_gpus': 0.0 }| | data partition | distribution with $\alpha$=0.1 | -| Number of mixtures | 2 | +| Number of mixtures | 1 | | Covariance type | spherical | | tolerance | 1e-12 | -| maximum GMM iterations | 1e3 | +| maximum EM iterations | 1e3 | ## Environment Setup @@ -98,10 +98,13 @@ python -m fedpft.main strategy=FedAvg client=FedAvg With the following command, we run both FedPFT and FedAvg configurations. ```bash -python -m fedprox.main --multirun dataset=CIFAR100, Caltech101 +# FedPFT +python -m fedprox.main dataset=CIFAR100 model=resnet50 +python -m fedprox.main dataset=Caltech101 model=clip -# FedAvg -python -m fedprox.main --multirun strategy=fedavg client=fedavg dataset=CIFAR100, Caltech101 +# FedAvg with pre-trained, frozen models +python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 +python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=clip num_rounds=20 fedavg.num_epochs=10 fedavg.lr=0.01 num_gpus=0.2 ``` The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the `--multirun` commands above. 
From 6d9218e5a75803dc02a480ddf435415709c6808e Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 23:47:09 -0400 Subject: [PATCH 06/29] fixed cofig --- baselines/fedpft/fedpft/conf/strategy/fedavg.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml index 5f9e1d9e777..166bcd10aef 100644 --- a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml +++ b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml @@ -5,8 +5,8 @@ fraction_evaluate: 1 accept_failures: False on_fit_config_fn: _target_: fedpft.server.fedavg_get_on_fit_config_fn - lr: 0.001 - num_epochs: 1 + lr: 0.01 + num_epochs: 10 evaluate_metrics_aggregation_fn: _target_: fedpft.server.weighted_average _partial_: true \ No newline at end of file From a58786b2e2f6e6737f75ef5c66182b94be3c5b44 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 23:47:39 -0400 Subject: [PATCH 07/29] fixed readme --- baselines/fedpft/README.md | 18 +++++++++--------- 1 file changed, 9 insertions(+), 9 deletions(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index 3370fd22d8f..c25f6de8f71 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -75,19 +75,19 @@ poetry install ## Running the Experiments -To run this FedProx with CIFAR100 baseline, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: +To run this FedPFT with CIFAR100 baseline, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: ```bash python -m fedpft.main # this will run using the default settings in the `conf/config.yaml` # you can override settings directly from the command line -python -m fedprox.main dataset=Caltech101 model=clip # will set dataset to Caltech101 and the pre-trained model to Clip-ViT/B32 +python -m fedpft.main dataset=Caltech101 model=clip # will set dataset to 
Caltech101 and the pre-trained model to Clip-ViT/B32 ``` To run using FedAvg: ```bash # this will use a frozen, pre-trained model and train the classifier head -python -m fedpft.main strategy=FedAvg client=FedAvg +python -m fedpft.main strategy=FedAvg client=FedAvg num_rounds=20 dataset=Caltech101 model=clip num_gpus=0.2 ``` @@ -99,14 +99,14 @@ With the following command, we run both FedPFT and FedAvg configurations. ```bash # FedPFT -python -m fedprox.main dataset=CIFAR100 model=resnet50 -python -m fedprox.main dataset=Caltech101 model=clip +python -m fedpft.main dataset=CIFAR100 model=resnet50 +python -m fedpft.main dataset=Caltech101 model=clip # FedAvg with pre-trained, frozen models -python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 -python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=clip num_rounds=20 fedavg.num_epochs=10 fedavg.lr=0.01 num_gpus=0.2 +python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 strategy.on_fit_config_fn.num_epochs=1=1 num_gpus=0.5 +python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=clip num_rounds=20 num_gpus=0.2 ``` -The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the `--multirun` commands above. +The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the commands above. 
-![](_static/FedProx_mnist.png) \ No newline at end of file +![](_static/FedPft.png) \ No newline at end of file From 1127ce6aaa84c5f6085910535880e81e821b893c Mon Sep 17 00:00:00 2001 From: Mahdi Date: Mon, 15 Apr 2024 00:12:08 -0400 Subject: [PATCH 08/29] add plots --- baselines/fedpft/_static/FedPft.png | Bin 0 -> 28010 bytes 1 file changed, 0 insertions(+), 0 deletions(-) create mode 100644 baselines/fedpft/_static/FedPft.png diff --git a/baselines/fedpft/_static/FedPft.png b/baselines/fedpft/_static/FedPft.png new file mode 100644 index 0000000000000000000000000000000000000000..76028f4f24b02b424b9bbbb2ffff0a37d260f45c GIT binary patch literal 28010 zcmd43WmHye*EV{Ql2QsH2ndLDmr6<_-QAMXNH-!SAR-DS@|J?VuAAN>5Ue{XdJkL3gdBloRQ;{RYyN-uKp$HY^r8Q6}3>y>* z4F?As{$#@QSv&l8$3sTXL(|#X!^_<5AxhcY!{w2)$0IunI?so0?sm>je4Ij@{OokL z9v&|4ce%J6|K|rdo!xA>$isyD;X`m;r+CD^WF*$06U!iX!=Pnwd_>1_)jqwsPIt9{Jhwob z&A_Ipgsd|JJru8(V4)!>O(^6!3XSwd%YnObE#o(RAtD~HjkMn)a`ZT%DEfc@46%^~ zT#}If_YZr2%U^O%su<}N8PA$VTONy#*6x&A4C2B;m71Z-}Tyf)}Maw z^^vQP^AtgpbZ86(*Q=unLVYDA0!C6?LFcJrTYP-{FlqWhL#1Qi*yrZvuCmx1ckf;& zV^Rvv&%a$NMAWd`e@}5jk&*NRk&TT_?q8E8e_S>; zHhD(U$xp6Qj@0ku;&sL&a&vD@dCwC*dGdsgfkEownQ^_Rc}FBkfoZcCBdJ1`^T(8w zlw?sqK_eq0Ge<{4Q&UrT)&<4~Yd@=Or<+6{J$f{=w)U)0Gk@;y>L}Jmea_B7N=XUF z-N%2Pv_}v*oawpkNV6o!mpf03B`xmcq$DTntp#L?`jMNPn|mMai(~`*UPj+vD6#w)j-p0YlZ~sxG`+&Ci)#=|+(_|4JUVndoGbbk#tE@`%c5H7y zzxLi1OYE7MnF%gyI>xiMw!X$=Asw>Xi5b62(x$Wd9p32Hf zm!+?iU(@c8U7VkA1)gqyzJD^mzM&zT=ya7$e75bxM@K4hE|X$U(^s!v z=`{z6qUi42p}cgNx+PmChWN&fSjUNvEG6~UebowCezklcdonQRmGJBuk8n=YQv{?o$6h1k7 z%ktnma~qrd$_AYh1HDSCD2>#Zn3!JQH|PJBi{awRA}p6)xfz;>h{ymuqjgLZMY%ZY z*5kjcgVlDL-oCzb`|A@}r6=t~;%0LlQQjA42PD+g&%WoYTK*X>lz;G`9X8a}RT&wX z+4{{UsrILYv+L_6yB7TX{8#WPIHk{y|MHl(VScKwXJBE$MLzmuvpF6fj`>)*xqVH# zc#zoA*A&h7^B1sD5?}zG(5Sjno+>s?EX8h+@ce&)7{Ii?h}3uIN4|6AR;8Z zio*GpAzQzpbm4ScC5_q5_-ON$kST8H zVQnt#`p}q|2MH&1XS3z9yz-_2f3KP}2gVXo3BI-Nd&Bx=^+!=eyx4KU@MoXHt(z*D zVzD=+o|<((zxgTXLaaYSv}o`nX%y!AL`?)8&L^+Uj3HhjA)(~tD`(RVn^TS40s@_f 
z+w)f)b#!#D-ScG6&d%Oi9%MjCC@SJXo8h+Tz!@7KXC3)_a3HtXn^fU<;1p}YNeG*3 zY+{1p?p=dIQ9eGhtgNg8-7*?>4vyKSrKkE;);Ib1H0>HABXO#or)fMrJqwI#d9U-^ z2K($T6;j*4#d*)i3YEk0#0gciGWz{3Q?AUUQSF1h_So3iTUfF~C~H^0w70c!yDurB zB+~Cbz9J>ELsZn$-_Pk0S&$dRM$hZi*(aVV=y-p$)OdDz8Rx-+2mFu5h#f|XS@y2M z9+v*{iUSR0+4W4lforkxys+Rvuy$-r@7axeQ{pUxK<$PBxw~&yo{sxpFH(Y6xKc#mPc}a;rp{1t> z*V>v|*rxk%^k$gH^1w|fM%hp}a>rGn7W4`zYQNV~Zy?zitH3}$>E31ohJ%9x94`u} z&EF3{?GPRQc(2W-?yp;F)Jo;tkfr5nYwM>{5tosrd){M(LqMQa zA6ru+M9ygx`TRLCatk-^dZ199JOVz>7#&#&B?cebzP#q*2|V@o_VKwXC`b;)QO3aF zIy*c2mCtFs5Aoh>7d;&qQ0wUEFzbxIiY#rZaeeeJxt+8`@!Lm-hb@?L7MI?Tzw%R#E8+00i028R2umd|_!weSbav_)inr($e zFNhrc_t#R8JwLngtG;d2G>8N6RTgxWP$ecd?vHIx1q6`_KK`Ld@ud0UoDD@hQfkbG zbAQ9-DV*2B;(N9Obge&s*0#*Q#zdK~ja9T&*?a>qhB-Ue8FL>_x7JgIM?WiNxOsR; zph%TepN)TTz(TcU2A#7&p=CF1YUsWhn|P=vL}G^$cB0A`NXb`x z5wy^b+TGdRB@+=9O&aIFF`}1tAQ%)B)Y{P@z5ZP0=;Mxg?5}z+-SO$YmG4-ZnwqnV zUtZe>mBC$OLkGyq%d>xdM_3p~>M4PGz0&LU>qOMTbSPrj^reHxf1V2T?kbt=e7j7+ zWujFr>b)gVURg;x<+mxC`&j7F7@Z!Vq(&ydR_rL^z{A-~xsMHNoH#z!)vgs@U%cx1xvL%nW!lS^S5O1JLZ+|-q@<;v3`vQlbc$b`hB=IunnOR2 z{u^=mMl@VLwWzPwL({^-LKhd8;IJ?Z*isRceAaJamkGPfNJQN(l~+~OP3!#frMFkH zLS(ZUtE4D4rG00j+#CbW(#-O5Bsqrx9WO6wm37~J7ngF2bWy+kmWc@}6B84_A6g=H zp6hrL)W_%&Jh-1jFfIYoj28KLy7qHA=%PgUN})>2PGsVP@bDpv9MKHM!xSk%Sd+>F&^FCz&=&W0dJx9iy#eSQ7efh;Lh@aK5i`J%F>`}gmM z%FgfNTR1wFxH*!eI`>X@0=`^u*#644h>VHR^fmcl|AW3}WweYoG&B@21e8wB8EAxZ z1_p05=xdQmGWjWsUz)oNjuol}?z|%K%=a0U&}H|fuabb0x#1}jPz#s0bnyEhy09Bm z;~00+oC~m+o=s^(+3k#%#cg_yy<0}AUot~d;+Wx8&K=u9Su$-Unsy=!8 zl%ACp4-lu~7gz~(xHOB-w<~^zIy&S~Z(ctAaWxO-G{tX=o3UIb4a_?J!H0pbFWv~= zQFeQg2Y(|8PZVao+^i5EJ7huNMC;o5LDL6d_0;BD29yd)jlwG=BqXeS7jIHh%wZw* z8hr&UEG=jM{CUqjtavYnhm8&YTc)_K{g>4E)zPxDJxX~o{GI5lY+JJtwAl)YOu2W( zRmTxAX2vnD^H4Xs#FW@GkfT7xZun7YU2I|03`U~);X+Me*EvjNn%dfO zSsVX=52vxS!t%2je1ByLoE`W$*O?YH7$mDK5FGAu{ZB(s^W5{#=|U@Z$2Iiy^V*ZA zWH2>3{iDikmPYTY4vy@Or(Ru1`KS*!enTIyoy$G7A1RJX zOQU9FWNaB6R3FTMJ(QEfSkg!vxHl+wIDK)R?>zb-U%cHWmVf#0=oREsQ3G&RH(|Yx*85Lo$Wy=VvG3PTxxmg^&>v 
zkc@?^^;^BP1WDiD>0Vp&@#4tVfg?D0e135_Pb3m}dJQ(BR-GvhU0{qbG}g80=H>zX zH-Ocmpw(NphGGc=A2LVqz?I*5iW(p=z|ZI*X)*wYy6l&NyJD%@zkVfv^4f8U*8i;@ z7izN3!)WHCCSYPZ<=bLN3@KL=;WJPkxQQk zdTr0iXQs@90A zs;Zp5Ju9l!w!GUl{#2l)rA5%HY0%k+amGZi=w-zuRx}i_J%!aO zupfH2u_V_k7^{&B4u!RaMJR01d8odh zytlJ^eQ(`i$SVZslClqR9nL?cUl?&F$;LZVU2R%?Dev?XHWxSD{|sr%$-z z&9F9Cpi}ZjG4QqNC1c{FMasT60&IV`6@$ylWXcZ$^CVRt>F41;D1D@qkz<$??llNgIXt89>A z#D8XUtb*aL=NgX0sh}gw8Ois&I7vxK)yhmnPd9@uq=17Hd^GmfqZoP{0dy!C`1{;& z6p_O@?Y~RtyT2A?(&(F1z!mKPLpKgCZtH8)z$kc(mJ8hpV~u`7Oe$%SWVcliWC1&) zwJ%i&nFgV=Ug0pPZfOh0cl|TW0{H0?Ou6#%@-2Ww)QfaDU;=C!u7zyC56JsB90)Sz=8!r4+uzk9v8CgA+&w=mEt^jyHk%|ls&d7h|0 z?asU8X9}7`G$Ji9wWB1|w|d-P*Vo^Zjibhupnl(EJ4g>4fdxG9t=-*r_*)f^S9SdN zf7&RHhTpn*f07s-d04RU%Pm;@@TqAhq(*;oxp|pdI2gKcp=f)a zBl3{oM$sZi=VWAMEdVY7C&vNHTDUu}iM#T+R6d)2vMIn22M323xCu*+ zKiO=)FzN2@Rx8#W&^m_kmi1(^#u?ZasQXeOpGAFka!?XTp~8~vPFFNdhf>lyJgjw1 z!2V^nve=EXIyqb0f}wp_m$qk=e3(Ge0)wbw`?E3^?xl2JFJCp2eEg#$8;riVmoHzw zZ)W!P`HL4CGn?ufSbx*$aP9*yIpomn4Nno@(!836X1Y z@$#Y&JDkC|$;+!@*9apnZfR+0C=8nxtiKWND-4^E6nQ8>E4Oxa$!=|LlfZaW=1K|=AeKv1SOhd<9@wE&QA9P^b0wN@( zwX$Gj#Q_*SqNfU38+NH-M;TonY6m#Dv|>TtpldS%5SC^#OZ- zG;&B$9pb?yC5{y}uN8BlMqPtbjSIEWF~Y`UjCQ>9e3)}Te?RG?s-}j<%+gYxH&{qX$?)ekXeg~qw--vCf$K_xWk zL%vi}%&22zL2-wcFP%6ReW>v^GW0Ii@AeC z(S9){O3%Om$R3Sc7?b|w_9_d&yz#$$jp~sg+}5JyfEWo$0*U?iJVJT~hNN-WaszqF zRH8DV$sBheT9^C-gyk&KEt`WiMs*bK0EG|@>?=BP1miJi4KGeI$;L7 zIBaMM*kfCLLepk2bVE7+{@_$vI>)qO>EGobd%ewxw$5kQ`ojcNY?%mkxP^+Dl>hG% zU3N6RsBz6I8Hsw~KNasi&PWNy8$m1@(V<6Ya`7F1M@zmt8o_t|Q~L@U9;jXdJ?E1j z#qwnBGWz-;gKJ~GSLeDnc5GyU(!Wn&-7GE%ng5KYsyZ{(*oM#VWA3?`@#%bfer_K= z#{Hi{$O>CEBS6TRP2@6~U zz6azJeh1d(veG#=vc_q^iQxehh0+&VR>pM>3e5e{prf5zAPA@fVGqkb7b`T?0^&k1 zvjMCnMna85Occq4g@s-+3CT*zAh`{+8DJN| zzP9$Oo&x6BHYk693Jkgu$Vf;iQ9?pyU&t3fav1*mu!NK*4CX?pW(e&E^e!5z*tnh? 
zc19Oe0Un!v>ZHFyPLq)^I?MyC0xtFv%G=xf<-=~+4NvC>8O#>s7e6L2_`s^l$3LqS z2418s_rYs!uMH!aR6r*%*vAzVFn^e!7V##ALoNw40Q6bZrAwC(iUU}!r@*$1JM!}J zC8VSjdS|?NfsO(a4gT$nGi*{;_{b6e|2ULKH3QiVRlL4_F^)7eEwNM<_wf1Y=^MFw z=h%S@0|Cy(%}vAJ%gwC~Ak_~i_suC$YVkm7s8*lhfw~-Q7%OFnAj2}S?DjSKl~%aq z?0Rp90@ucPfGvM1d=5L8)Y*`xLcAI|%4@3YY<8J>xw&?CUf{7_cpS;ap@J?r&L>I? zH`wFY2O=YT)6~grZrudM5Xc{3BuRkZf{rKo=n?xXPGbWzS3!6dn3pcGW#s4NwDk26 z0wMGSDLPWh_>##|J#_p5!rny1Lu7{&(O$ zvw3Y^cBV8oiYh59lhD$Z4b#xlA}a2OiQ!^>vZbXZMX76zjg3$cBY@1+)6*+>WNBxI z3$%BVr@Q-ZwzytSKE}w1Jw@TKrssdZ+>1R<cpMy^{K$0T#npU zTH4nfzAii*3*=Q|N=gL2Vi13O27rj3nOS~a5a^(GpxEKw%`E6uG<;6>9pO4O9nE!E zS4YrH1F)#YOZD&j?cpqsUriRk$H5tJVuyXRvSN`jxFBYIgkN2191?V1SZ+#3ny}wv zHFt17H^9o~HD}z~Bi!@zdh+)=NpIb4N>1%_tzULhqTnf74i~7~4rXH+e6SC{%BDjn zAfV0T_YN3vBV*$Vs~%EROO8TfIdp1&n9-AgUf!6j4f`g3K@IKlhm#q6wYld(sr9t* z(izikQCTnvLozBVQog>pq>~FJa5krA^0ud0*vf>S*I;F(Wqo4KUtGu;y~YVGxABQC zaYtK0!5jPnenH$WQ;FDhaaJ6>k^njvafAEIv<6Q!DX^X5@RGPQU=ro6Ot z9SN~o0~hMoq<7b|?np+a=+4&-IEfcjWDMk*R@Bcv3S$Jneft(Yf(KfnMs5jwA~NyE zy}RFPxxZ^dq&qMc1a-rh#VM<^?OFHRg$301wjd7C>zV!=i}dU~>dh4jjKQ@&gGBiF zeIwr&%&nPdYH|?%51?zdY4cN*QnXPs`?bfe)&s*=Z4(maD#ykqSEBWy{E(1n3x}d| z@}gyuPPf-mjx!g5R1ykP8j+f}gl6yU6IH{vx6>N{>vVkB_w^-yF1i!dqk$X^$~fxU z_zcm;zc-@6h+*7o`u6VzA-g{P`Ik1tj8ULuWp%~>Ow*30^OueNd$+-)1og>j=`%Ze z3W`N~rSr0w2P^&T>OU=A^BjEetCO!)a4+Y#2?3~o+rbL@W8t61nh?B8*qB>QZvDg(t?xP#-^1 z+skA9yK|d|d*>H1grXuHg^&4biLOIMPtq>ZF<%+V1=dpvX}Lhsyn{c&Ds2YE8Q>!} z5v|x0s2L!DMc#Vws-?I0J;6IB%a>^cM$Md4+cTL#9ieOE0(7@zrW00V;ap{!_fDI9 zV2z>U6}!vP-=8T?1Z;&dO$KAX#e&`vsLI^N5dadl5NEZ)Q$b@-xF||iiOqJW3cK9vWz_MZdm{E zKB|H&$?I-FN{!ujY|vsPfq;>Hb`1??Lt~o$@`C#Kl&UJdwA#A&%|zFse)7`uQf{5z zdH$SEY;GR^;s};@xcDbcd&H`clkrmC|F#XnAdGlv5Mu#Yn}~>j;=TfHanwM`N(2)v zGDefL<^1T<;ikB&j)d}XDIvcj9={#>a9O6IOV0(z>dnV<0vf;1FRrt+e~Q17aPzyJ zt02h1YZEm@P?|bnow$KQ!oUx!7&imxCLJA1A$d-?XM-m`4$W#LF_In)LNj-@~CiFM_XxD|v2MQ8`vzr{c`#A&FI$K9yBOR=$`m8Xf zIZP#{Dl_mH7jz9#a34g2!fpmvGX};MpvdBbgHg|}3*hbV@7EDzt>xxp7}wi-(pH^f 
z8H|?B>00fu_(Vo3Di8-#aPi-(N_ze_)j|8c?j`CQXmWCtl~rWV6X$W<-PdX5G~o%r z;0Y8;NMd55Mtx!;83=@ho~giA-vmJLUrK#W8eqvb##o)wPF||zs*V+iUb(ohN^kow6>rRi+R8*BJyH( z;~eYlu>DE)p`i2-)*8kNxP4-f_eL_Y)6n(k@aFR8Y z4pn9nC8KSWcF4SD;}}$7V}6tCBkK0;#h~4bwHcJmO{UAvbvT-uXJ02@z0O+5OT4W* z2Xe<}0Q|G7t1v<2pg_rI*6GvZvntRteTpb!FVI5Gtp8ctYzrb|+U z#}Ps!>f2(Jsa=J}>}U!d$fnip+Y>a9DkTlxSlhIxrMrK7DqzoezPcWJkxAW!7p$pX z&n^6)yPwEpxqB#ErNmX@5A$d__>_RsC-B=}Yi;n^E%(|qL9i(>TgfnXFe$%z0`l|A zhkD}_#HeT2vV5`@m%8|@r7=^Ks96seqIRTAY!^8isztFrrW?=7=uG`ybj0R&Tx9a| z^Gkm7hF(m}q)=2$jHbW8-@fK(@4G4wkco(pgF>_fkS-8j>u@1a)yyK>H#QEeZR{M{ z5fN`vQ(ymSH?XVWQjPu-^Hs@pXz_IPsc69apXVhdA+oVSVZ=D5HFbP{kih>i$?+9g!C z6|eMvKo@K)R;=X0LT^ibN#g3=FX~Z?jW&8y^lKv=eWf)onPbU%ii1F18` zdKKsZ>7##Aot>S5`Vpc9$IXg;$J zT^)__`d0quhkFc{&&`nn61Cb&CrhU69hv-2eSd!u;LV>v8G+f%j~EjT{3dP4nFf_E zS2F}`a>@L5q#IL>G0^)~c-iT*Equ-l0%mVr+~F+sIC(AKQKiet`GEwd|FSProEBIcpdsV{$%D2#0N0C9k>eMg3LGf} zkTEw9LW)xHTqZg;K*riT4=YILM7_K+a~|NDY6^R_XKK+gTO`u_6I`HI=}$%hxZCSFL*HL7_VbpHC4@c>2#r^^Cv&%+canh zSAx#|QXTIHq<+8pn(wRf)z6K7E#n_rx?O(9CeY}iz}@}(CgM=K%N*>gOD7OpBUmrx|}a#n&K^2F4fgz}0cDnnG0qi#W5+?R2R zs^AklM<;#JTl8WBfxvglb)P4-0vVamzvrQWs$X+*6lK$Myf@o77S;U;o`Azp4lZ2W z6DSmgH^g2fB!qw_h)C0Q1YwbQTgL(}yG$_Kk*)S^kt>q0~lo=43NOXllUpk+gI!Y@tVAlX(zp9wG-J;5Z{A zBl_Xs;2`26hB6)sHi1991lf38EDE)##Ea8q_3Z=g#yUM)AKxW%^PM1vQEYbhYFhCG zK^`H>n%k-!xT5=;-yEx|FkW#{*qAQhs?zgX-{tC$qrMXgE*eB`e*9-R1O`4>1J{dl zm~U+?q4Zqivwj9^`yMKpykg~js~pT4XEq9RpJsi|=p=4Nc92w6tf4d`X&b%)mMvL-7ZXd;3j! 
z8ueqtf(wtig_nlGiyR$k=|>??Svi-O=IIinY&w_vwVN(`cHo$G;=Pq6Y=l0OLk5p( z2UucKGFo-9sHm1CwwAxEy)t_DLzhmT%cH!!(0&x%erqY`$8T@-p1I?__IKko=|wd6 zMDx1G57N*tzKOd}*#AHeJVaamWf#%^m1{`z%tKZ-1btNF@iguJwt$x4H; z-`+9_II*7rj=iCpAtI@x^Q!kQG=`r)f7V?NFZhZRs^_uD)iF26Khb2Zj7+Kp+C?*~ ztvMR&ovK<>uy%RP7uaH_YW~eHiwr6BnrW6N^_|Uu+NXq-1F#+j9H2>qHvo?7;PWH{ zPz1za8%&RY!v>4>`Nmw2g?KG^Q@n5Jo!?(O+Rd&h(ZKTFRh}uS3AXO*aA>>Ek9x23 zBVbbc>Q(o|*#yOqaQqOiCgN{tXmb?m-}7VE1qF{|<0A`-;e;827aPPM5+HMcod&}e zCUAa|^71$tVgb>xQ)Z#$v;zrH3iYA-J`>rur)MW+JM&$HbQ~qi>qXia{{9{J;T8>F z^D&Sn2`n+S)8owjtSm8fpSUi7F6e}5@L|XlIM?I1-{ZsKv+nsGY{bGhv5aF%qEHA) z1T9Y{S;uF+5B66<`!Rd?5DNxO#I|?cvBv$k3RvY3nW5uz-VRIvmxzKH?#=PFBw%Z&K6&TpJ(o| z1^d^?UK9NVrlCn9@da|Q@=Mqj2p-yF7>i z{wS`&bFcOBaG?AVI<%>&Nw2~J3v>#X)e#QiyLZVy8G{0B{WUoR%GJx|Pf*ktBl&Li zehW2*k-8e@%D#^X;xLW9&XP&u?mFl=DXryJ*RPyY8$%HiFV-8-WEtT-%}bvht(gCh z(9_tROzxPPqT%7;=|xLUK^$|p#xE)#ejz3%4(74!LZLuGivehYSYiQS#*I4yU&DP7ba zwn!0-g{P1JLmFr}i1T>60dSMB?;bO#0GGg5AmX=AfLJvFIL0(?0-J~g4ZvllT@6_c z#NiI|4XaB%Vn`hvBmsH96SM++QCYx~yt`lLQ~$%`zB02HITF0}^P|Yn!yqdwggk8x z$0s#vU>0+l9$Aa~LPLXoUGU1xI&i852`H|zP%e3)m*TfgO%WxgX=uOj<2iZVSLGba z6oRb-iiqbJ5~+f7&z<4XspNP51gBXrny4C% zc*P0YJ9kJ${PnQBHpgfC)9pX`jb0|A8Kb|QzlC2{TwJMMv+-cKfFCj6*AGMiMRgd{)b4mQ^3MUM=FMaY*2%Qd0 zoaw;DEj3D@6K&k8vRGO|ec=w2b;re$;!T)2 zqmCzA02?k8y+{5Ve_`;z244I@6-;$^@!qu~c2 zJ}o_6dn7(CP8JRj3PVb2C7B))TPRbNz_;Fyv%9WjjQxpwKe- zZjK-tj2ux>SY-|t=s@Rj7%qvu5lm_s(x@_z?TRboTDJ(YH&r;%G7P$8yu`#hnRvTp zAZxB%7KMY4;k!5B0K_UbGD?8OeX!K{9yt2sS5H2cmj}nk6M=4a_519X|CzHM27sr{ zsNPe#&=K)K{rz*b>1^NdQ*EuCs4VN96s0u9qnc^p%}#w>qx~L>h$i7z)J&nX>T*ta zM|FEI^9rd$2iO**$Hkp<7Z>05WRRAA`2hCo(eCfTy2lRb>*D|CsR@`myjUtBo$)Df zS)jDW6~s*%P;ocN@GGYSzbMZfX&2H5ejl$F8YrTe`D5_Wl{CTi`(r2ize{}>{b?jY zp6+Cuj$MADq$DgrHZ3hKhF{t#O!hGQ-^@McZC-(4w{Th-{XQPf;geC{!%h=Ty*GTT zSvI!AqS(v%t)rodu!{7p{MAY6_kl-PhsO@vHtz1O=){Cv7fkf;)jSN+lv8-IBqb#e zp^G3AemXS+q7`t7aN_X$$15R#VkBwdDCN%H47m@O!&^7_IAxFfZ#wiw;j0qXCLG=lh z&c4ed1qQpvlz1!Z8ZU$&?u1~>S<%!U1ZoG~0Ae~^Z*xi_;&SjCD1niR%A>V*;NaJ* 
z^I(~qn**Jl&mTfDw(v(GtIbeO5Z6rL`H_uC&^a|UWuyT>Gc#VZq{O(W0jhjf<&*yqXk!f&?+9KS-kXWSK@PDk>pgx(}u0Vmim*LIkk?JY_S`$F&`1 zra3>q?EU)&O(DXz~*Ym|@lRgP`enpP$}A0x+MngCim$R4mvW zQU%ed1S7>K#!x4Kn(hJ<-wNv=9v;5pc93I3Nhx8K0|Ak{m>r#kre%Qv71vfriEO`P zA6}d^-Dl;f*Nci=@JLEUGI1+Ix1e_E4kA`F=sygstcvS`;3ky@9~v=WSYT3GT3gWo z(f-SW3H9`I0aOC(M)dEURQCtD8uAaex>ynVl6+yaIix4CkB+vf$zEG<%3F&2@F2i= zPe$gm*bmV4J(E6)Ki>8luyd7NR8@%+{&m(BJLhpwI~u?ELcSxWaS0fMz~aPx%0rT1|I-8)__v$d2tKUZXt>%h&$EN zQgiMQ(xr+GjwXeL*2z5Y$Y9g+g*5v9lKWtPG1E;_veu+zTg1goaiWD(SM8y5h(>*P zV`T4_mvVKrklde-53ZvuC@Jpni~qZN`?BHJgP%_#BZt9U0hD@2y!bireVPbS1i1>t z_*yQU3P!ciu&}G&{>!}Z6me#Q^k$J5LSV1Y2KqFdVoUEi%=; zYv;X#g9sQoU$N_>qYz#U40BNsYs1mZQ)*4W=e2e8I}-_5-a7uZck3qFH4(iAPD<2L z|J8_3WR%yJn0kxeo)62xg-`epAtqJ`{(%4N7D8Er*0{p<5^w#;9RPSow$iV^e}2`$ zZA=AFa947?KY>4E>$g=~Sy%q5_# zAXeL^_5w9fY@*ReO0o9WNb)n=1#VlUn>4LJ$3JV{|LfC4S{C{)8<+@yp-i$T(Bl{qP9D$!?@t2 zhp3jCd&!*y*&GcPutu0eLa@3gzBf*qUJ@D<2^AGS>|kz+PkcglvaDFIIQs&c-1GI` zk|2x6dO2W;sqv}}Bt0Oi)(%G9fovK4fN=Gjpaa)?VZ=~iT%6@M03%~I%xre*-7;Y) zzO8;l-~4t&P0T8BHnCX;MvJ}kI&&x1j7GnZ2%^qRzXS5-1qNQ}ugY3R$GysM@F4s1 z<0DuP7;fH_RFCTAdd9Tg+mG$JP8w5rI-2;w9t#s2Jq#OdWaKz1zE>!aPvH&g>L{Lj zq9;!1j($}N-(L#+guLWbdCg@tvv`^;T_#BU+TN)`|W7}EF`75MMZ0-a#x0OE8MN+gq=zn(T>@e_3@S4g7m%G z;NgFEjpzP4FB@ACZ|p

d_7*2>qXO)q5X%DR0Q)4ebQi-R}&>+5*hiF25l@RuX$zmJKxU0O+++dK}!@eb4paJy!^nUCZXxtxnYR1b#yXM;$X3yg?J zh_@UNJ+Pc$zz>DE#)s81(`Fig(NB|-u7V4L8=U-BU^Vas(*X{+Gl(ID)(S!(8j4Er zk(z3K`(K|C(=`fWTUynQ0PO&w zi$STvfao65M8KF2L7GcB8g@~~Iqa}1lkwuwSl3a9Cm1R!$f8uo*D8F&yzyrsD-3** zOz;#7i~)&r4!_ra0Pg4#&h~*fP|?wXpQoi6Wv^FNRz3ms3LgY&nNqey+_t8G(3wB1 zICCXpopSGFLtTzNqAokTM1QB%;+I6RV#WcoC$y-jh!|W_ zwyG*B5GXzpu#zFpp^f-_pNh6NaO^uK#Viob(kuDU4G&<}g zVuNbiEL*?rxo|Zw?`A=oxeX-ctLqwtT1a{mB>`S&-EmdPfcGm7dDWY(ZeNvq`2#k) zziRa>2syu6cERpbo09uNCbgou#I(fpxVEtTe0V|NT}i{s*D7UqsQ9c2Adnm5H61_! z`JIsb{Co?24-bAO)r@D5x;C3_3$G(+U+(CLl#&TN6R7DMH%MEyJoad5yYHMul4KA= zE@70`^o}{Lif?PwGMUJN1> z5`n3#s)83T5P+Y*vkvkC$>KpxLp4u*9Di0~!MZ7a0S&JLg5{6K$|ZSTViGs|h`28i zAYmpz9x^9LeiqXC9%x4(b|SejrS!X3k#JfyXjA4;r?3P1Q0|&NYvWkma=wrR@;)KY z-U+RZs_jt&LiwKC0uIxA_5ScrC50#^^WZwtkFXR##|OTxgw z$!~M2r8fyO?8h;&@`iJBZsIdZUSNI%`>}5QBbaSb!JyeO+`TZKM}r-ToD}c}l-JaJ z1_qZ91!2#y-nu{I3lQHxfiwAK1H`an5I+jo8$Y?uV>dK5qM>O0x6txb(xagfG2d!| zv(pBFDL@a})jjieuuFP*0s;cety|oS_=K)z(lJkaydit9?$bWWXyG&@o-X(4|H#L` zbJ=I-Hb-|k^L0v%!QWc1nd=kvS;0u6=cOjus;YK~tcQUDfgCC+L<@lY z8-S~9AjK3vzcQ`L<)k4aBZJSSIQCnia@X93X&>xJ=aY2;&ZGAiiQE$-YZWd$Owtq> zNingoAZURDvaY;}iYy=y^(gmEbX11;rKPWEBPCxP`FPMmLxW{vP=ZnQU;^*4=0A^v11T%u~eM4zpIMRf?pw` zw)PIn^{^WPC*=>nkOL)o&-pIr$m)g@YwkQM=t*UtvhoU9_D>W-+(pp(kxsH>lc^^lcuOPCuM2$X#dcLKbXAosTqs5Rz4D<2~9CGfIxyUt02^^(fD>4*uW7c>eAisa;% zD>DSKJVJIGtr)JaWKm!sl#Ly77Lm>|{HlDM|9zR$=+j%zk1rcw;*10ye1(@F49@V@ zh@th^hcD3N<_-;rh-S9T%?_MeS|XZB6D}j^E#&PGNIdoI_%T8+A@(PTvLKAU86XYC z)rcog5N}2S1k#XnG!!AoWNx8>_r9ch3JMSMx*()Bg4=<0>yU|w31UK5peL4tabCs` zm|t}W^TTWpJs2MbJDvIf@DlB>{lowYAHi7wyJX>~T*2N9y@0vvoC+p{z7jpOg@s7* zOW5dwg1&?ik-aGQ#K0Ag`_JJO1N2;V?vR1>8#M8;w8rkXVHDsa<95#jCj{RhNs=5G z*NHJD-#w;+_m4oOcWBszw;CWRKh|}h_)&NxM{ImE68$u3(91o8;(px`!aNd?qgE?i z2Wkgdf$P_nW6P6M`FH1JHUtKBbS%Iq-xULZ&pj~>HWIAW>}-2PcgJaWb5|Pco#g_XKumj?(MGZ_#*u*%eFNR( z@?`|N$dh%wNnHRS`@!kg_2$zZd~i4AcpibCQW11bfpMBuNtb#K`%(0yCHk@O)v7 z%Lb#hg(71g2_s|3f&w>1UGW0w=`GEQYZX-TN7Ej!jgcTJUr3=ACnw3!Cop%VzDZ7= 
zL0&5ceCvbi3t(U&Kp;`E`N3gy4&omWl-MPg5IS#y7Ym^8xXY8e!JFHS6;)nr=+*}l%&%hzHJr^5k$4gU3w&E;R99bRn4Pco4VU`_0y!$F5} zTnWE6Gg8oW0*r@?ts?i=-f8V(|aH1mWn#tq0|holV*YO|3QWN|g`Lb}zjrb|TNRjE^@| zA!#Oj?;e8fyL)?w9N5PZ6(}G=ZDV2cJE(Ly`T0m-{{O1(+~cWE*Eaqm>A*Ne=pZSl zrI2cr4yuJhC0e8=XDS(rYLszGltU#&Oi9jR5=uoyP76s*R-)08L(~u{rCo@9-D>u` z_h-+%f4%>_{;RYOzxDi{=f1D|y1omBN6o#r@y4?&lOp&Wg?TpTh8F&I4pZlB9rcI( zK1iE44seUf-arIXgQg-20;bc8!Wkb&k+l=2t z{hK?G&%aZV7c1K%-m4QmQd?bJg3uVMj{JDaIOV}owV5| ztH}fm&mQ3?3cP)|%xBV((2O$Hwe}tqvsJj|C`|0UW5*f^A>hx1G1peFyR81-(05zakIW17y!aX1H80jKz5YY)#a7+IyySi zX$Hbj(xST?GdqhKdR{~>4U>^H-}<=g*&AFk0yohXk0SQzbvId*7y_#$w0%D88iq!_B`^*@fTiWL*CY{e$*!S7K+qrfvqC7<*YYaFJu3u_@;jp+! zd*op@O2$J~)d{FE%5Y=1_4P%f>Zf{m$Bs1p{Rkn!xDW#9Ng`TT8j`>pB6Dre=b@qU zCr@Nd&(0HId_Q-_QUV&M0bbt+cQ zzNo6YC(f1{R-p?Q3qlrHs=YWSDfvO8v)UAm7}cY^OYxV(>(wvoFaG7SiENHrw(L$& zsAxg~JNd2sU4m$733r4S&HI?7eekV4jkBqGfaZ);q$Gm0adSIx%9yZsHeB9%1a}S{ zQLg$h(*ZB|*vHqvz*(+FNjJthIcwq0hxRC-3y`a?tg7QWTdJ$Se41~3N9++#XL>?H z)!vSE-1(b6tjM!Cl-jql)7g?Eci>CrJ!i|NgpA3LR(qa}jut|xO(zu8X{hr@Zipw% zMLmsXb$9FqL^!$*p@rS(G+RljoYPQfJO$~zvg)Wg1QbDm?sn&brpm9ACmsx}UH@)Q zX@RGds5~#_>5#g(sEcD-f5oQ3=rfj4dLaXsRL)p-IVQ7kIk2uOq5bFn_`43Nw-l$w z0}{Lisi0j$d$Fk)vamDo!?Kc7QY5ELIf8nh9Q5?Wg4t1O#4>DNcLG-Kx{GYQ;s0(*)E zruu&w*h1nIreSetcqjti%a)R~JP4Hw1xtgsoba#nyf%BPX7%^?m*M!>JJ4;(ebMaQ zVu($j{(zxtjGoGdADdaLy{>-Bep_-F-Jgq>wNe&C(wnNXH#*z}9{eRZ{n~I#6a5hF z{ow;M^@%Nw(yAUs-xwnq76MJi-}btNcWb`WhCM#X2em+I&CKB=;9KB=0;;h zPfyRLG!q$|NCoSS&R095XD!@$@8DzCWJgC2*7q;d%esbF?!@5Z)64UF-Xe0(+EEi8 z8d`!*z#PKd{_gro^r@|T_`9jW_^mg^K6Pufe)3#(=Gr7=M{I5j!WfRZe`F4WH^v2F zqh3?vzMBHo8>miJO9(ATA{KqfLM$*(%&2DQ?O*5G3=LKK;LIEp(Z~u~Hf@0|84}I) z`=T*d#x6SVCi__6GVcnYH}vjd?B7;lt|J;)71n?Dod?xPj7E3V` zp-!3f=H=xDrKF@Vs{n)v=B*?zZI9FK+qXr|rJe~IAcs9#S} zF(;ZoH;S35HxWjMS#fdoJntn2l_7N0uA|U>y7lb*lIkeo*kR_~N-M;Jqf@_sN$f|y@+u{zYqz@6nuo!XgpOk^fDJXbz$PexRa2ySmZW4S<``Es zp_5Sx`NfNuD*hVkX8wVn_<^VG%mMfmV_=oDOnRM`o?eET8Y*BW@xz1Ec;9m$gRto( z;o>PDj}8r8RK`yYF3fa3$eyC4voca4tlY4F+S047zg!hP1!E4=in+doP*TY;Uu)xk 
zDKSIgk&#-rOUO7dw)T|E5g0#iIwEozn#Q%vJL6LcPp1px$#?0Qq53VsT-AzdB ziK6|V=j6eXr;D__{(Jd(>uiHm_iqD1y!~~*qI`A$c>?E)Kik+)N@%QA%g+xkEG#T8pPlR# zUKke6zE~Lc54@`EYd3FFu!6>@uo0K>`7@|baFB^uuR^W>1Xb)E%lh*2XYaWPRyF#! zxtQ_e6Wx2@z!UF-2Aqcrbj|%g4{eqZDte`Y1(fd8Fjk6~S zE!Yf?OUh%;fM`Ec0~fr7ev8J7gAX^*JHCW>d_w0iWssIFn-1oyk^J4+ju)k(lI%T{ zO0b64jHWkbZ(F<{$l2=UIJY`u&1L@=Ccp@=MuhtzS}O#p)nM4wp{3e> z*T3la995;{{)~b{U0{dE>FrnB7{BB<>g^NsyC`mI3b|8FLa34*`I3YJ^Qfv*n0( z2idt&R6b9xi~H{#`)d%ovE2+)RChNk*prBP}M zt^nBX?l18|!y;s~EQZhpz>oxEr(iX$2Vkt|XK!q8nawHypuyK@;!Z8n-GIAI1L%Uk z;sWC1MH#C5F}2EbI%|>!WHj5t;&kcy#!NHxaB#5@W5eXxC6v^Hiq99-OT^68>Wn>m zRu~^KqH(eXV*Ad#$<@k_^vfcTrcT8j=X~x~B(os0wRUu**1zfK2!@K5)vThaxv_T; zed_K;yFal3w%|TV8Ertc04Nv@PWCp-7KaQqW80cN(BQCjP#RNY`>{e`QF3=J)RK4i zw3cRL->FTq5BQK=r(T#KJI(>S|>pRD!CQ$kjZ5{F3C< zsa7frwglgeNPjBZ^v#7P?-*br#J+GQZftwV5M0pY_U&5=YNlXE8v79r#I{R6Q3Cda z62Xr%V;vuJn0BWBApZ=^JpCMH=xPXaE5IE8F!QXrdiTKGiGmnz5&|4!>l8S)LC-zu zAGBD|aNrg7JGR#Vmf@M@8rkE*lD&suJs1R%;|bUhi*2gV?IB*#5@l_ogi^JhNV93f#ycC;(VZ;NqzRyfPWp#v^ucrD5|Z;fIJA{MdAP z=W4)4!R!K4N@%r&T_g(VGBnrHuOWN08Aa?-T^hBMBQe%A{vj@w#^ghyOLgDX%EuI9 z*jmEnj)&MHx6*eB8JYS{)to@WV2-Ay7^>+l`Igz+WU%?uEXv8bvKO~BynO~hXc0{t z9Yxo&xhV+Sh%y0!;?=5Bjwqf}`BOezGv~`~!9Eb7c6K}Q7Aat}$My;ka=KI!0X)n6Es1qsP z5g{Qh9ZaJq!d?QjBi#%89F$UmP{%a9a*GzFvPxSk24txRa%>OG9()EcxHee3HU;Z< zP%LeG#^y_6SQp61WbQIGHZCR0Hg>cXMppjIf%gNI*Z09x_!1X%HjgU?8|1wCgapji}n=yDu!~kPZ zq$yCQ;UXHSs-W>AZ;|vX2N9N1ZHwKe;*^`9udlzt$h|;t+_*fyp`Ym64+w95{7DX? 
z>5yarq_w2t0EaBCG9ap`oy86=jEbXS-v=3yeVa954|1^Ot$eA{tCPj&r0-)}ZNf#C zU^13N0Zi+ARKthkDFmSD$@oGI@?MbcM*QnRvHKa)13stkIhTR!&O#SD2`A7R>@mTR zNxO7+jkB^20Agnn97fVe+6uu2R@&TbLu@@*vp>wdQEJf`%LGHJRc|mhGn0ioVjkyL zs|_eXBnb@NhFX45C3Va{A+T!IgUtHs)7ZCzjIPZhu9w%xa%03&H zStuW1Z8E<-3QHw?>x%Hq)#1xbc0lH#xgo|nY@C4TbB;hlvIos&or#IX?Hp9#bOaK+ z3d{i9F(Jo~AD0?=iL)s*E;e+3eQo{>nDSTN#z2z*WCSG7R)Ntv^3nNi-=0X9F$C6TE}H z?5th_NEPZ*iVV64M_gtm5O80$CV=`+_VoNn+$j7Tj80hjiC+)rUm!Kix(+8(!7`wY=|=M z0i$1ZnT!>-u1;9OU+7wjqi57%P-r8V8l*6**f+po_J-fWoWrX>+#=P+uMWij^;qZ zMJGXNNuaSMcF)$+kntx@z%4X3oYA3K*|K;(4*4!8g|Vlz zk{_RH(}xFtfk}%+IviIpKBYa^$5V*?`4lCUk+Z~MGvF3&FCOkU1>xKgzXX=@bZ`fb zVFge@NBtD`_~>*E1=zyS6(6N!8@|heG!JqFY88JHBqP89UvwL6q&5*Lrti@q*A=$z zU5HPkOttI&GDR}Vfj-Rnbm42!UBa+n2%<5pVMJbw*AGxY5orjsSnwll2D{ s>{y-qx1z(?@BKgcR<8flO-3hJ`-@C{F-=Vg-+RUw8*VhXvc^8>pAVFp_W%F@ literal 0 HcmV?d00001 From 9084b4b7573bfd1ccfed210ae45d962332f0be27 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Mon, 15 Apr 2024 00:12:31 -0400 Subject: [PATCH 09/29] add plot notebooks --- .../fedpft/docs/viz_and_plot_results.ipynb | 88 ++++++------------- 1 file changed, 25 insertions(+), 63 deletions(-) diff --git a/baselines/fedpft/docs/viz_and_plot_results.ipynb b/baselines/fedpft/docs/viz_and_plot_results.ipynb index 866ffb5d8c7..68077f7b59c 100644 --- a/baselines/fedpft/docs/viz_and_plot_results.ipynb +++ b/baselines/fedpft/docs/viz_and_plot_results.ipynb @@ -2,22 +2,10 @@ "cells": [ { "cell_type": "code", - "execution_count": 2, + "execution_count": 16, "id": "5e0cf2a9-b782-48de-ac45-128726a26e64", "metadata": {}, - "outputs": [ - { - "ename": "ModuleNotFoundError", - "evalue": "No module named 'matplotlib'", - "output_type": "error", - "traceback": [ - "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[1;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", - "Cell \u001b[1;32mIn[2], line 7\u001b[0m\n\u001b[0;32m 4\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m 
\u001b[38;5;21;01mos\u001b[39;00m\n\u001b[0;32m 6\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mnumpy\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mnp\u001b[39;00m\n\u001b[1;32m----> 7\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mmatplotlib\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mpyplot\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mplt\u001b[39;00m\n", - "\u001b[1;31mModuleNotFoundError\u001b[0m: No module named 'matplotlib'" - ] - } - ], + "outputs": [], "source": [ "import pickle\n", "import yaml\n", @@ -30,7 +18,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 17, "id": "7ea3e149-ce6f-4ba0-aa41-e0501a04efe3", "metadata": {}, "outputs": [], @@ -52,7 +40,7 @@ }, { "cell_type": "code", - "execution_count": 32, + "execution_count": 18, "id": "4b010856-0d99-4d81-8fb0-7a927f10eeaf", "metadata": {}, "outputs": [], @@ -61,13 +49,13 @@ "path_fedpft_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n", "path_fedpft_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-44-20')\n", "\n", - "path_fedavg_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','18-16-41')\n", - "path_fedavg_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n" + "path_fedavg_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','23-24-25')\n", + "path_fedavg_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','22-32-11')\n" ] }, { "cell_type": "code", - "execution_count": 28, + "execution_count": 19, "id": "2e3e165c-1ce6-4efa-a4e1-1372586e436e", "metadata": {}, "outputs": [], @@ -84,7 +72,7 @@ }, { "cell_type": "code", - "execution_count": 33, + "execution_count": 20, "id": "77b70c73", "metadata": {}, "outputs": [], @@ -97,49 +85,13 @@ }, { "cell_type": "code", - "execution_count": 2, - 
"id": "6f4c87ad", - "metadata": {}, - "outputs": [], - "source": [ - "fedavg_cifar = [(1, 0.06924765515865097),\n", - " (2, 0.1315106765116743),\n", - " (3, 0.16773099181800039),\n", - " (4, 0.1946717222111355),\n", - " (5, 0.2171223308720814),\n", - " (6, 0.2375773298742766),\n", - " (7, 0.2597285970864099),\n", - " (8, 0.276092596288166),\n", - " (9, 0.290560766314109),\n", - " (10, 0.3036320095789264),\n", - " (11, 0.3128118140091798),\n", - " (12, 0.3261823987228098),\n", - " (13, 0.33745759329475156),\n", - " (14, 0.3477349830373179),\n", - " (15, 0.35831171422869684),\n", - " (16, 0.36679305527838757),\n", - " (17, 0.37407703053282776),\n", - " (18, 0.3817601277190182),\n", - " (19, 0.38824585910995807),\n", - " (20, 0.3942326880862103)]" - ] - }, - { - "cell_type": "code", - "execution_count": 59, + "execution_count": 21, "id": "e1a678de", "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "No artists with labels found to put in legend. Note that artists whose label start with an underscore are ignored when legend() is called with no argument.\n" - ] - }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "

" ] @@ -149,13 +101,23 @@ } ], "source": [ + "color1 = 'blue'\n", + "color2 = 'red'\n", + "\n", "def viz():\n", " fig, axs = plt.subplots(figsize=(10, 2), nrows=1, ncols=2)\n", " \n", - " # cifar100 - fedavg\n", - " axs[0].plot([r for r, _ in fedavg_cifar], [a for _, a in fedavg_cifar], label='FedAvg', linewidth=2.0)\n", - " \n", + " # cifar100\n", + " axs[0].plot([r for r, _ in fedavg_cifar], [a for _, a in fedavg_cifar], label='FedAvg', color=color1, linewidth=2.0)\n", + " axs[0].scatter([r for r, _ in fedpft_cifar], [a for _, a in fedpft_cifar], label='FedPFT', color=color2, marker='x', s=100)\n", " axs[0].set_title('CIFAR100 - ResNet50')\n", + " axs[0].set_ylim(0, 0.7)\n", + " \n", + " # caltech101\n", + " axs[1].plot([r for r, _ in fedavg_caltech], [a for _, a in fedavg_caltech], label='FedAvg', color=color1, linewidth=2.0)\n", + " axs[1].scatter([r for r, _ in fedpft_caltech], [a for _, a in fedpft_caltech], label='FedPFT', color=color2, marker='x', s=100)\n", + " axs[1].set_title('Caltech101 - Clip/ViT-B')\n", + " axs[1].set_ylim(0.2, 1)\n", " \n", " for ax in axs:\n", " ax.set_xticks([1, 5, 10 , 15, 20])\n", @@ -171,12 +133,12 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 22, "id": "92460065", "metadata": {}, "outputs": [], "source": [ - "saveFig(\"FedProx_mnist.png\", f)" + "saveFig(\"FedPft.png\", f)" ] } ], From ddd0f08213746d58d3a08816baf2c560283afe66 Mon Sep 17 00:00:00 2001 From: mahdi Date: Mon, 15 Apr 2024 15:08:56 +0000 Subject: [PATCH 10/29] remove empty line --- baselines/fedpft/fedpft/models.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py index 7ebc9beed4a..b4594cb986a 100644 --- a/baselines/fedpft/fedpft/models.py +++ b/baselines/fedpft/fedpft/models.py @@ -103,7 +103,7 @@ def extract_features( 2D array containing labels of `features`. 
""" feature_extractor.to(device) - + features, labels = [], [] for dict in dataloader: batch_samples = dict["img"].to(device) @@ -164,7 +164,7 @@ def test( total += samples.shape[0] running_loss = nn.CrossEntropyLoss()(output, labels) loss += running_loss - + return loss.cpu().item(), correct / total From 6996b816564a5378205a234a2558dbaca18deee0 Mon Sep 17 00:00:00 2001 From: mahdi Date: Mon, 15 Apr 2024 15:12:52 +0000 Subject: [PATCH 11/29] removed extended_readme --- baselines/fedpft/EXTENDED_README.md | 123 ---------------------------- 1 file changed, 123 deletions(-) delete mode 100644 baselines/fedpft/EXTENDED_README.md diff --git a/baselines/fedpft/EXTENDED_README.md b/baselines/fedpft/EXTENDED_README.md deleted file mode 100644 index 9c8f5bc72fa..00000000000 --- a/baselines/fedpft/EXTENDED_README.md +++ /dev/null @@ -1,123 +0,0 @@ - -# Extended Readme - -> The baselines are expected to run in a machine running Ubuntu 22.04 - -While `README.md` should include information about the baseline you implement and how to run it, this _extended_ readme provides info on what's the expected directory structure for a new baseline and more generally the instructions to follow before your baseline can be merged into the Flower repository. Please follow closely these instructions. It is likely that you have already completed steps 1-2. - -1. Fork the Flower repository and clone it. -2. Navigate to the `baselines/` directory and from there run: - ```bash - # This will create a new directory with the same structure as this `baseline_template` directory. - ./dev/create-baseline.sh - ``` -3. All your code and configs should go into a sub-directory with the same name as the name of your baseline. - * The sub-directory contains a series of Python scripts that you can edit. Please stick to these files and consult with us if you need additional ones. - * There is also a basic config structure in `/conf` ready be parsed by [Hydra](https://hydra.cc/) when executing your `main.py`. 
-4. Therefore, the directory structure in your baseline should look like: - ```bash - baselines/ - ├── README.md # describes your baseline and everything needed to use it - ├── EXTENDED_README.md # to remove before creating your PR - ├── pyproject.toml # details your Python environment - └── - ├── *.py # several .py files including main.py and __init__.py - └── conf - └── *.yaml # one or more Hydra config files - - ``` -> :warning: Make sure the variable `name` in `pyproject.toml` is set to the name of the sub-directory containing all your code. - -5. Add your dependencies to the `pyproject.toml` (see below a few examples on how to do it). Read more about Poetry below in this `EXTENDED_README.md`. -6. Regularly check that your coding style and the documentation you add follow good coding practices. To test whether your code meets the requirements, please run the following: - ```bash - # After activating your environment and from your baseline's directory - cd .. # to go to the top-level directory of all baselines - ./dev/test-baseline.sh - ./dev/test-baseline-structure.sh - ``` - Both `test-baseline.sh` and `test-baseline-structure.sh` will also be automatically run when you create a PR, and both tests need to pass for the baseline to be merged. - To automatically solve some formatting issues and apply easy fixes, please run the formatting script: - ```bash - # After activating your environment and from your baseline's directory - cd .. # to go to the top-level directory of all baselines - ./dev/format-baseline.sh - ``` -7. Ensure that the Python environment for your baseline can be created without errors by simply running `poetry install` and that this is properly described later when you complete the `Environment Setup` section in `README.md`. This is specially important if your environment requires additional steps after doing `poetry install`. -8. Ensure that your baseline runs with default arguments by running `poetry run python -m .main`. 
Then, describe this and other forms of running your code in the `Running the Experiments` section in `README.md`. -9. Once your code is ready and you have checked: - * that following the instructions in your `README.md` the Python environment can be created correctly - - * that running the code following your instructions can reproduce the experiments in the paper - - , then you just need to create a Pull Request (PR) to kickstart the process of merging your baseline into the Flower repository. - -> Once you are happy to merge your baseline contribution, please delete this `EXTENDED_README.md` file. - - -## About Poetry - -We use Poetry to manage the Python environment for each individual baseline. You can follow the instructions [here](https://python-poetry.org/docs/) to install Poetry in your machine. - - -### Specifying a Python Version (optional) -By default, Poetry will use the Python version in your system. In some settings, you might want to specify a particular version of Python to use inside your Poetry environment. You can do so with [`pyenv`](https://github.com/pyenv/pyenv). Check the documentation for the different ways of installing `pyenv`, but one easy way is using the [automatic installer](https://github.com/pyenv/pyenv-installer): -```bash -curl https://pyenv.run | bash # then, don't forget links to your .bashrc/.zshrc -``` - -You can then install any Python version with `pyenv install ` (e.g. `pyenv install 3.9.17`). Then, in order to use that version for your baseline, you'd do the following: - -```bash -# cd to your baseline directory (i.e. 
where the `pyproject.toml` is) -pyenv local - -# set that version for poetry -poetry env use - -# then you can install your Poetry environment (see the next setp) -``` - -### Installing Your Environment -With the Poetry tool already installed, you can create an environment for this baseline with commands: -```bash -# run this from the same directory as the `pyproject.toml` file is -poetry install -``` - -This will create a basic Python environment with just Flower and additional packages, including those needed for simulation. Next, you should add the dependencies for your code. It is **critical** that you fix the version of the packages you use using a `=` not a `=^`. You can do so via [`poetry add`](https://python-poetry.org/docs/cli/#add). Below are some examples: - -```bash -# For instance, if you want to install tqdm -poetry add tqdm==4.65.0 - -# If you already have a requirements.txt, you can add all those packages (but ensure you have fixed the version) in one go as follows: -poetry add $( cat requirements.txt ) -``` -With each `poetry add` command, the `pyproject.toml` gets automatically updated so you don't need to keep that `requirements.txt` as part of this baseline. - - -More critically however, is adding your ML framework of choice to the list of dependencies. For some frameworks you might be able to do so with the `poetry add` command. Check [the Poetry documentation](https://python-poetry.org/docs/cli/#add) for how to add packages in various ways. For instance, let's say you want to use PyTorch: - -```bash -# with plain `pip` you'd run a command such as: -pip install torch==1.13.1+cu117 torchvision==0.14.1+cu117 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu117 - -# to add the same 3 dependencies to your Poetry environment you'd need to add the URL to the wheel that the above pip command auto-resolves for you. -# You can find those wheels in `https://download.pytorch.org/whl/cu117`. 
Copy the link and paste it after the `poetry add` command. -# For instance to add `torch==1.13.1+cu117` and a x86 Linux system with Python3.8 you'd: -poetry add https://download.pytorch.org/whl/cu117/torch-1.13.1%2Bcu117-cp38-cp38-linux_x86_64.whl -# you'll need to repeat this for both `torchvision` and `torchaudio` -``` -The above is just an example of how you can add these dependencies. Please refer to the Poetry documentation to extra reference. - -If all attempts fail, you can still install packages via standard `pip`. You'd first need to source/activate your Poetry environment. -```bash -# first ensure you have created your environment -# and installed the base packages provided in the template -poetry install - -# then activate it -poetry shell -``` -Now you are inside your environment (pretty much as when you use `virtualenv` or `conda`) so you can install further packages with `pip`. Please note that, unlike with `poetry add`, these extra requirements won't be captured by `pyproject.toml`. Therefore, please ensure that you provide all instructions needed to: (1) create the base environment with Poetry and (2) install any additional dependencies via `pip` when you complete your `README.md`. 
\ No newline at end of file From 3ecf50c7d38d3b1bb50499dae33ef169bb89276e Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 12:45:18 -0400 Subject: [PATCH 12/29] add FedPFT baseline --- baselines/fedpft/.gitignore | 3 + baselines/fedpft/EXTENDED_README.md | 123 ++++++++++ baselines/fedpft/LICENSE | 202 ++++++++++++++++ baselines/fedpft/README.md | 109 +++++++++ baselines/fedpft/fedpft/__init__.py | 1 + baselines/fedpft/fedpft/client.py | 170 ++++++++++++++ baselines/fedpft/fedpft/conf/base.yaml | 15 ++ .../fedpft/fedpft/conf/client/fedavg.yaml | 2 + .../fedpft/fedpft/conf/client/fedpft.yaml | 2 + .../fedpft/fedpft/conf/dataset/CIFAR100.yaml | 10 + .../fedpft/conf/dataset/Caltech101.yaml | 10 + baselines/fedpft/fedpft/conf/model/clip.yaml | 9 + .../fedpft/fedpft/conf/model/resnet50.yaml | 8 + .../fedpft/fedpft/conf/strategy/fedavg.yaml | 12 + .../fedpft/fedpft/conf/strategy/fedpft.yaml | 22 ++ baselines/fedpft/fedpft/dataset.py | 108 +++++++++ .../fedpft/fedpft/dataset_preparation.py | 1 + baselines/fedpft/fedpft/main.py | 88 +++++++ baselines/fedpft/fedpft/models.py | 221 ++++++++++++++++++ baselines/fedpft/fedpft/server.py | 94 ++++++++ baselines/fedpft/fedpft/strategy.py | 145 ++++++++++++ baselines/fedpft/fedpft/utils.py | 102 ++++++++ baselines/fedpft/pyproject.toml | 143 ++++++++++++ 23 files changed, 1600 insertions(+) create mode 100644 baselines/fedpft/.gitignore create mode 100644 baselines/fedpft/EXTENDED_README.md create mode 100644 baselines/fedpft/LICENSE create mode 100644 baselines/fedpft/README.md create mode 100644 baselines/fedpft/fedpft/__init__.py create mode 100644 baselines/fedpft/fedpft/client.py create mode 100644 baselines/fedpft/fedpft/conf/base.yaml create mode 100644 baselines/fedpft/fedpft/conf/client/fedavg.yaml create mode 100644 baselines/fedpft/fedpft/conf/client/fedpft.yaml create mode 100644 baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml create mode 100644 baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml create 
mode 100644 baselines/fedpft/fedpft/conf/model/clip.yaml create mode 100644 baselines/fedpft/fedpft/conf/model/resnet50.yaml create mode 100644 baselines/fedpft/fedpft/conf/strategy/fedavg.yaml create mode 100644 baselines/fedpft/fedpft/conf/strategy/fedpft.yaml create mode 100644 baselines/fedpft/fedpft/dataset.py create mode 100644 baselines/fedpft/fedpft/dataset_preparation.py create mode 100644 baselines/fedpft/fedpft/main.py create mode 100644 baselines/fedpft/fedpft/models.py create mode 100644 baselines/fedpft/fedpft/server.py create mode 100644 baselines/fedpft/fedpft/strategy.py create mode 100644 baselines/fedpft/fedpft/utils.py create mode 100644 baselines/fedpft/pyproject.toml diff --git a/baselines/fedpft/.gitignore b/baselines/fedpft/.gitignore new file mode 100644 index 00000000000..4ab8207aedb --- /dev/null +++ b/baselines/fedpft/.gitignore @@ -0,0 +1,3 @@ +outputs/ +multirun/ +.ruff_cache/ \ No newline at end of file diff --git a/baselines/fedpft/EXTENDED_README.md b/baselines/fedpft/EXTENDED_README.md new file mode 100644 index 00000000000..9c8f5bc72fa --- /dev/null +++ b/baselines/fedpft/EXTENDED_README.md @@ -0,0 +1,123 @@ + +# Extended Readme + +> The baselines are expected to run in a machine running Ubuntu 22.04 + +While `README.md` should include information about the baseline you implement and how to run it, this _extended_ readme provides info on what's the expected directory structure for a new baseline and more generally the instructions to follow before your baseline can be merged into the Flower repository. Please follow closely these instructions. It is likely that you have already completed steps 1-2. + +1. Fork the Flower repository and clone it. +2. Navigate to the `baselines/` directory and from there run: + ```bash + # This will create a new directory with the same structure as this `baseline_template` directory. + ./dev/create-baseline.sh + ``` +3. 
All your code and configs should go into a sub-directory with the same name as the name of your baseline. + * The sub-directory contains a series of Python scripts that you can edit. Please stick to these files and consult with us if you need additional ones. + * There is also a basic config structure in `<baseline-name>/conf` ready to be parsed by [Hydra](https://hydra.cc/) when executing your `main.py`. +4. Therefore, the directory structure in your baseline should look like: + ```bash + baselines/<baseline-name> + ├── README.md # describes your baseline and everything needed to use it + ├── EXTENDED_README.md # to remove before creating your PR + ├── pyproject.toml # details your Python environment + └── <baseline-name> + ├── *.py # several .py files including main.py and __init__.py + └── conf + └── *.yaml # one or more Hydra config files + + ``` +> :warning: Make sure the variable `name` in `pyproject.toml` is set to the name of the sub-directory containing all your code. + +5. Add your dependencies to the `pyproject.toml` (see below a few examples on how to do it). Read more about Poetry below in this `EXTENDED_README.md`. +6. Regularly check that your coding style and the documentation you add follow good coding practices. To test whether your code meets the requirements, please run the following: + ```bash + # After activating your environment and from your baseline's directory + cd .. # to go to the top-level directory of all baselines + ./dev/test-baseline.sh <baseline-name> + ./dev/test-baseline-structure.sh <baseline-name> + ``` + Both `test-baseline.sh` and `test-baseline-structure.sh` will also be automatically run when you create a PR, and both tests need to pass for the baseline to be merged. + To automatically solve some formatting issues and apply easy fixes, please run the formatting script: + ```bash + # After activating your environment and from your baseline's directory + cd .. # to go to the top-level directory of all baselines + ./dev/format-baseline.sh <baseline-name> + ``` +7.
Ensure that the Python environment for your baseline can be created without errors by simply running `poetry install` and that this is properly described later when you complete the `Environment Setup` section in `README.md`. This is especially important if your environment requires additional steps after doing `poetry install`. +8. Ensure that your baseline runs with default arguments by running `poetry run python -m <baseline-name>.main`. Then, describe this and other forms of running your code in the `Running the Experiments` section in `README.md`. +9. Once your code is ready and you have checked: + * that following the instructions in your `README.md` the Python environment can be created correctly + + * that running the code following your instructions can reproduce the experiments in the paper + + , then you just need to create a Pull Request (PR) to kickstart the process of merging your baseline into the Flower repository. + +> Once you are happy to merge your baseline contribution, please delete this `EXTENDED_README.md` file. + + +## About Poetry + +We use Poetry to manage the Python environment for each individual baseline. You can follow the instructions [here](https://python-poetry.org/docs/) to install Poetry on your machine. + + +### Specifying a Python Version (optional) +By default, Poetry will use the Python version in your system. In some settings, you might want to specify a particular version of Python to use inside your Poetry environment. You can do so with [`pyenv`](https://github.com/pyenv/pyenv). Check the documentation for the different ways of installing `pyenv`, but one easy way is using the [automatic installer](https://github.com/pyenv/pyenv-installer): +```bash +curl https://pyenv.run | bash # then, don't forget links to your .bashrc/.zshrc +``` + +You can then install any Python version with `pyenv install <python-version>` (e.g. `pyenv install 3.9.17`).
Then, in order to use that version for your baseline, you'd do the following: + +```bash +# cd to your baseline directory (i.e. where the `pyproject.toml` is) +pyenv local <python-version> + +# set that version for poetry +poetry env use <python-version> + +# then you can install your Poetry environment (see the next step) +``` + +### Installing Your Environment +With the Poetry tool already installed, you can create an environment for this baseline with commands: +```bash +# run this from the same directory as the `pyproject.toml` file is +poetry install +``` + +This will create a basic Python environment with just Flower and additional packages, including those needed for simulation. Next, you should add the dependencies for your code. It is **critical** that you fix the version of the packages you use using a `=` not a `=^`. You can do so via [`poetry add`](https://python-poetry.org/docs/cli/#add). Below are some examples: + +```bash +# For instance, if you want to install tqdm +poetry add tqdm==4.65.0 + +# If you already have a requirements.txt, you can add all those packages (but ensure you have fixed the version) in one go as follows: +poetry add $( cat requirements.txt ) +``` +With each `poetry add` command, the `pyproject.toml` gets automatically updated so you don't need to keep that `requirements.txt` as part of this baseline. + + +More critically however, is adding your ML framework of choice to the list of dependencies. For some frameworks you might be able to do so with the `poetry add` command. Check [the Poetry documentation](https://python-poetry.org/docs/cli/#add) for how to add packages in various ways.
For instance, let's say you want to use PyTorch: + +```bash +# with plain `pip` you'd run a command such as: +pip install torch==1.13.1+cu117 torchvision==0.14.1+cu117 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu117 + +# to add the same 3 dependencies to your Poetry environment you'd need to add the URL to the wheel that the above pip command auto-resolves for you. +# You can find those wheels in `https://download.pytorch.org/whl/cu117`. Copy the link and paste it after the `poetry add` command. +# For instance to add `torch==1.13.1+cu117` and an x86 Linux system with Python3.8 you'd: +poetry add https://download.pytorch.org/whl/cu117/torch-1.13.1%2Bcu117-cp38-cp38-linux_x86_64.whl +# you'll need to repeat this for both `torchvision` and `torchaudio` +``` +The above is just an example of how you can add these dependencies. Please refer to the Poetry documentation for extra reference. + +If all attempts fail, you can still install packages via standard `pip`. You'd first need to source/activate your Poetry environment. +```bash +# first ensure you have created your environment +# and installed the base packages provided in the template +poetry install + +# then activate it +poetry shell +``` +Now you are inside your environment (pretty much as when you use `virtualenv` or `conda`) so you can install further packages with `pip`. Please note that, unlike with `poetry add`, these extra requirements won't be captured by `pyproject.toml`. Therefore, please ensure that you provide all instructions needed to: (1) create the base environment with Poetry and (2) install any additional dependencies via `pip` when you complete your `README.md`.
\ No newline at end of file diff --git a/baselines/fedpft/LICENSE b/baselines/fedpft/LICENSE new file mode 100644 index 00000000000..d6456956733 --- /dev/null +++ b/baselines/fedpft/LICENSE @@ -0,0 +1,202 @@ + + Apache License + Version 2.0, January 2004 + http://www.apache.org/licenses/ + + TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + + 1. Definitions. + + "License" shall mean the terms and conditions for use, reproduction, + and distribution as defined by Sections 1 through 9 of this document. + + "Licensor" shall mean the copyright owner or entity authorized by + the copyright owner that is granting the License. + + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. + + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). 
+ + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. 
Grant of Patent License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative 
Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. 
Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. 
+ + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "[]" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. + + Copyright [yyyy] [name of copyright owner] + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md new file mode 100644 index 00000000000..3f045810835 --- /dev/null +++ b/baselines/fedpft/README.md @@ -0,0 +1,109 @@ +--- +title: Parametric Feature Transfer, One-shot Federated Learning with Foundation Models +url: https://arxiv.org/abs/2402.01862 +labels: [foundation-models, pre-trained, one-shot, one-round] # please add between 4 and 10 single-word (maybe two-words) labels (e.g. system heterogeneity, image classification, asynchronous, weight sharing, cross-silo). Do not use "" +dataset: [CIFAR100, Caltech101] # list of datasets you include in your baseline. 
Do not use "" +--- + +# FedPFT: One-shot Federated Learning with Foundation Models + +> Note: If you use this baseline in your work, please remember to cite the original authors of the paper as well as the Flower paper. + +**Paper:** [arxiv.org/abs/2402.01862](https://arxiv.org/abs/2402.01862) + +**Authors:** Mahdi Beitollahi, Alex Bie, Sobhan Hemati, Leo Maxime Brunswic, Xu Li, Xi Chen, Guojun Zhang. + +**Abstract:** In one-shot federated learning (FL), clients collaboratively train a global model in a single round of communication. Existing approaches for one-shot FL enhance communication efficiency at the expense of diminished accuracy. This paper introduces FedPFT (Federated Learning with Parametric Feature Transfer), a methodology that harnesses the transferability of foundation models to enhance both accuracy and communication efficiency in one-shot FL. The approach involves transferring per-client parametric models (specifically, Gaussian mixtures) of features extracted from foundation models. Subsequently, each parametric model is employed to generate synthetic features for training a classifier head. Experimental results on eight datasets demonstrate that FedPFT enhances the communication-accuracy frontier in both centralized and decentralized FL scenarios, as well as across diverse data-heterogeneity settings such as covariate shift and task shift, with improvements of up to 20.6%. Additionally, FedPFT adheres to the data minimization principle of FL, as clients do not send real features. We demonstrate that sending real features is vulnerable to potent reconstruction attacks. Moreover, we show that FedPFT is amenable to formal privacy guarantees via differential privacy, demonstrating favourable privacy-accuracy tradeoffs. 
+ + +## About this baseline + +**What’s implemented:** The code in this directory replicates the centralized experiments of *Parametric Feature Transfer, One-shot Federated Learning with Foundation Models* (Beitollahi et al., 2024), the paper that proposed the FedPFT algorithm, on the CIFAR100 and Caltech101 datasets. Concretely, it replicates the results in Section 5.2. + +**Datasets:** CIFAR100 and Caltech101 from HuggingFace + +**Hardware Setup:** These experiments were run on a desktop machine with 8 CPU threads and an Nvidia 4070 with 8 GB of RAM. + +**Contributors:** Mahdi Beitollahi + + +## Experimental Setup + +**Task:** Image classification + +**Model:** This baseline uses two pre-trained, frozen models, as shown in Table 1 of the paper: +* ResNet50 pre-trained on ImageNet is used for the CIFAR100 dataset (see `models/resnet50`). +* CLIP ViT-B/32 pre-trained on a web dataset is used for the Caltech101 dataset (see `models/clip_vit`). + +**Dataset:** This baseline includes the CIFAR100 and Caltech101 datasets. By default, each dataset is partitioned into 50 clients following a Dirichlet distribution with $\alpha$=0.1. + +| Dataset | #classes | #partitions | partitioning method | partition settings | +| :------ | :---: | :---: | :---: | :---: | +| CIFAR100 | 100 | 50 | Dirichlet distribution | $\alpha$=0.1 | +| Caltech101 | 101 | 50 | Dirichlet distribution | $\alpha$=0.1 | + +**Training Hyperparameters:** The following table shows the main hyperparameters for this baseline with their default value (i.e. 
the value used if you run `python -m fedpft.main` directly) + +| Description | Default Value | +| ----------- | ----- | +| total clients | 50 | +| clients per round | 50 | +| number of rounds | 1 | +| client resources | {'num_cpus': 2.0, 'num_gpus': 0.0 }| +| data partition | Dirichlet distribution with $\alpha$=0.1 | +| Number of mixtures | 2 | +| Covariance type | spherical | +| tolerance | 1e-12 | +| maximum GMM iterations | 1e3 | + + +## Environment Setup + +To construct the Python environment, simply run: + +```bash +# Set directory to use python 3.10 (install with `pyenv install 3.10.12` if you don't have it) +pyenv local 3.10.12 + +# Tell poetry to use python3.10 +poetry env use 3.10.12 + +# Install +poetry install +``` + + +## Running the Experiments + +To run the FedPFT baseline with CIFAR100, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: + +```bash +python -m fedpft.main # this will run using the default settings in the `conf/base.yaml` + +# you can override settings directly from the command line +python -m fedpft.main dataset=Caltech101 model=clip # will set dataset to Caltech101 and the pre-trained model to Clip-ViT/B32 +``` + +To run using FedAvg: +```bash +# this will use a frozen, pre-trained model and train the classifier head +python -m fedpft.main strategy=fedavg client=fedavg + +``` + + +## Expected Results + + +With the following commands, we run both FedPFT and FedAvg configurations. + +```bash +python -m fedpft.main --multirun dataset=CIFAR100,Caltech101 + +# FedAvg +python -m fedpft.main --multirun strategy=fedavg client=fedavg dataset=CIFAR100,Caltech101 +``` + +The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the `--multirun` commands above. 
+ +![](_static/FedProx_mnist.png) \ No newline at end of file diff --git a/baselines/fedpft/fedpft/__init__.py b/baselines/fedpft/fedpft/__init__.py new file mode 100644 index 00000000000..a5e567b5913 --- /dev/null +++ b/baselines/fedpft/fedpft/__init__.py @@ -0,0 +1 @@ +"""Template baseline package.""" diff --git a/baselines/fedpft/fedpft/client.py b/baselines/fedpft/fedpft/client.py new file mode 100644 index 00000000000..434055808f8 --- /dev/null +++ b/baselines/fedpft/fedpft/client.py @@ -0,0 +1,170 @@ +"""Define your client class and a function to construct such clients. + +Please overwrite `flwr.client.NumPyClient` or `flwr.client.Client` and create a function +to instantiate your client. +""" + +from collections import OrderedDict +from typing import Callable, Dict, List, Tuple + +import flwr as fl +import torch +from flwr.common.typing import NDArrays, Scalar +from hydra.utils import instantiate +from omegaconf import DictConfig +from torch import nn +from torch.utils.data import DataLoader + +from fedpft.models import extract_features, test, train +from fedpft.utils import gmmparam_to_ndarrays, learn_gmm + + +class FedPFTClient(fl.client.NumPyClient): + """Flower FedPFTClient.""" + + def __init__( + self, + trainloader: DataLoader, + testloader: DataLoader, + feature_extractor: torch.nn.Module, + num_classes: int, + device: torch.device, + ) -> None: + """FedPFT client strategy. 
+ + Implementation based on https://arxiv.org/abs/2402.01862 + + Parameters + ---------- + trainloader : DataLoader + Dataset used for learning GMMs + testloader : DataLoader + Dataset used for evaluating `classifier_head` sent from the server + feature_extractor : torch.nn.Module + Model used to extract features of each client + num_classes : int + Number of total classes in the dataset + device : torch.device + Device used to extract features and evaluate `classifier_head` + """ + self.trainloader = trainloader + self.testloader = testloader + self.feature_extractor = feature_extractor + self.classifier_head = nn.Linear( + feature_extractor.hidden_dimension, num_classes + ) + self.device = device + + def get_parameters(self, config) -> NDArrays: + """Return the parameters of the `classifier_head`.""" + return [ + val.cpu().numpy() for _, val in self.classifier_head.state_dict().items() + ] + + def set_parameters(self, parameters: NDArrays) -> None: + """Set the parameters of the `classifier_head`.""" + params_dict = zip(self.classifier_head.state_dict().keys(), parameters) + state_dict = OrderedDict({k: torch.tensor(v) for k, v in params_dict}) + self.classifier_head.load_state_dict(state_dict, strict=True) + + def fit( + self, parameters: NDArrays, config: Dict[str, Scalar] + ) -> Tuple[NDArrays, int, Dict]: + """Fit a GMM on features and return GMM parameters.""" + # Extracting features + features, labels = extract_features( + dataloader=self.trainloader, + feature_extractor=self.feature_extractor, + device=self.device, + ) + + # Learning GMM + gmm_list = learn_gmm( + features=features, + labels=labels, + n_mixtures=int(config["n_mixtures"]), + cov_type=config["cov_type"], + seed=int(config["seed"]), + tol=float(config["tol"]), + max_iter=int(config["max_iter"]), + ) + + # Reshaping GMM parameters into an NDArray + return [array for gmm in gmm_list for array in gmmparam_to_ndarrays(gmm)], 0, {} + + def evaluate( + self, parameters: NDArrays, config: Dict[str, 
Scalar] + ) -> Tuple[float, int, Dict]: + """Evaluate `classifier_head` on the test data.""" + self.set_parameters(parameters) + loss, acc = test( + classifier_head=self.classifier_head, + dataloader=self.testloader, + feature_extractor=self.feature_extractor, + device=self.device, + ) + return loss, len(self.testloader.dataset), {"accuracy": acc} + + +class FedAvgClient(FedPFTClient): + """Flower FedAvgClient.""" + + def fit( + self, parameters: NDArrays, config: Dict[str, Scalar] + ) -> Tuple[NDArrays, int, Dict]: + """Train the classifier head.""" + self.set_parameters(parameters) + + # train classifier head + opt = torch.optim.AdamW( + params=self.classifier_head.parameters(), lr=float(config["lr"]) + ) + train( + classifier_head=self.classifier_head, + dataloader=self.trainloader, + feature_extractor=self.feature_extractor, + device=self.device, + num_epochs=int(config["num_epochs"]), + opt=opt, + ) + return self.get_parameters(config={}), len(self.trainloader.dataset), {} + + +def generate_client_fn( + client_cfg: DictConfig, + trainloaders: List[DataLoader], + testloaders: List[DataLoader], + feature_extractor: torch.nn.Module, + num_classes: int, + device: torch.device, +) -> Callable[[str], fl.client.NumPyClient]: + """Generate the client function that creates the Flower Clients. 
+ + Parameters + ---------- + client_cfg : DictConfig + Type of client + trainloaders : List[DataLoader] + List of train dataloaders for clients + testloaders : List[DataLoader] + List of test dataloaders for clients + feature_extractor : torch.nn.Module + Pre-trained model as the backbone + num_classes : int + Number of classes in the dataset + device : torch.device + Device to load the `feature_extractor` + """ + + def client_fn(cid: str) -> fl.client.NumPyClient: + """Create a FedPFT client.""" + return instantiate( + client_cfg, + trainloader=trainloaders[int(cid)], + testloader=testloaders[int(cid)], + feature_extractor=feature_extractor, + num_classes=num_classes, + device=device, + ) + + return client_fn diff --git a/baselines/fedpft/fedpft/conf/base.yaml b/baselines/fedpft/fedpft/conf/base.yaml new file mode 100644 index 00000000000..ab1477bd696 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/base.yaml @@ -0,0 +1,15 @@ +--- + +num_clients: 2 +dirichlet_alpha: 0.1 +num_rounds: 1 +num_cpus: 1 +num_gpus: 0.1 +batch_size: 64 +device: cuda + +defaults: + - strategy: fedpft + - client: fedpft + - model: resnet50 + - dataset: CIFAR100 diff --git a/baselines/fedpft/fedpft/conf/client/fedavg.yaml b/baselines/fedpft/fedpft/conf/client/fedavg.yaml new file mode 100644 index 00000000000..10fc2b0f922 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/client/fedavg.yaml @@ -0,0 +1,2 @@ +--- +_target_: fedpft.client.FedAvgClient \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/client/fedpft.yaml b/baselines/fedpft/fedpft/conf/client/fedpft.yaml new file mode 100644 index 00000000000..6ef0f175976 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/client/fedpft.yaml @@ -0,0 +1,2 @@ +--- +_target_: fedpft.client.FedPFTClient \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml b/baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml new file mode 100644 index 00000000000..322c2d80c18 --- /dev/null +++ 
b/baselines/fedpft/fedpft/conf/dataset/CIFAR100.yaml @@ -0,0 +1,10 @@ +--- +_target_: fedpft.dataset.Dataset +name: cifar100 +dataset: CIFAR100 +num_classes: 100 +image_column_name: img +partition_by: fine_label +num_clients: ${num_clients} +dirichlet_alpha: ${dirichlet_alpha} +batch_size: ${batch_size} \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml b/baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml new file mode 100644 index 00000000000..96dcc50fa8d --- /dev/null +++ b/baselines/fedpft/fedpft/conf/dataset/Caltech101.yaml @@ -0,0 +1,10 @@ +--- +_target_: fedpft.dataset.Dataset +name: caltech101 +dataset: clip-benchmark/wds_vtab-caltech101 +num_classes: 102 +image_column_name: webp +partition_by: cls +num_clients: ${num_clients} +dirichlet_alpha: ${dirichlet_alpha} +batch_size: ${batch_size} \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/model/clip.yaml b/baselines/fedpft/fedpft/conf/model/clip.yaml new file mode 100644 index 00000000000..23d350a2347 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/model/clip.yaml @@ -0,0 +1,9 @@ +feature_extractor: + _target_: fedpft.models.clip_vit + name: openai/clip-vit-base-patch32 +transform: + _target_: fedpft.models.transform + mean: [0.48145466, 0.4578275, 0.40821073] + std: [0.26862954, 0.26130258, 0.27577711] +image_input_size: 224 +hidden_dimension: 768 diff --git a/baselines/fedpft/fedpft/conf/model/resnet50.yaml b/baselines/fedpft/fedpft/conf/model/resnet50.yaml new file mode 100644 index 00000000000..260d9151e68 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/model/resnet50.yaml @@ -0,0 +1,8 @@ +feature_extractor: + _target_: fedpft.models.resnet50 +transform: + _target_: fedpft.models.transform + mean: [0.485, 0.456, 0.406] + std: [0.229, 0.224, 0.225] +image_input_size: 224 +hidden_dimension: 2048 diff --git a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml new file mode 100644 index 
00000000000..3a4e290ced2 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml @@ -0,0 +1,12 @@ +--- +_target_: fedpft.strategy.FedAvg +fraction_fit: 1 +fraction_evaluate: 1 +accept_failures: False +on_fit_config_fn: + _target_: fedpft.server.fedavg_get_on_fit_config_fn + lr: 0.001 + num_epochs: 10 +evaluate_metrics_aggregation_fn: + _target_: fedpft.server.weighted_average + _partial_: true \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml new file mode 100644 index 00000000000..c4982074633 --- /dev/null +++ b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml @@ -0,0 +1,22 @@ +--- +_target_: fedpft.strategy.FedPFT +fraction_fit: 1 +fraction_evaluate: 1 +accept_failures: False +num_classes: ${dataset.num_classes} +feature_dimension: ${model.hidden_dimension} +device: ${device} +server_batch_size: 32 +num_epochs: 1 +server_opt: + lr: 1e-4 +on_fit_config_fn: + _target_: fedpft.server.fedpft_get_on_fit_config_fn + n_mixtures: 2 + cov_type: spherical + seed: 0 + tol: 1e-12 + max_iter: 10000 +evaluate_metrics_aggregation_fn: + _target_: fedpft.server.weighted_average + _partial_: true diff --git a/baselines/fedpft/fedpft/dataset.py b/baselines/fedpft/fedpft/dataset.py new file mode 100644 index 00000000000..733234074ef --- /dev/null +++ b/baselines/fedpft/fedpft/dataset.py @@ -0,0 +1,108 @@ +"""Dataset creation.""" + +from typing import Callable, Dict + +from flwr_datasets.federated_dataset import FederatedDataset +from flwr_datasets.partitioner import DirichletPartitioner +from torch.utils.data import DataLoader +from torchvision import transforms + + +class Dataset: + """Dataset class.""" + + def __init__( + self, + dataset: str, + num_clients: int, + batch_size: int, + dirichlet_alpha: float, + partition_by: str, + image_column_name: str, + transform: transforms, + image_input_size: int, + seed: int = 0, + split_size: float = 0.8, + **kwargs, + ) -> None: + 
"""Load the dataset and partition it using dirichlet distribution. + + Parameters + ---------- + dataset : str + Name of dataset to be downloaded from HuggingFace. + num_clients: int + Number of clients. + batch_size: int + Batch size of training and testing dataloaders of clients. + dirichlet_alpha: float + Alpha parameter of Dirichlet distribution. + partition_by: str + Label named used for partitioning the dataset. + image_column_name: str + Column name of image in the dataset. + transform: transforms + Transformation of each batch. + image_input_size: int + Input size of pre-trained model. + seed: int, optional + Seed for partitioning the dataset. Default is 0. + split_size: float, optional + The portion of dataset to be used as training and rest as test. + """ + self.dataset = dataset + self.num_clients = num_clients + self.image_input_size = image_input_size + self.transform = transform + self.batch_size = batch_size + self.dirichlet_alpha = dirichlet_alpha + self.partition_by = partition_by + self.seed = seed + self.split_size = split_size + self.image_column_name = image_column_name + + def get_loaders(self): + """Partition the datasets and return a list of dataloaders.""" + partitioner = DirichletPartitioner( + num_partitions=self.num_clients, + partition_by=self.partition_by, + alpha=self.dirichlet_alpha, + min_partition_size=10, + self_balancing=True, + ) + + fds = FederatedDataset( + dataset=self.dataset, partitioners={"train": partitioner} + ) + # Create train/val for each partition and wrap it into DataLoader + trainloaders, testloaders = [], [] + for partition_id in range(self.num_clients): + partition = fds.load_partition(partition_id) + partition = partition.with_transform(self.apply_batch_transforms()) + partition = partition.train_test_split( + train_size=self.split_size, seed=self.seed + ) + trainloaders.append( + DataLoader(partition["train"], batch_size=self.batch_size) + ) + testloaders.append( + DataLoader(partition["test"], 
batch_size=self.batch_size) + ) + + return trainloaders, testloaders + + def apply_batch_transforms(self) -> Callable[[Dict], Dict]: + """Apply batch transforms for each batch.""" + + def batch_transform(batch): + batch_img = [ + self.transform( + img.resize((self.image_input_size, self.image_input_size)) + ) + for img in batch[self.image_column_name] + ] + batch_label = list(batch[self.partition_by]) + + return {"img": batch_img, "label": batch_label} + + return batch_transform diff --git a/baselines/fedpft/fedpft/dataset_preparation.py b/baselines/fedpft/fedpft/dataset_preparation.py new file mode 100644 index 00000000000..83a9c5dd9e2 --- /dev/null +++ b/baselines/fedpft/fedpft/dataset_preparation.py @@ -0,0 +1 @@ +"""Handle the dataset partitioning and (optionally) complex downloads.""" diff --git a/baselines/fedpft/fedpft/main.py b/baselines/fedpft/fedpft/main.py new file mode 100644 index 00000000000..9860b1232bf --- /dev/null +++ b/baselines/fedpft/fedpft/main.py @@ -0,0 +1,88 @@ +"""Run FL with frozen, pre-trained models.""" + +import pickle +from pathlib import Path + +import flwr as fl +import hydra +import torch +from hydra.core.hydra_config import HydraConfig +from hydra.utils import instantiate +from omegaconf import DictConfig, OmegaConf + +from fedpft.client import generate_client_fn + + +@hydra.main(config_path="conf", config_name="base", version_base=None) +def main(cfg: DictConfig) -> None: + """Run federated learning with frozen, pre-trained models. + + Parameters + ---------- + cfg : DictConfig + An omegaconf object that stores the hydra config. 
+ """ + # Print Config + print(OmegaConf.to_yaml(cfg)) + + # Set device + device = torch.device(cfg.device) + + # Prepare dataset + trainloaders, testloaders = instantiate( + cfg.dataset, + transform=cfg.model.transform, + image_input_size=cfg.model.image_input_size, + ).get_loaders() + + # Define clients + client_fn = generate_client_fn( + client_cfg=cfg.client, + trainloaders=trainloaders, + testloaders=testloaders, + feature_extractor=instantiate(cfg.model.feature_extractor), + num_classes=cfg.dataset.num_classes, + device=device, + ) + + # Setup strategy + strategy = instantiate(cfg.strategy) + + # Start simulation + history = fl.simulation.start_simulation( + client_fn=client_fn, + num_clients=cfg.num_clients, + config=fl.server.ServerConfig(num_rounds=cfg.num_rounds), + strategy=strategy, + client_resources={"num_cpus": cfg.num_cpus, "num_gpus": cfg.num_gpus}, + ) + + # Save results + accuracy_per_round = history.metrics_distributed["accuracy"] + print(accuracy_per_round) + save_path = HydraConfig.get().runtime.output_dir + + strategy_name = strategy.__class__.__name__ + + def format_variable(x): + return f"{x!r}" if isinstance(x, bytes) else x + + file_suffix: str = ( + f"_{format_variable(strategy_name)}" + f"_{format_variable(cfg.dataset.name)}" + f"_clients={format_variable(cfg.num_clients)}" + f"_rounds={format_variable(cfg.num_rounds)}" + f"_finalacc={format_variable(accuracy_per_round[-1][1]):.2f}" + ) + filename = "results" + file_suffix + ".pkl" + + print(f">>> Saving {filename}") + results_path = Path(save_path) / filename + results = {"history": history} + + with open(str(results_path), "wb") as hist_file: + pickle.dump(results, hist_file, protocol=pickle.HIGHEST_PROTOCOL) + + +if __name__ == "__main__": + main() diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py new file mode 100644 index 00000000000..0514b2f3283 --- /dev/null +++ b/baselines/fedpft/fedpft/models.py @@ -0,0 +1,221 @@ +"""Models, training and eval 
functions.""" + +import logging +from typing import List, Optional, Tuple + +import numpy as np +import torch +import torch.utils +import torchvision.transforms as transforms +from flwr.common.logger import log +from torch import nn +from torch.utils.data import DataLoader +from torchvision import models +from transformers import CLIPModel + + +def resnet50() -> torch.nn.modules: + """Return ResNet-50 model as feature extractor.""" + resnet50 = models.resnet50(weights=models.ResNet50_Weights.DEFAULT) + + # Remove last layer and flatten outputs + resnet50 = torch.nn.Sequential( + *(list(resnet50.children())[:-1]), torch.nn.Flatten() + ) + + # Set the hidden_dimension + resnet50.hidden_dimension = 2048 + + return resnet50 + + +def clip_vit(name: str) -> torch.nn.modules: + """Return CLIP-ViT as feature extractor. + + Parameters + ---------- + name : str + Name of the CLIP model on transformer library, + e.g. `openai/clip-vit-base-patch32`. + """ + + class ClipVit(nn.Module): + """Wrap outputs to return only pooled outputs.""" + + def __init__(self, vision_model): + super().__init__() + self.vision_model = vision_model + self.hidden_dimension = vision_model.config.hidden_size + + def forward(self, input): + output = self.vision_model(input) + return output[1] # return pooled_output (CLS token) + + vision_model = CLIPModel.from_pretrained(name).vision_model + + return ClipVit(vision_model) + + +def transform(mean: List, std: List) -> transforms.Compose: + """Return `transforms.Compose` function for normalizing images. + + Parameters + ---------- + mean : List + Sequence of means for each channel + std : List + Sequence of standard deviations for each channel. 
+ + Returns + ------- + transforms.Compose + Transform function for normalizing images + """ + tr = transforms.Compose( + [ + transforms.ToTensor(), + transforms.Normalize(mean, std), + ] + ) + return tr + + +def extract_features( + dataloader: DataLoader, feature_extractor: torch.nn.Module, device: torch.device +) -> Tuple[np.array, np.array]: + """Extract features and labels from images using feature extractor. + + Parameters + ---------- + dataloader : DataLoader + Dataloader containing {'img': img, 'label': label} + dicts to be extracted. + feature_extractor : torch.nn.Module + Model for extracting features. + device : torch.device + Device on which `feature_extractor` is run. + + Returns + ------- + features : np.array + 2D array containing features extracted from `feature_extractor`. + labels : np.array + 1D array containing labels of `features`. + """ + # Match test()/train(): run the frozen extractor in eval mode on `device` + feature_extractor.to(device).eval() + features, labels = [], [] + for batch in dataloader: + with torch.no_grad(): + feature = feature_extractor(batch["img"].to(device)) + features.append(feature.cpu().detach().numpy()) + labels.append(batch["label"].cpu().numpy()) + + # concatenate features and labels into single numpy arrays + features = np.concatenate(features, axis=0, dtype=np.float64) + labels = np.concatenate(labels, dtype=int) + + return features, labels + + +def test( + classifier_head: torch.nn.Linear, + dataloader: DataLoader, + feature_extractor: torch.nn.Module, + device: torch.device, +) -> Tuple[float, float]: + """Evaluate the `classifier_head` on the dataset. + + Parameters + ---------- + classifier_head : torch.nn.Linear + Classifier head model. + dataloader : DataLoader + Dataset used for evaluating `classifier_head` containing + {'img': img, 'label': label} dicts. + feature_extractor : torch.nn.Module + Model used for extracting features from the `dataloader`. 
+ device : torch.device + Device for loading `feature_extractor`. 
+ + Returns + ------- + loss : float + CrossEntropy Loss of `classifier_head` on the dataset. + accuracy : float + Accuracy of `classifier_head` on the dataset. + """ + classifier_head.eval() + feature_extractor.eval() + classifier_head.to(device) + feature_extractor.to(device) + + correct, total, loss = 0, 0, 0 + for dict in dataloader: + samples = dict["img"].to(device) + labels = dict["label"].to(device) + with torch.no_grad(): + feature = feature_extractor(samples) + output = classifier_head(feature) + pred = torch.max(output, 1)[1].data.squeeze() + correct += (pred == labels).sum().item() + total += samples.shape[0] + running_loss = nn.CrossEntropyLoss()(output, labels) + loss += running_loss + + return loss.cpu().item(), correct / total + + +def train( + classifier_head: torch.nn.Linear, + dataloader: DataLoader, + opt: torch.optim.Optimizer, + num_epochs: int, + device: torch.device, + feature_extractor: Optional[torch.nn.Module] = None, + verbose: Optional[bool] = False, +) -> None: + """Trains the `classifier_head`. + + Parameters + ---------- + classifier_head : torch.nn.Linear + Classifier head model. + dataloader : DataLoader + Dataset used for evaluating `classifier_head` + containing {'img': img, 'label': label} dicts. + opt : torch.optim.Optimizer + Optimizer for the `classifier_head`. + num_epochs: int + Number of epochs to train the `classifier_head`. + device : torch.device + Device for loading `feature_extractor`. + feature_extractor : torch.nn.Module, Optional + Model used for extracting features from the `dataloader`, optional. + `verbose` : bool, Optional + Whether or not log the accuracy during the training. Defaults to False. 
+ """ + classifier_head.to(device) + if feature_extractor: + feature_extractor.eval() + feature_extractor.to(device) + + for epoch in range(num_epochs): + correct, total, loss = 0, 0, 0 + for _, dict in enumerate(dataloader): + classifier_head.zero_grad() + samples = dict["img"].to(device) + labels = dict["label"].to(device) + if feature_extractor: + with torch.no_grad(): + samples = feature_extractor(samples) + output = classifier_head(samples) + pred = torch.max(output, 1)[1].data.squeeze() + correct += (pred == labels).sum().item() + total += samples.shape[0] + running_loss = nn.CrossEntropyLoss()(output, labels) + loss += running_loss + running_loss.backward() + opt.step() + if verbose: + log(logging.INFO, f"Epoch:{epoch+1} --- Accuracy: {correct/total}") diff --git a/baselines/fedpft/fedpft/server.py b/baselines/fedpft/fedpft/server.py new file mode 100644 index 00000000000..00d88360e9f --- /dev/null +++ b/baselines/fedpft/fedpft/server.py @@ -0,0 +1,94 @@ +"""Create global evaluation function.""" + +from typing import Callable, Dict, List, Tuple + +from flwr.common import Metrics + + +def fedpft_get_on_fit_config_fn( + n_mixtures: int, cov_type: str, seed: int, tol: float, max_iter: int +) -> Callable[[int], Dict[str, str]]: + """Return a function which returns FedPFT training configurations. 
+ + Parameters + ---------- + n_mixtures : int + Number of mixtures for GMMs + cov_type : str + Type of covariance + seed : int + Seed for learning and sampling from the GMMs + tol : float + Error tolerance for learning GMMs + max_iter : int + Maximum number of iterations for EM algorithm + + Returns + ------- + Callable[[int], Dict[str, str]] + Function to return a config with the GMM settings listed above + """ + + def fit_config(server_round: int) -> Dict[str, str]: + """Return a configuration for training Gaussian Mixtures.""" + config = { + "n_mixtures": str(n_mixtures), + "cov_type": cov_type, + "seed": str(seed), + "tol": str(tol), + "max_iter": str(max_iter), + } + return config + + return fit_config + + +def fedavg_get_on_fit_config_fn( + lr: float, + num_epochs: int, +) -> Callable[[int], Dict[str, str]]: + """Return a function which returns FedAvg training configurations. + + Parameters + ---------- + lr : float + Client's learning rate + num_epochs : int + Number of epochs for local learning of clients + + Returns + ------- + Callable[[int], Dict[str, str]] + Function to return a config with the `lr` and `num_epochs` + """ + + def fit_config(server_round: int) -> Dict[str, str]: + """Return a configuration with number of epochs and learning rate.""" + config = { + "lr": str(lr), + "num_epochs": str(num_epochs), + } + return config + + return fit_config + + +def weighted_average(metrics: List[Tuple[int, Metrics]]) -> Metrics: + """Aggregate with weighted average during evaluation. + + Parameters + ---------- + metrics : List[Tuple[int, Metrics]] + The list of metrics to aggregate. + + Returns + ------- + Metrics + The weighted average metric. 
+ """ + # Multiply accuracy of each client by number of examples used + accuracies = [num_examples * float(m["accuracy"]) for num_examples, m in metrics] + examples = [num_examples for num_examples, _ in metrics] + + # Aggregate and return custom metric (weighted average) + return {"accuracy": int(sum(accuracies)) / int(sum(examples))} diff --git a/baselines/fedpft/fedpft/strategy.py b/baselines/fedpft/fedpft/strategy.py new file mode 100644 index 00000000000..f9546140124 --- /dev/null +++ b/baselines/fedpft/fedpft/strategy.py @@ -0,0 +1,145 @@ +"""FedPFT strategy.""" + +from typing import Dict, List, Optional, Tuple, Union + +import torch +from flwr.common import ( + FitRes, + Parameters, + Scalar, + ndarrays_to_parameters, + parameters_to_ndarrays, +) +from flwr.server.client_proxy import ClientProxy +from flwr.server.strategy import FedAvg +from omegaconf import DictConfig +from sklearn.mixture import GaussianMixture as GMM +from torch.utils.data import DataLoader + +from fedpft.models import train +from fedpft.utils import chunks, ndarrays_to_gmmparam + + +class FedPFT(FedAvg): + """Implementation of FedPFT. + + https://arxiv.org/abs/2402.01862 + Authors: + Mahdi Beitollahi, Alex Bie, Sobhan Hemati, Leo Maxime Brunswic, + Xu Li, Xi Chen, Guojun Zhang. + """ + + def __init__( + self, + *args, + num_classes: int, + feature_dimension: int, + server_opt: DictConfig, + server_batch_size: int, + num_epochs: int, + device: torch.device, + **kwargs, + ) -> None: + """Create FedPFT strategy. + + Parameters + ---------- + num_classes : int + Number of classes in the dataset. + feature_dimension : int + Size of feature embeddings + server_opt : DictConfig + Configuration of server optimizer for training classifier head. + server_batch_size : int + Batch size of synthetic features. + num_epochs : int + Number of epochs to train the classifier head. + + Attributes + ---------- + device : torch.device() + Device to train the classifier head at the server. 
+ """ + super().__init__(*args, **kwargs) + self.num_classes = num_classes + self.feature_dimension = feature_dimension + self.server_opt = server_opt + self.server_batch_size = server_batch_size + self.num_epochs = num_epochs + self.device = device + + def aggregate_fit( + self, + server_round: int, + results: List[Tuple[ClientProxy, FitRes]], + failures: List[Union[Tuple[ClientProxy, FitRes], BaseException]], + ) -> Tuple[Optional[Parameters], Dict[str, Scalar]]: + """Learn a classifier head by generating samples from the GMMs.""" + # Do not aggregate if there are failures. + if not self.accept_failures and failures: + raise Exception("there are failures and failures are not accepted") + + config = self.on_fit_config_fn(server_round) + + # Sample from the GMMs to create synthetic feature dataset + synthetic_features_dataset = [] + for _, fit_res in results: + # Convert byte parameters into ndarrays and GMMParameters + ndarray = parameters_to_ndarrays(fit_res.parameters) + all_gmm_parameters = [ + ndarrays_to_gmmparam(array) for array in chunks(ndarray, 5) + ] + + # Sample from GMM_label pairs to create synthetic features + for gmm_parameter in all_gmm_parameters: + gmm = GMM( + n_components=int(config["n_mixtures"]), + covariance_type=config["cov_type"], + random_state=int(config["seed"]), + tol=float(config["tol"]), + max_iter=int(config["max_iter"]), + ) + # Set values of the GMMs + gmm.means_ = gmm_parameter.means.astype("float32") + gmm.weights_ = gmm_parameter.weights.astype("float32") + gmm.covariances_ = gmm_parameter.covariances.astype("float32") + + # Sample features + syn_features, _ = gmm.sample(gmm_parameter.num_samples) + syn_features = torch.tensor(syn_features, dtype=torch.float32) + gmm_labels = torch.tensor( + [int(gmm_parameter.label)] * int(gmm_parameter.num_samples) + ) + + # Add to train data + synthetic_features_dataset += list(zip(syn_features, gmm_labels)) + + # Train a classifier head + synthetic_features_dataset = [ + {"img": img, 
"label": label} for img, label in synthetic_features_dataset + ] + synthetic_loader = DataLoader( + synthetic_features_dataset, + batch_size=self.server_batch_size, + shuffle=True, + ) + classifier_head = torch.nn.Linear(self.feature_dimension, self.num_classes) + opt = torch.optim.AdamW( + params=classifier_head.parameters(), lr=self.server_opt.lr + ) + + train( + classifier_head=classifier_head, + dataloader=synthetic_loader, + device=self.device, + num_epochs=self.num_epochs, + opt=opt, + verbose=True, + ) + + # Send the classifier head to clients + classifier_ndarray = [ + val.cpu().numpy() for _, val in classifier_head.state_dict().items() + ] + + return ndarrays_to_parameters(classifier_ndarray), {} diff --git a/baselines/fedpft/fedpft/utils.py b/baselines/fedpft/fedpft/utils.py new file mode 100644 index 00000000000..c1a27c14647 --- /dev/null +++ b/baselines/fedpft/fedpft/utils.py @@ -0,0 +1,102 @@ +"""Utility functions.""" + +from dataclasses import dataclass +from typing import List + +import numpy as np +from flwr.common import NDArrays +from sklearn.mixture import GaussianMixture + + +@dataclass +class GMMParameters: + """GMM parameters.""" + + label: int + means: NDArrays + weights: NDArrays + covariances: NDArrays + num_samples: int + + +def gmmparam_to_ndarrays(gmm: GMMParameters) -> NDArrays: + """Convert gmm object to NumPy ndarrays.""" + return [gmm.label, gmm.means, gmm.weights, gmm.covariances, gmm.num_samples] + + +def ndarrays_to_gmmparam(ndarrays: NDArrays) -> GMMParameters: + """Convert NumPy ndarray to GMM object.""" + return GMMParameters( + label=ndarrays[0], + means=ndarrays[1], + weights=ndarrays[2], + covariances=ndarrays[3], + num_samples=ndarrays[4], + ) + + +def learn_gmm( + features: np.array, + labels: np.array, + n_mixtures: int, + cov_type: str, + seed: int, + tol: float = 1e-12, + max_iter: int = 1000, +) -> List[GMMParameters]: + """Learn a list of 16-bits GMMs for each label. 
+ + Parameters + ---------- + features : np.array + A 2-d array with size (n_samples, feature_dimension) containing + extracted features for all the samples. + labels : np.array + An array with size (n_samples) containing labels associated for + each sample in `features`. + n_mixtures : int + Number of mixtures in each Gaussian Mixture. + cov_type : str + Covariance type of Gaussian Mixtures, e.g. spherical. + seed: int + Seed for learning and sampling from Gaussian Mixtures. + tol: float + Tolerance of Gaussian Mixtures. + max_iter: int + Number of maximum iterations to learn the Gaussian Mixtures. + + Returns + ------- + List[GMMParameters] + Returns a list containing the GMMParameters for each class. + """ + gmm_list = [] + for label in np.unique(labels): + cond_features = features[label == labels] + if ( + len(cond_features) > n_mixtures + ): # number of samples should be larger than `n_mixtures`. + gmm = GaussianMixture( + n_components=n_mixtures, + covariance_type=cov_type, + random_state=seed, + tol=tol, + max_iter=max_iter, + ) + gmm.fit(cond_features) + gmm_list.append( + GMMParameters( + label=label, + means=gmm.means_.astype("float16"), + weights=gmm.weights_.astype("float16"), + covariances=gmm.covariances_.astype("float16"), + num_samples=len(cond_features), + ) + ) + return gmm_list + + +def chunks(lst, n): + """Yield successive n-sized chunks from lst.""" + for i in range(0, len(lst), n): + yield lst[i : i + n] diff --git a/baselines/fedpft/pyproject.toml b/baselines/fedpft/pyproject.toml new file mode 100644 index 00000000000..30e47defbda --- /dev/null +++ b/baselines/fedpft/pyproject.toml @@ -0,0 +1,143 @@ +[build-system] +requires = ["poetry-core>=1.4.0"] +build-backend = "poetry.masonry.api" + +[tool.poetry] +name = "fedpft" # <----- Ensure it matches the name of your baseline directory containing all the source code +version = "1.0.0" +description = "Flower Baselines" +license = "Apache-2.0" +authors = ["The Flower Authors "] +readme = 
"README.md" +homepage = "https://flower.ai" +repository = "https://github.com/adap/flower" +documentation = "https://flower.ai" +classifiers = [ + "Development Status :: 3 - Alpha", + "Intended Audience :: Developers", + "Intended Audience :: Science/Research", + "License :: OSI Approved :: Apache Software License", + "Operating System :: MacOS :: MacOS X", + "Operating System :: POSIX :: Linux", + "Programming Language :: Python", + "Programming Language :: Python :: 3", + "Programming Language :: Python :: 3 :: Only", + "Programming Language :: Python :: 3.8", + "Programming Language :: Python :: 3.9", + "Programming Language :: Python :: 3.10", + "Programming Language :: Python :: 3.11", + "Programming Language :: Python :: Implementation :: CPython", + "Topic :: Scientific/Engineering", + "Topic :: Scientific/Engineering :: Artificial Intelligence", + "Topic :: Scientific/Engineering :: Mathematics", + "Topic :: Software Development", + "Topic :: Software Development :: Libraries", + "Topic :: Software Development :: Libraries :: Python Modules", + "Typing :: Typed", +] + +[tool.poetry.dependencies] +python = ">=3.8.15, <3.12.0" # don't change this +flwr = { extras = ["simulation"], version = "1.5.0" } +hydra-core = "1.3.2" # don't change this +torch = {url = "https://download.pytorch.org/whl/cu117/torch-1.13.0%2Bcu117-cp310-cp310-linux_x86_64.whl"} +scikit-learn = "1.2.2" +flwr-datasets = "0.1.0" +torchvision = {url = "https://download.pytorch.org/whl/cu117/torchvision-0.14.0%2Bcu117-cp310-cp310-linux_x86_64.whl"} +transformers = "4.39.3" +datasets = "2.18.0" + +[tool.poetry.dev-dependencies] +isort = "==5.13.2" +black = "==24.2.0" +docformatter = "==1.7.5" +mypy = "==1.4.1" +pylint = "==2.8.2" +flake8 = "==3.9.2" +pytest = "==6.2.4" +pytest-watch = "==4.2.0" +ruff = "==0.0.272" +types-requests = "==2.27.7" + +[tool.isort] +line_length = 88 +indent = " " +multi_line_output = 3 +include_trailing_comma = true +force_grid_wrap = 0 +use_parentheses = true + 
+[tool.black] +line-length = 88 +target-version = ["py38", "py39", "py310", "py311"] + +[tool.pytest.ini_options] +minversion = "6.2" +addopts = "-qq" +testpaths = [ + "flwr_baselines", +] + +[tool.mypy] +ignore_missing_imports = true +strict = false +plugins = "numpy.typing.mypy_plugin" + +[tool.pylint."MESSAGES CONTROL"] +disable = "bad-continuation,duplicate-code,too-few-public-methods,useless-import-alias" +good-names = "i,j,k,_,x,y,X,Y" +signature-mutators = "hydra.main.main" + +[tool.pylint.typecheck] +generated-members = "numpy.*, torch.*, tensorflow.*" + +[[tool.mypy.overrides]] +module = [ + "importlib.metadata.*", + "importlib_metadata.*", +] +follow_imports = "skip" +follow_imports_for_stubs = true +disallow_untyped_calls = false + +[[tool.mypy.overrides]] +module = "torch.*" +follow_imports = "skip" +follow_imports_for_stubs = true + +[tool.docformatter] +wrap-summaries = 88 +wrap-descriptions = 88 + +[tool.ruff] +target-version = "py38" +line-length = 88 +select = ["D", "E", "F", "W", "B", "ISC", "C4"] +fixable = ["D", "E", "F", "W", "B", "ISC", "C4"] +ignore = ["B024", "B027"] +exclude = [ + ".bzr", + ".direnv", + ".eggs", + ".git", + ".hg", + ".mypy_cache", + ".nox", + ".pants.d", + ".pytype", + ".ruff_cache", + ".svn", + ".tox", + ".venv", + "__pypackages__", + "_build", + "buck-out", + "build", + "dist", + "node_modules", + "venv", + "proto", +] + +[tool.ruff.pydocstyle] +convention = "numpy" From d8214b5e00a6a45a4ad426af562c433948d9fd1e Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:41:38 -0400 Subject: [PATCH 13/29] fixd model to gpu bug --- baselines/fedpft/fedpft/models.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py index 0514b2f3283..7ebc9beed4a 100644 --- a/baselines/fedpft/fedpft/models.py +++ b/baselines/fedpft/fedpft/models.py @@ -102,6 +102,8 @@ def extract_features( labels : np.array 2D array containing labels of `features`. 
""" + feature_extractor.to(device) + features, labels = [], [] for dict in dataloader: batch_samples = dict["img"].to(device) @@ -109,7 +111,7 @@ def extract_features( with torch.no_grad(): feature = feature_extractor(batch_samples) features.append(feature.cpu().detach().numpy()) - labels.append(batch_label) + labels.append(batch_label.cpu().detach().numpy()) # reshape feauturs and labels into a single numpy array features = np.concatenate(features, axis=0, dtype=np.float64) From 03ca12463b4335ba66e11d2c954b2f760da0ee73 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:42:26 -0400 Subject: [PATCH 14/29] fixed config --- baselines/fedpft/fedpft/conf/base.yaml | 4 ++-- baselines/fedpft/fedpft/conf/strategy/fedavg.yaml | 2 +- baselines/fedpft/fedpft/conf/strategy/fedpft.yaml | 4 ++-- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/baselines/fedpft/fedpft/conf/base.yaml b/baselines/fedpft/fedpft/conf/base.yaml index ab1477bd696..01b1495c241 100644 --- a/baselines/fedpft/fedpft/conf/base.yaml +++ b/baselines/fedpft/fedpft/conf/base.yaml @@ -1,10 +1,10 @@ --- -num_clients: 2 +num_clients: 50 dirichlet_alpha: 0.1 num_rounds: 1 num_cpus: 1 -num_gpus: 0.1 +num_gpus: 1 batch_size: 64 device: cuda diff --git a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml index 3a4e290ced2..5f9e1d9e777 100644 --- a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml +++ b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml @@ -6,7 +6,7 @@ accept_failures: False on_fit_config_fn: _target_: fedpft.server.fedavg_get_on_fit_config_fn lr: 0.001 - num_epochs: 10 + num_epochs: 1 evaluate_metrics_aggregation_fn: _target_: fedpft.server.weighted_average _partial_: true \ No newline at end of file diff --git a/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml index c4982074633..5612193071d 100644 --- a/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml +++ 
b/baselines/fedpft/fedpft/conf/strategy/fedpft.yaml @@ -7,12 +7,12 @@ num_classes: ${dataset.num_classes} feature_dimension: ${model.hidden_dimension} device: ${device} server_batch_size: 32 -num_epochs: 1 +num_epochs: 50 server_opt: lr: 1e-4 on_fit_config_fn: _target_: fedpft.server.fedpft_get_on_fit_config_fn - n_mixtures: 2 + n_mixtures: 1 cov_type: spherical seed: 0 tol: 1e-12 From 791de9facdcf305ccb1e8a9ad39c667034211dcf Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:43:04 -0400 Subject: [PATCH 15/29] added notebook for visualization --- .../fedpft/docs/viz_and_plot_results.ipynb | 204 ++++++++++++++++++ 1 file changed, 204 insertions(+) create mode 100644 baselines/fedpft/docs/viz_and_plot_results.ipynb diff --git a/baselines/fedpft/docs/viz_and_plot_results.ipynb b/baselines/fedpft/docs/viz_and_plot_results.ipynb new file mode 100644 index 00000000000..866ffb5d8c7 --- /dev/null +++ b/baselines/fedpft/docs/viz_and_plot_results.ipynb @@ -0,0 +1,204 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 2, + "id": "5e0cf2a9-b782-48de-ac45-128726a26e64", + "metadata": {}, + "outputs": [ + { + "ename": "ModuleNotFoundError", + "evalue": "No module named 'matplotlib'", + "output_type": "error", + "traceback": [ + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", + "Cell \u001b[1;32mIn[2], line 7\u001b[0m\n\u001b[0;32m 4\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mos\u001b[39;00m\n\u001b[0;32m 6\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mnumpy\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mnp\u001b[39;00m\n\u001b[1;32m----> 7\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mmatplotlib\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mpyplot\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m 
\u001b[38;5;21;01mplt\u001b[39;00m\n", + "\u001b[1;31mModuleNotFoundError\u001b[0m: No module named 'matplotlib'" + ] + } + ], + "source": [ + "import pickle\n", + "import yaml\n", + "from pathlib import Path\n", + "import os\n", + "\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "7ea3e149-ce6f-4ba0-aa41-e0501a04efe3", + "metadata": {}, + "outputs": [], + "source": [ + "def saveFig(name, fig):\n", + " fig.savefig(\n", + " name,\n", + " dpi=None,\n", + " facecolor=fig.get_facecolor(),\n", + " edgecolor=\"none\",\n", + " orientation=\"portrait\",\n", + " format=\"png\",\n", + " transparent=False,\n", + " bbox_inches=\"tight\",\n", + " pad_inches=0.2,\n", + " metadata=None,\n", + " )" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "id": "4b010856-0d99-4d81-8fb0-7a927f10eeaf", + "metadata": {}, + "outputs": [], + "source": [ + "# Update the path belows to the directories containing the results for FedPFT and FedAvg\n", + "path_fedpft_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n", + "path_fedpft_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-44-20')\n", + "\n", + "path_fedavg_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','18-16-41')\n", + "path_fedavg_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "id": "2e3e165c-1ce6-4efa-a4e1-1372586e436e", + "metadata": {}, + "outputs": [], + "source": [ + "# load results\n", + "def read_accuracies(path_to_pickle):\n", + " for result in list(Path(path_to_pickle).glob(\"*.pkl\")):\n", + " with open(result, \"rb\") as handle:\n", + " data = pickle.load(handle)\n", + "\n", + " accuracies = data['history'].metrics_distributed['accuracy']\n", + " return accuracies\n" + ] + }, + { + "cell_type": "code", + 
"execution_count": 33, + "id": "77b70c73", + "metadata": {}, + "outputs": [], + "source": [ + "fedpft_cifar = read_accuracies(path_fedpft_resutls_cifar100)\n", + "fedpft_caltech = read_accuracies(path_fedpft_resutls_caltech101)\n", + "fedavg_cifar = read_accuracies(path_fedavg_resutls_cifar100)\n", + "fedavg_caltech = read_accuracies(path_fedavg_resutls_caltech101)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "6f4c87ad", + "metadata": {}, + "outputs": [], + "source": [ + "fedavg_cifar = [(1, 0.06924765515865097),\n", + " (2, 0.1315106765116743),\n", + " (3, 0.16773099181800039),\n", + " (4, 0.1946717222111355),\n", + " (5, 0.2171223308720814),\n", + " (6, 0.2375773298742766),\n", + " (7, 0.2597285970864099),\n", + " (8, 0.276092596288166),\n", + " (9, 0.290560766314109),\n", + " (10, 0.3036320095789264),\n", + " (11, 0.3128118140091798),\n", + " (12, 0.3261823987228098),\n", + " (13, 0.33745759329475156),\n", + " (14, 0.3477349830373179),\n", + " (15, 0.35831171422869684),\n", + " (16, 0.36679305527838757),\n", + " (17, 0.37407703053282776),\n", + " (18, 0.3817601277190182),\n", + " (19, 0.38824585910995807),\n", + " (20, 0.3942326880862103)]" + ] + }, + { + "cell_type": "code", + "execution_count": 59, + "id": "e1a678de", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "No artists with labels found to put in legend. Note that artists whose label start with an underscore are ignored when legend() is called with no argument.\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "def viz():\n", + " fig, axs = plt.subplots(figsize=(10, 2), nrows=1, ncols=2)\n", + " \n", + " # cifar100 - fedavg\n", + " axs[0].plot([r for r, _ in fedavg_cifar], [a for _, a in fedavg_cifar], label='FedAvg', linewidth=2.0)\n", + " \n", + " axs[0].set_title('CIFAR100 - ResNet50')\n", + " \n", + " for ax in axs:\n", + " ax.set_xticks([1, 5, 10 , 15, 20])\n", + " ax.grid()\n", + " ax.legend(fontsize=14, loc='lower right')\n", + " ax.set_xlabel(\"Round\", fontsize=14)\n", + " ax.set_ylabel(\"Accuracy\", fontsize=14)\n", + "\n", + " return fig\n", + "\n", + "f = viz()\n" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "92460065", + "metadata": {}, + "outputs": [], + "source": [ + "saveFig(\"FedProx_mnist.png\", f)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.11" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} From 90bd5ce81d086937bd9b0e4a1839b5de37a9fc09 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 22:43:34 -0400 Subject: [PATCH 16/29] completed readme file --- baselines/fedpft/README.md | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index 3f045810835..3370fd22d8f 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -51,10 +51,10 @@ dataset: [CIFAR100, Caltech101] # list of datasets you include in your baseline. 
| number of rounds | 1 | | client resources | {'num_cpus': 2.0, 'num_gpus': 0.0 }| | data partition | distribution with $\alpha$=0.1 | -| Number of mixtures | 2 | +| Number of mixtures | 1 | | Covariance type | spherical | | tolerance | 1e-12 | -| maximum GMM iterations | 1e3 | +| maximum EM iterations | 1e3 | ## Environment Setup @@ -98,10 +98,13 @@ python -m fedpft.main strategy=FedAvg client=FedAvg With the following command, we run both FedPFT and FedAvg configurations. ```bash -python -m fedprox.main --multirun dataset=CIFAR100, Caltech101 +# FedPFT +python -m fedprox.main dataset=CIFAR100 model=resnet50 +python -m fedprox.main dataset=Caltech101 model=clip -# FedAvg -python -m fedprox.main --multirun strategy=fedavg client=fedavg dataset=CIFAR100, Caltech101 +# FedAvg with pre-trained, frozen models +python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 +python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=clip num_rounds=20 fedavg.num_epochs=10 fedavg.lr=0.01 num_gpus=0.2 ``` The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the `--multirun` commands above. 
From eee619cec8964f74bd2ea892fad8f6b4683a64bc Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 23:47:09 -0400 Subject: [PATCH 17/29] fixed cofig --- baselines/fedpft/fedpft/conf/strategy/fedavg.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml index 5f9e1d9e777..166bcd10aef 100644 --- a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml +++ b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml @@ -5,8 +5,8 @@ fraction_evaluate: 1 accept_failures: False on_fit_config_fn: _target_: fedpft.server.fedavg_get_on_fit_config_fn - lr: 0.001 - num_epochs: 1 + lr: 0.01 + num_epochs: 10 evaluate_metrics_aggregation_fn: _target_: fedpft.server.weighted_average _partial_: true \ No newline at end of file From c0d45be2a4a6470a17471ac463dff348c22bcf60 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Sun, 14 Apr 2024 23:47:39 -0400 Subject: [PATCH 18/29] fixed readme --- baselines/fedpft/README.md | 18 +++++++++--------- 1 file changed, 9 insertions(+), 9 deletions(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index 3370fd22d8f..c25f6de8f71 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -75,19 +75,19 @@ poetry install ## Running the Experiments -To run this FedProx with CIFAR100 baseline, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: +To run this FedPFT with CIFAR100 baseline, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: ```bash python -m fedpft.main # this will run using the default settings in the `conf/config.yaml` # you can override settings directly from the command line -python -m fedprox.main dataset=Caltech101 model=clip # will set dataset to Caltech101 and the pre-trained model to Clip-ViT/B32 +python -m fedpft.main dataset=Caltech101 model=clip # will set dataset to 
Caltech101 and the pre-trained model to Clip-ViT/B32 ``` To run using FedAvg: ```bash # this will use a frozen, pre-trained model and train the classifier head -python -m fedpft.main strategy=FedAvg client=FedAvg +python -m fedpft.main strategy=FedAvg client=FedAvg num_rounds=20 dataset=Caltech101 model=clip num_gpus=0.2 ``` @@ -99,14 +99,14 @@ With the following command, we run both FedPFT and FedAvg configurations. ```bash # FedPFT -python -m fedprox.main dataset=CIFAR100 model=resnet50 -python -m fedprox.main dataset=Caltech101 model=clip +python -m fedpft.main dataset=CIFAR100 model=resnet50 +python -m fedpft.main dataset=Caltech101 model=clip # FedAvg with pre-trained, frozen models -python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 -python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=clip num_rounds=20 fedavg.num_epochs=10 fedavg.lr=0.01 num_gpus=0.2 +python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 strategy.on_fit_config_fn.num_epochs=1=1 num_gpus=0.5 +python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=clip num_rounds=20 num_gpus=0.2 ``` -The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the `--multirun` commands above. +The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the commands above. 
-![](_static/FedProx_mnist.png) \ No newline at end of file +![](_static/FedPft.png) \ No newline at end of file From aa4f198b604c21eb92880b8ec89d70c948c34f2f Mon Sep 17 00:00:00 2001 From: Mahdi Date: Mon, 15 Apr 2024 00:12:08 -0400 Subject: [PATCH 19/29] add plots --- baselines/fedpft/_static/FedPft.png | Bin 0 -> 28010 bytes 1 file changed, 0 insertions(+), 0 deletions(-) create mode 100644 baselines/fedpft/_static/FedPft.png diff --git a/baselines/fedpft/_static/FedPft.png b/baselines/fedpft/_static/FedPft.png new file mode 100644 index 0000000000000000000000000000000000000000..76028f4f24b02b424b9bbbb2ffff0a37d260f45c GIT binary patch literal 28010 zcmd43WmHye*EV{Ql2QsH2ndLDmr6<_-QAMXNH-!SAR-DS@|J?VuAAN>5Ue{XdJkL3gdBloRQ;{RYyN-uKp$HY^r8Q6}3>y>* z4F?As{$#@QSv&l8$3sTXL(|#X!^_<5AxhcY!{w2)$0IunI?so0?sm>je4Ij@{OokL z9v&|4ce%J6|K|rdo!xA>$isyD;X`m;r+CD^WF*$06U!iX!=Pnwd_>1_)jqwsPIt9{Jhwob z&A_Ipgsd|JJru8(V4)!>O(^6!3XSwd%YnObE#o(RAtD~HjkMn)a`ZT%DEfc@46%^~ zT#}If_YZr2%U^O%su<}N8PA$VTONy#*6x&A4C2B;m71Z-}Tyf)}Maw z^^vQP^AtgpbZ86(*Q=unLVYDA0!C6?LFcJrTYP-{FlqWhL#1Qi*yrZvuCmx1ckf;& zV^Rvv&%a$NMAWd`e@}5jk&*NRk&TT_?q8E8e_S>; zHhD(U$xp6Qj@0ku;&sL&a&vD@dCwC*dGdsgfkEownQ^_Rc}FBkfoZcCBdJ1`^T(8w zlw?sqK_eq0Ge<{4Q&UrT)&<4~Yd@=Or<+6{J$f{=w)U)0Gk@;y>L}Jmea_B7N=XUF z-N%2Pv_}v*oawpkNV6o!mpf03B`xmcq$DTntp#L?`jMNPn|mMai(~`*UPj+vD6#w)j-p0YlZ~sxG`+&Ci)#=|+(_|4JUVndoGbbk#tE@`%c5H7y zzxLi1OYE7MnF%gyI>xiMw!X$=Asw>Xi5b62(x$Wd9p32Hf zm!+?iU(@c8U7VkA1)gqyzJD^mzM&zT=ya7$e75bxM@K4hE|X$U(^s!v z=`{z6qUi42p}cgNx+PmChWN&fSjUNvEG6~UebowCezklcdonQRmGJBuk8n=YQv{?o$6h1k7 z%ktnma~qrd$_AYh1HDSCD2>#Zn3!JQH|PJBi{awRA}p6)xfz;>h{ymuqjgLZMY%ZY z*5kjcgVlDL-oCzb`|A@}r6=t~;%0LlQQjA42PD+g&%WoYTK*X>lz;G`9X8a}RT&wX z+4{{UsrILYv+L_6yB7TX{8#WPIHk{y|MHl(VScKwXJBE$MLzmuvpF6fj`>)*xqVH# zc#zoA*A&h7^B1sD5?}zG(5Sjno+>s?EX8h+@ce&)7{Ii?h}3uIN4|6AR;8Z zio*GpAzQzpbm4ScC5_q5_-ON$kST8H zVQnt#`p}q|2MH&1XS3z9yz-_2f3KP}2gVXo3BI-Nd&Bx=^+!=eyx4KU@MoXHt(z*D zVzD=+o|<((zxgTXLaaYSv}o`nX%y!AL`?)8&L^+Uj3HhjA)(~tD`(RVn^TS40s@_f 
z+w)f)b#!#D-ScG6&d%Oi9%MjCC@SJXo8h+Tz!@7KXC3)_a3HtXn^fU<;1p}YNeG*3 zY+{1p?p=dIQ9eGhtgNg8-7*?>4vyKSrKkE;);Ib1H0>HABXO#or)fMrJqwI#d9U-^ z2K($T6;j*4#d*)i3YEk0#0gciGWz{3Q?AUUQSF1h_So3iTUfF~C~H^0w70c!yDurB zB+~Cbz9J>ELsZn$-_Pk0S&$dRM$hZi*(aVV=y-p$)OdDz8Rx-+2mFu5h#f|XS@y2M z9+v*{iUSR0+4W4lforkxys+Rvuy$-r@7axeQ{pUxK<$PBxw~&yo{sxpFH(Y6xKc#mPc}a;rp{1t> z*V>v|*rxk%^k$gH^1w|fM%hp}a>rGn7W4`zYQNV~Zy?zitH3}$>E31ohJ%9x94`u} z&EF3{?GPRQc(2W-?yp;F)Jo;tkfr5nYwM>{5tosrd){M(LqMQa zA6ru+M9ygx`TRLCatk-^dZ199JOVz>7#&#&B?cebzP#q*2|V@o_VKwXC`b;)QO3aF zIy*c2mCtFs5Aoh>7d;&qQ0wUEFzbxIiY#rZaeeeJxt+8`@!Lm-hb@?L7MI?Tzw%R#E8+00i028R2umd|_!weSbav_)inr($e zFNhrc_t#R8JwLngtG;d2G>8N6RTgxWP$ecd?vHIx1q6`_KK`Ld@ud0UoDD@hQfkbG zbAQ9-DV*2B;(N9Obge&s*0#*Q#zdK~ja9T&*?a>qhB-Ue8FL>_x7JgIM?WiNxOsR; zph%TepN)TTz(TcU2A#7&p=CF1YUsWhn|P=vL}G^$cB0A`NXb`x z5wy^b+TGdRB@+=9O&aIFF`}1tAQ%)B)Y{P@z5ZP0=;Mxg?5}z+-SO$YmG4-ZnwqnV zUtZe>mBC$OLkGyq%d>xdM_3p~>M4PGz0&LU>qOMTbSPrj^reHxf1V2T?kbt=e7j7+ zWujFr>b)gVURg;x<+mxC`&j7F7@Z!Vq(&ydR_rL^z{A-~xsMHNoH#z!)vgs@U%cx1xvL%nW!lS^S5O1JLZ+|-q@<;v3`vQlbc$b`hB=IunnOR2 z{u^=mMl@VLwWzPwL({^-LKhd8;IJ?Z*isRceAaJamkGPfNJQN(l~+~OP3!#frMFkH zLS(ZUtE4D4rG00j+#CbW(#-O5Bsqrx9WO6wm37~J7ngF2bWy+kmWc@}6B84_A6g=H zp6hrL)W_%&Jh-1jFfIYoj28KLy7qHA=%PgUN})>2PGsVP@bDpv9MKHM!xSk%Sd+>F&^FCz&=&W0dJx9iy#eSQ7efh;Lh@aK5i`J%F>`}gmM z%FgfNTR1wFxH*!eI`>X@0=`^u*#644h>VHR^fmcl|AW3}WweYoG&B@21e8wB8EAxZ z1_p05=xdQmGWjWsUz)oNjuol}?z|%K%=a0U&}H|fuabb0x#1}jPz#s0bnyEhy09Bm z;~00+oC~m+o=s^(+3k#%#cg_yy<0}AUot~d;+Wx8&K=u9Su$-Unsy=!8 zl%ACp4-lu~7gz~(xHOB-w<~^zIy&S~Z(ctAaWxO-G{tX=o3UIb4a_?J!H0pbFWv~= zQFeQg2Y(|8PZVao+^i5EJ7huNMC;o5LDL6d_0;BD29yd)jlwG=BqXeS7jIHh%wZw* z8hr&UEG=jM{CUqjtavYnhm8&YTc)_K{g>4E)zPxDJxX~o{GI5lY+JJtwAl)YOu2W( zRmTxAX2vnD^H4Xs#FW@GkfT7xZun7YU2I|03`U~);X+Me*EvjNn%dfO zSsVX=52vxS!t%2je1ByLoE`W$*O?YH7$mDK5FGAu{ZB(s^W5{#=|U@Z$2Iiy^V*ZA zWH2>3{iDikmPYTY4vy@Or(Ru1`KS*!enTIyoy$G7A1RJX zOQU9FWNaB6R3FTMJ(QEfSkg!vxHl+wIDK)R?>zb-U%cHWmVf#0=oREsQ3G&RH(|Yx*85Lo$Wy=VvG3PTxxmg^&>v 
zkc@?^^;^BP1WDiD>0Vp&@#4tVfg?D0e135_Pb3m}dJQ(BR-GvhU0{qbG}g80=H>zX zH-Ocmpw(NphGGc=A2LVqz?I*5iW(p=z|ZI*X)*wYy6l&NyJD%@zkVfv^4f8U*8i;@ z7izN3!)WHCCSYPZ<=bLN3@KL=;WJPkxQQk zdTr0iXQs@90A zs;Zp5Ju9l!w!GUl{#2l)rA5%HY0%k+amGZi=w-zuRx}i_J%!aO zupfH2u_V_k7^{&B4u!RaMJR01d8odh zytlJ^eQ(`i$SVZslClqR9nL?cUl?&F$;LZVU2R%?Dev?XHWxSD{|sr%$-z z&9F9Cpi}ZjG4QqNC1c{FMasT60&IV`6@$ylWXcZ$^CVRt>F41;D1D@qkz<$??llNgIXt89>A z#D8XUtb*aL=NgX0sh}gw8Ois&I7vxK)yhmnPd9@uq=17Hd^GmfqZoP{0dy!C`1{;& z6p_O@?Y~RtyT2A?(&(F1z!mKPLpKgCZtH8)z$kc(mJ8hpV~u`7Oe$%SWVcliWC1&) zwJ%i&nFgV=Ug0pPZfOh0cl|TW0{H0?Ou6#%@-2Ww)QfaDU;=C!u7zyC56JsB90)Sz=8!r4+uzk9v8CgA+&w=mEt^jyHk%|ls&d7h|0 z?asU8X9}7`G$Ji9wWB1|w|d-P*Vo^Zjibhupnl(EJ4g>4fdxG9t=-*r_*)f^S9SdN zf7&RHhTpn*f07s-d04RU%Pm;@@TqAhq(*;oxp|pdI2gKcp=f)a zBl3{oM$sZi=VWAMEdVY7C&vNHTDUu}iM#T+R6d)2vMIn22M323xCu*+ zKiO=)FzN2@Rx8#W&^m_kmi1(^#u?ZasQXeOpGAFka!?XTp~8~vPFFNdhf>lyJgjw1 z!2V^nve=EXIyqb0f}wp_m$qk=e3(Ge0)wbw`?E3^?xl2JFJCp2eEg#$8;riVmoHzw zZ)W!P`HL4CGn?ufSbx*$aP9*yIpomn4Nno@(!836X1Y z@$#Y&JDkC|$;+!@*9apnZfR+0C=8nxtiKWND-4^E6nQ8>E4Oxa$!=|LlfZaW=1K|=AeKv1SOhd<9@wE&QA9P^b0wN@( zwX$Gj#Q_*SqNfU38+NH-M;TonY6m#Dv|>TtpldS%5SC^#OZ- zG;&B$9pb?yC5{y}uN8BlMqPtbjSIEWF~Y`UjCQ>9e3)}Te?RG?s-}j<%+gYxH&{qX$?)ekXeg~qw--vCf$K_xWk zL%vi}%&22zL2-wcFP%6ReW>v^GW0Ii@AeC z(S9){O3%Om$R3Sc7?b|w_9_d&yz#$$jp~sg+}5JyfEWo$0*U?iJVJT~hNN-WaszqF zRH8DV$sBheT9^C-gyk&KEt`WiMs*bK0EG|@>?=BP1miJi4KGeI$;L7 zIBaMM*kfCLLepk2bVE7+{@_$vI>)qO>EGobd%ewxw$5kQ`ojcNY?%mkxP^+Dl>hG% zU3N6RsBz6I8Hsw~KNasi&PWNy8$m1@(V<6Ya`7F1M@zmt8o_t|Q~L@U9;jXdJ?E1j z#qwnBGWz-;gKJ~GSLeDnc5GyU(!Wn&-7GE%ng5KYsyZ{(*oM#VWA3?`@#%bfer_K= z#{Hi{$O>CEBS6TRP2@6~U zz6azJeh1d(veG#=vc_q^iQxehh0+&VR>pM>3e5e{prf5zAPA@fVGqkb7b`T?0^&k1 zvjMCnMna85Occq4g@s-+3CT*zAh`{+8DJN| zzP9$Oo&x6BHYk693Jkgu$Vf;iQ9?pyU&t3fav1*mu!NK*4CX?pW(e&E^e!5z*tnh? 
zc19Oe0Un!v>ZHFyPLq)^I?MyC0xtFv%G=xf<-=~+4NvC>8O#>s7e6L2_`s^l$3LqS z2418s_rYs!uMH!aR6r*%*vAzVFn^e!7V##ALoNw40Q6bZrAwC(iUU}!r@*$1JM!}J zC8VSjdS|?NfsO(a4gT$nGi*{;_{b6e|2ULKH3QiVRlL4_F^)7eEwNM<_wf1Y=^MFw z=h%S@0|Cy(%}vAJ%gwC~Ak_~i_suC$YVkm7s8*lhfw~-Q7%OFnAj2}S?DjSKl~%aq z?0Rp90@ucPfGvM1d=5L8)Y*`xLcAI|%4@3YY<8J>xw&?CUf{7_cpS;ap@J?r&L>I? zH`wFY2O=YT)6~grZrudM5Xc{3BuRkZf{rKo=n?xXPGbWzS3!6dn3pcGW#s4NwDk26 z0wMGSDLPWh_>##|J#_p5!rny1Lu7{&(O$ zvw3Y^cBV8oiYh59lhD$Z4b#xlA}a2OiQ!^>vZbXZMX76zjg3$cBY@1+)6*+>WNBxI z3$%BVr@Q-ZwzytSKE}w1Jw@TKrssdZ+>1R<cpMy^{K$0T#npU zTH4nfzAii*3*=Q|N=gL2Vi13O27rj3nOS~a5a^(GpxEKw%`E6uG<;6>9pO4O9nE!E zS4YrH1F)#YOZD&j?cpqsUriRk$H5tJVuyXRvSN`jxFBYIgkN2191?V1SZ+#3ny}wv zHFt17H^9o~HD}z~Bi!@zdh+)=NpIb4N>1%_tzULhqTnf74i~7~4rXH+e6SC{%BDjn zAfV0T_YN3vBV*$Vs~%EROO8TfIdp1&n9-AgUf!6j4f`g3K@IKlhm#q6wYld(sr9t* z(izikQCTnvLozBVQog>pq>~FJa5krA^0ud0*vf>S*I;F(Wqo4KUtGu;y~YVGxABQC zaYtK0!5jPnenH$WQ;FDhaaJ6>k^njvafAEIv<6Q!DX^X5@RGPQU=ro6Ot z9SN~o0~hMoq<7b|?np+a=+4&-IEfcjWDMk*R@Bcv3S$Jneft(Yf(KfnMs5jwA~NyE zy}RFPxxZ^dq&qMc1a-rh#VM<^?OFHRg$301wjd7C>zV!=i}dU~>dh4jjKQ@&gGBiF zeIwr&%&nPdYH|?%51?zdY4cN*QnXPs`?bfe)&s*=Z4(maD#ykqSEBWy{E(1n3x}d| z@}gyuPPf-mjx!g5R1ykP8j+f}gl6yU6IH{vx6>N{>vVkB_w^-yF1i!dqk$X^$~fxU z_zcm;zc-@6h+*7o`u6VzA-g{P`Ik1tj8ULuWp%~>Ow*30^OueNd$+-)1og>j=`%Ze z3W`N~rSr0w2P^&T>OU=A^BjEetCO!)a4+Y#2?3~o+rbL@W8t61nh?B8*qB>QZvDg(t?xP#-^1 z+skA9yK|d|d*>H1grXuHg^&4biLOIMPtq>ZF<%+V1=dpvX}Lhsyn{c&Ds2YE8Q>!} z5v|x0s2L!DMc#Vws-?I0J;6IB%a>^cM$Md4+cTL#9ieOE0(7@zrW00V;ap{!_fDI9 zV2z>U6}!vP-=8T?1Z;&dO$KAX#e&`vsLI^N5dadl5NEZ)Q$b@-xF||iiOqJW3cK9vWz_MZdm{E zKB|H&$?I-FN{!ujY|vsPfq;>Hb`1??Lt~o$@`C#Kl&UJdwA#A&%|zFse)7`uQf{5z zdH$SEY;GR^;s};@xcDbcd&H`clkrmC|F#XnAdGlv5Mu#Yn}~>j;=TfHanwM`N(2)v zGDefL<^1T<;ikB&j)d}XDIvcj9={#>a9O6IOV0(z>dnV<0vf;1FRrt+e~Q17aPzyJ zt02h1YZEm@P?|bnow$KQ!oUx!7&imxCLJA1A$d-?XM-m`4$W#LF_In)LNj-@~CiFM_XxD|v2MQ8`vzr{c`#A&FI$K9yBOR=$`m8Xf zIZP#{Dl_mH7jz9#a34g2!fpmvGX};MpvdBbgHg|}3*hbV@7EDzt>xxp7}wi-(pH^f 
z8H|?B>00fu_(Vo3Di8-#aPi-(N_ze_)j|8c?j`CQXmWCtl~rWV6X$W<-PdX5G~o%r z;0Y8;NMd55Mtx!;83=@ho~giA-vmJLUrK#W8eqvb##o)wPF||zs*V+iUb(ohN^kow6>rRi+R8*BJyH( z;~eYlu>DE)p`i2-)*8kNxP4-f_eL_Y)6n(k@aFR8Y z4pn9nC8KSWcF4SD;}}$7V}6tCBkK0;#h~4bwHcJmO{UAvbvT-uXJ02@z0O+5OT4W* z2Xe<}0Q|G7t1v<2pg_rI*6GvZvntRteTpb!FVI5Gtp8ctYzrb|+U z#}Ps!>f2(Jsa=J}>}U!d$fnip+Y>a9DkTlxSlhIxrMrK7DqzoezPcWJkxAW!7p$pX z&n^6)yPwEpxqB#ErNmX@5A$d__>_RsC-B=}Yi;n^E%(|qL9i(>TgfnXFe$%z0`l|A zhkD}_#HeT2vV5`@m%8|@r7=^Ks96seqIRTAY!^8isztFrrW?=7=uG`ybj0R&Tx9a| z^Gkm7hF(m}q)=2$jHbW8-@fK(@4G4wkco(pgF>_fkS-8j>u@1a)yyK>H#QEeZR{M{ z5fN`vQ(ymSH?XVWQjPu-^Hs@pXz_IPsc69apXVhdA+oVSVZ=D5HFbP{kih>i$?+9g!C z6|eMvKo@K)R;=X0LT^ibN#g3=FX~Z?jW&8y^lKv=eWf)onPbU%ii1F18` zdKKsZ>7##Aot>S5`Vpc9$IXg;$J zT^)__`d0quhkFc{&&`nn61Cb&CrhU69hv-2eSd!u;LV>v8G+f%j~EjT{3dP4nFf_E zS2F}`a>@L5q#IL>G0^)~c-iT*Equ-l0%mVr+~F+sIC(AKQKiet`GEwd|FSProEBIcpdsV{$%D2#0N0C9k>eMg3LGf} zkTEw9LW)xHTqZg;K*riT4=YILM7_K+a~|NDY6^R_XKK+gTO`u_6I`HI=}$%hxZCSFL*HL7_VbpHC4@c>2#r^^Cv&%+canh zSAx#|QXTIHq<+8pn(wRf)z6K7E#n_rx?O(9CeY}iz}@}(CgM=K%N*>gOD7OpBUmrx|}a#n&K^2F4fgz}0cDnnG0qi#W5+?R2R zs^AklM<;#JTl8WBfxvglb)P4-0vVamzvrQWs$X+*6lK$Myf@o77S;U;o`Azp4lZ2W z6DSmgH^g2fB!qw_h)C0Q1YwbQTgL(}yG$_Kk*)S^kt>q0~lo=43NOXllUpk+gI!Y@tVAlX(zp9wG-J;5Z{A zBl_Xs;2`26hB6)sHi1991lf38EDE)##Ea8q_3Z=g#yUM)AKxW%^PM1vQEYbhYFhCG zK^`H>n%k-!xT5=;-yEx|FkW#{*qAQhs?zgX-{tC$qrMXgE*eB`e*9-R1O`4>1J{dl zm~U+?q4Zqivwj9^`yMKpykg~js~pT4XEq9RpJsi|=p=4Nc92w6tf4d`X&b%)mMvL-7ZXd;3j! 
z8ueqtf(wtig_nlGiyR$k=|>??Svi-O=IIinY&w_vwVN(`cHo$G;=Pq6Y=l0OLk5p( z2UucKGFo-9sHm1CwwAxEy)t_DLzhmT%cH!!(0&x%erqY`$8T@-p1I?__IKko=|wd6 zMDx1G57N*tzKOd}*#AHeJVaamWf#%^m1{`z%tKZ-1btNF@iguJwt$x4H; z-`+9_II*7rj=iCpAtI@x^Q!kQG=`r)f7V?NFZhZRs^_uD)iF26Khb2Zj7+Kp+C?*~ ztvMR&ovK<>uy%RP7uaH_YW~eHiwr6BnrW6N^_|Uu+NXq-1F#+j9H2>qHvo?7;PWH{ zPz1za8%&RY!v>4>`Nmw2g?KG^Q@n5Jo!?(O+Rd&h(ZKTFRh}uS3AXO*aA>>Ek9x23 zBVbbc>Q(o|*#yOqaQqOiCgN{tXmb?m-}7VE1qF{|<0A`-;e;827aPPM5+HMcod&}e zCUAa|^71$tVgb>xQ)Z#$v;zrH3iYA-J`>rur)MW+JM&$HbQ~qi>qXia{{9{J;T8>F z^D&Sn2`n+S)8owjtSm8fpSUi7F6e}5@L|XlIM?I1-{ZsKv+nsGY{bGhv5aF%qEHA) z1T9Y{S;uF+5B66<`!Rd?5DNxO#I|?cvBv$k3RvY3nW5uz-VRIvmxzKH?#=PFBw%Z&K6&TpJ(o| z1^d^?UK9NVrlCn9@da|Q@=Mqj2p-yF7>i z{wS`&bFcOBaG?AVI<%>&Nw2~J3v>#X)e#QiyLZVy8G{0B{WUoR%GJx|Pf*ktBl&Li zehW2*k-8e@%D#^X;xLW9&XP&u?mFl=DXryJ*RPyY8$%HiFV-8-WEtT-%}bvht(gCh z(9_tROzxPPqT%7;=|xLUK^$|p#xE)#ejz3%4(74!LZLuGivehYSYiQS#*I4yU&DP7ba zwn!0-g{P1JLmFr}i1T>60dSMB?;bO#0GGg5AmX=AfLJvFIL0(?0-J~g4ZvllT@6_c z#NiI|4XaB%Vn`hvBmsH96SM++QCYx~yt`lLQ~$%`zB02HITF0}^P|Yn!yqdwggk8x z$0s#vU>0+l9$Aa~LPLXoUGU1xI&i852`H|zP%e3)m*TfgO%WxgX=uOj<2iZVSLGba z6oRb-iiqbJ5~+f7&z<4XspNP51gBXrny4C% zc*P0YJ9kJ${PnQBHpgfC)9pX`jb0|A8Kb|QzlC2{TwJMMv+-cKfFCj6*AGMiMRgd{)b4mQ^3MUM=FMaY*2%Qd0 zoaw;DEj3D@6K&k8vRGO|ec=w2b;re$;!T)2 zqmCzA02?k8y+{5Ve_`;z244I@6-;$^@!qu~c2 zJ}o_6dn7(CP8JRj3PVb2C7B))TPRbNz_;Fyv%9WjjQxpwKe- zZjK-tj2ux>SY-|t=s@Rj7%qvu5lm_s(x@_z?TRboTDJ(YH&r;%G7P$8yu`#hnRvTp zAZxB%7KMY4;k!5B0K_UbGD?8OeX!K{9yt2sS5H2cmj}nk6M=4a_519X|CzHM27sr{ zsNPe#&=K)K{rz*b>1^NdQ*EuCs4VN96s0u9qnc^p%}#w>qx~L>h$i7z)J&nX>T*ta zM|FEI^9rd$2iO**$Hkp<7Z>05WRRAA`2hCo(eCfTy2lRb>*D|CsR@`myjUtBo$)Df zS)jDW6~s*%P;ocN@GGYSzbMZfX&2H5ejl$F8YrTe`D5_Wl{CTi`(r2ize{}>{b?jY zp6+Cuj$MADq$DgrHZ3hKhF{t#O!hGQ-^@McZC-(4w{Th-{XQPf;geC{!%h=Ty*GTT zSvI!AqS(v%t)rodu!{7p{MAY6_kl-PhsO@vHtz1O=){Cv7fkf;)jSN+lv8-IBqb#e zp^G3AemXS+q7`t7aN_X$$15R#VkBwdDCN%H47m@O!&^7_IAxFfZ#wiw;j0qXCLG=lh z&c4ed1qQpvlz1!Z8ZU$&?u1~>S<%!U1ZoG~0Ae~^Z*xi_;&SjCD1niR%A>V*;NaJ* 
z^I(~qn**Jl&mTfDw(v(GtIbeO5Z6rL`H_uC&^a|UWuyT>Gc#VZq{O(W0jhjf<&*yqXk!f&?+9KS-kXWSK@PDk>pgx(}u0Vmim*LIkk?JY_S`$F&`1 zra3>q?EU)&O(DXz~*Ym|@lRgP`enpP$}A0x+MngCim$R4mvW zQU%ed1S7>K#!x4Kn(hJ<-wNv=9v;5pc93I3Nhx8K0|Ak{m>r#kre%Qv71vfriEO`P zA6}d^-Dl;f*Nci=@JLEUGI1+Ix1e_E4kA`F=sygstcvS`;3ky@9~v=WSYT3GT3gWo z(f-SW3H9`I0aOC(M)dEURQCtD8uAaex>ynVl6+yaIix4CkB+vf$zEG<%3F&2@F2i= zPe$gm*bmV4J(E6)Ki>8luyd7NR8@%+{&m(BJLhpwI~u?ELcSxWaS0fMz~aPx%0rT1|I-8)__v$d2tKUZXt>%h&$EN zQgiMQ(xr+GjwXeL*2z5Y$Y9g+g*5v9lKWtPG1E;_veu+zTg1goaiWD(SM8y5h(>*P zV`T4_mvVKrklde-53ZvuC@Jpni~qZN`?BHJgP%_#BZt9U0hD@2y!bireVPbS1i1>t z_*yQU3P!ciu&}G&{>!}Z6me#Q^k$J5LSV1Y2KqFdVoUEi%=; zYv;X#g9sQoU$N_>qYz#U40BNsYs1mZQ)*4W=e2e8I}-_5-a7uZck3qFH4(iAPD<2L z|J8_3WR%yJn0kxeo)62xg-`epAtqJ`{(%4N7D8Er*0{p<5^w#;9RPSow$iV^e}2`$ zZA=AFa947?KY>4E>$g=~Sy%q5_# zAXeL^_5w9fY@*ReO0o9WNb)n=1#VlUn>4LJ$3JV{|LfC4S{C{)8<+@yp-i$T(Bl{qP9D$!?@t2 zhp3jCd&!*y*&GcPutu0eLa@3gzBf*qUJ@D<2^AGS>|kz+PkcglvaDFIIQs&c-1GI` zk|2x6dO2W;sqv}}Bt0Oi)(%G9fovK4fN=Gjpaa)?VZ=~iT%6@M03%~I%xre*-7;Y) zzO8;l-~4t&P0T8BHnCX;MvJ}kI&&x1j7GnZ2%^qRzXS5-1qNQ}ugY3R$GysM@F4s1 z<0DuP7;fH_RFCTAdd9Tg+mG$JP8w5rI-2;w9t#s2Jq#OdWaKz1zE>!aPvH&g>L{Lj zq9;!1j($}N-(L#+guLWbdCg@tvv`^;T_#BU+TN)`|W7}EF`75MMZ0-a#x0OE8MN+gq=zn(T>@e_3@S4g7m%G z;NgFEjpzP4FB@ACZ|p

d_7*2>qXO)q5X%DR0Q)4ebQi-R}&>+5*hiF25l@RuX$zmJKxU0O+++dK}!@eb4paJy!^nUCZXxtxnYR1b#yXM;$X3yg?J zh_@UNJ+Pc$zz>DE#)s81(`Fig(NB|-u7V4L8=U-BU^Vas(*X{+Gl(ID)(S!(8j4Er zk(z3K`(K|C(=`fWTUynQ0PO&w zi$STvfao65M8KF2L7GcB8g@~~Iqa}1lkwuwSl3a9Cm1R!$f8uo*D8F&yzyrsD-3** zOz;#7i~)&r4!_ra0Pg4#&h~*fP|?wXpQoi6Wv^FNRz3ms3LgY&nNqey+_t8G(3wB1 zICCXpopSGFLtTzNqAokTM1QB%;+I6RV#WcoC$y-jh!|W_ zwyG*B5GXzpu#zFpp^f-_pNh6NaO^uK#Viob(kuDU4G&<}g zVuNbiEL*?rxo|Zw?`A=oxeX-ctLqwtT1a{mB>`S&-EmdPfcGm7dDWY(ZeNvq`2#k) zziRa>2syu6cERpbo09uNCbgou#I(fpxVEtTe0V|NT}i{s*D7UqsQ9c2Adnm5H61_! z`JIsb{Co?24-bAO)r@D5x;C3_3$G(+U+(CLl#&TN6R7DMH%MEyJoad5yYHMul4KA= zE@70`^o}{Lif?PwGMUJN1> z5`n3#s)83T5P+Y*vkvkC$>KpxLp4u*9Di0~!MZ7a0S&JLg5{6K$|ZSTViGs|h`28i zAYmpz9x^9LeiqXC9%x4(b|SejrS!X3k#JfyXjA4;r?3P1Q0|&NYvWkma=wrR@;)KY z-U+RZs_jt&LiwKC0uIxA_5ScrC50#^^WZwtkFXR##|OTxgw z$!~M2r8fyO?8h;&@`iJBZsIdZUSNI%`>}5QBbaSb!JyeO+`TZKM}r-ToD}c}l-JaJ z1_qZ91!2#y-nu{I3lQHxfiwAK1H`an5I+jo8$Y?uV>dK5qM>O0x6txb(xagfG2d!| zv(pBFDL@a})jjieuuFP*0s;cety|oS_=K)z(lJkaydit9?$bWWXyG&@o-X(4|H#L` zbJ=I-Hb-|k^L0v%!QWc1nd=kvS;0u6=cOjus;YK~tcQUDfgCC+L<@lY z8-S~9AjK3vzcQ`L<)k4aBZJSSIQCnia@X93X&>xJ=aY2;&ZGAiiQE$-YZWd$Owtq> zNingoAZURDvaY;}iYy=y^(gmEbX11;rKPWEBPCxP`FPMmLxW{vP=ZnQU;^*4=0A^v11T%u~eM4zpIMRf?pw` zw)PIn^{^WPC*=>nkOL)o&-pIr$m)g@YwkQM=t*UtvhoU9_D>W-+(pp(kxsH>lc^^lcuOPCuM2$X#dcLKbXAosTqs5Rz4D<2~9CGfIxyUt02^^(fD>4*uW7c>eAisa;% zD>DSKJVJIGtr)JaWKm!sl#Ly77Lm>|{HlDM|9zR$=+j%zk1rcw;*10ye1(@F49@V@ zh@th^hcD3N<_-;rh-S9T%?_MeS|XZB6D}j^E#&PGNIdoI_%T8+A@(PTvLKAU86XYC z)rcog5N}2S1k#XnG!!AoWNx8>_r9ch3JMSMx*()Bg4=<0>yU|w31UK5peL4tabCs` zm|t}W^TTWpJs2MbJDvIf@DlB>{lowYAHi7wyJX>~T*2N9y@0vvoC+p{z7jpOg@s7* zOW5dwg1&?ik-aGQ#K0Ag`_JJO1N2;V?vR1>8#M8;w8rkXVHDsa<95#jCj{RhNs=5G z*NHJD-#w;+_m4oOcWBszw;CWRKh|}h_)&NxM{ImE68$u3(91o8;(px`!aNd?qgE?i z2Wkgdf$P_nW6P6M`FH1JHUtKBbS%Iq-xULZ&pj~>HWIAW>}-2PcgJaWb5|Pco#g_XKumj?(MGZ_#*u*%eFNR( z@?`|N$dh%wNnHRS`@!kg_2$zZd~i4AcpibCQW11bfpMBuNtb#K`%(0yCHk@O)v7 z%Lb#hg(71g2_s|3f&w>1UGW0w=`GEQYZX-TN7Ej!jgcTJUr3=ACnw3!Cop%VzDZ7= 
zL0&5ceCvbi3t(U&Kp;`E`N3gy4&omWl-MPg5IS#y7Ym^8xXY8e!JFHS6;)nr=+*}l%&%hzHJr^5k$4gU3w&E;R99bRn4Pco4VU`_0y!$F5} zTnWE6Gg8oW0*r@?ts?i=-f8V(|aH1mWn#tq0|holV*YO|3QWN|g`Lb}zjrb|TNRjE^@| zA!#Oj?;e8fyL)?w9N5PZ6(}G=ZDV2cJE(Ly`T0m-{{O1(+~cWE*Eaqm>A*Ne=pZSl zrI2cr4yuJhC0e8=XDS(rYLszGltU#&Oi9jR5=uoyP76s*R-)08L(~u{rCo@9-D>u` z_h-+%f4%>_{;RYOzxDi{=f1D|y1omBN6o#r@y4?&lOp&Wg?TpTh8F&I4pZlB9rcI( zK1iE44seUf-arIXgQg-20;bc8!Wkb&k+l=2t z{hK?G&%aZV7c1K%-m4QmQd?bJg3uVMj{JDaIOV}owV5| ztH}fm&mQ3?3cP)|%xBV((2O$Hwe}tqvsJj|C`|0UW5*f^A>hx1G1peFyR81-(05zakIW17y!aX1H80jKz5YY)#a7+IyySi zX$Hbj(xST?GdqhKdR{~>4U>^H-}<=g*&AFk0yohXk0SQzbvId*7y_#$w0%D88iq!_B`^*@fTiWL*CY{e$*!S7K+qrfvqC7<*YYaFJu3u_@;jp+! zd*op@O2$J~)d{FE%5Y=1_4P%f>Zf{m$Bs1p{Rkn!xDW#9Ng`TT8j`>pB6Dre=b@qU zCr@Nd&(0HId_Q-_QUV&M0bbt+cQ zzNo6YC(f1{R-p?Q3qlrHs=YWSDfvO8v)UAm7}cY^OYxV(>(wvoFaG7SiENHrw(L$& zsAxg~JNd2sU4m$733r4S&HI?7eekV4jkBqGfaZ);q$Gm0adSIx%9yZsHeB9%1a}S{ zQLg$h(*ZB|*vHqvz*(+FNjJthIcwq0hxRC-3y`a?tg7QWTdJ$Se41~3N9++#XL>?H z)!vSE-1(b6tjM!Cl-jql)7g?Eci>CrJ!i|NgpA3LR(qa}jut|xO(zu8X{hr@Zipw% zMLmsXb$9FqL^!$*p@rS(G+RljoYPQfJO$~zvg)Wg1QbDm?sn&brpm9ACmsx}UH@)Q zX@RGds5~#_>5#g(sEcD-f5oQ3=rfj4dLaXsRL)p-IVQ7kIk2uOq5bFn_`43Nw-l$w z0}{Lisi0j$d$Fk)vamDo!?Kc7QY5ELIf8nh9Q5?Wg4t1O#4>DNcLG-Kx{GYQ;s0(*)E zruu&w*h1nIreSetcqjti%a)R~JP4Hw1xtgsoba#nyf%BPX7%^?m*M!>JJ4;(ebMaQ zVu($j{(zxtjGoGdADdaLy{>-Bep_-F-Jgq>wNe&C(wnNXH#*z}9{eRZ{n~I#6a5hF z{ow;M^@%Nw(yAUs-xwnq76MJi-}btNcWb`WhCM#X2em+I&CKB=;9KB=0;;h zPfyRLG!q$|NCoSS&R095XD!@$@8DzCWJgC2*7q;d%esbF?!@5Z)64UF-Xe0(+EEi8 z8d`!*z#PKd{_gro^r@|T_`9jW_^mg^K6Pufe)3#(=Gr7=M{I5j!WfRZe`F4WH^v2F zqh3?vzMBHo8>miJO9(ATA{KqfLM$*(%&2DQ?O*5G3=LKK;LIEp(Z~u~Hf@0|84}I) z`=T*d#x6SVCi__6GVcnYH}vjd?B7;lt|J;)71n?Dod?xPj7E3V` zp-!3f=H=xDrKF@Vs{n)v=B*?zZI9FK+qXr|rJe~IAcs9#S} zF(;ZoH;S35HxWjMS#fdoJntn2l_7N0uA|U>y7lb*lIkeo*kR_~N-M;Jqf@_sN$f|y@+u{zYqz@6nuo!XgpOk^fDJXbz$PexRa2ySmZW4S<``Es zp_5Sx`NfNuD*hVkX8wVn_<^VG%mMfmV_=oDOnRM`o?eET8Y*BW@xz1Ec;9m$gRto( z;o>PDj}8r8RK`yYF3fa3$eyC4voca4tlY4F+S047zg!hP1!E4=in+doP*TY;Uu)xk 
zDKSIgk&#-rOUO7dw)T|E5g0#iIwEozn#Q%vJL6LcPp1px$#?0Qq53VsT-AzdB ziK6|V=j6eXr;D__{(Jd(>uiHm_iqD1y!~~*qI`A$c>?E)Kik+)N@%QA%g+xkEG#T8pPlR# zUKke6zE~Lc54@`EYd3FFu!6>@uo0K>`7@|baFB^uuR^W>1Xb)E%lh*2XYaWPRyF#! zxtQ_e6Wx2@z!UF-2Aqcrbj|%g4{eqZDte`Y1(fd8Fjk6~S zE!Yf?OUh%;fM`Ec0~fr7ev8J7gAX^*JHCW>d_w0iWssIFn-1oyk^J4+ju)k(lI%T{ zO0b64jHWkbZ(F<{$l2=UIJY`u&1L@=Ccp@=MuhtzS}O#p)nM4wp{3e> z*T3la995;{{)~b{U0{dE>FrnB7{BB<>g^NsyC`mI3b|8FLa34*`I3YJ^Qfv*n0( z2idt&R6b9xi~H{#`)d%ovE2+)RChNk*prBP}M zt^nBX?l18|!y;s~EQZhpz>oxEr(iX$2Vkt|XK!q8nawHypuyK@;!Z8n-GIAI1L%Uk z;sWC1MH#C5F}2EbI%|>!WHj5t;&kcy#!NHxaB#5@W5eXxC6v^Hiq99-OT^68>Wn>m zRu~^KqH(eXV*Ad#$<@k_^vfcTrcT8j=X~x~B(os0wRUu**1zfK2!@K5)vThaxv_T; zed_K;yFal3w%|TV8Ertc04Nv@PWCp-7KaQqW80cN(BQCjP#RNY`>{e`QF3=J)RK4i zw3cRL->FTq5BQK=r(T#KJI(>S|>pRD!CQ$kjZ5{F3C< zsa7frwglgeNPjBZ^v#7P?-*br#J+GQZftwV5M0pY_U&5=YNlXE8v79r#I{R6Q3Cda z62Xr%V;vuJn0BWBApZ=^JpCMH=xPXaE5IE8F!QXrdiTKGiGmnz5&|4!>l8S)LC-zu zAGBD|aNrg7JGR#Vmf@M@8rkE*lD&suJs1R%;|bUhi*2gV?IB*#5@l_ogi^JhNV93f#ycC;(VZ;NqzRyfPWp#v^ucrD5|Z;fIJA{MdAP z=W4)4!R!K4N@%r&T_g(VGBnrHuOWN08Aa?-T^hBMBQe%A{vj@w#^ghyOLgDX%EuI9 z*jmEnj)&MHx6*eB8JYS{)to@WV2-Ay7^>+l`Igz+WU%?uEXv8bvKO~BynO~hXc0{t z9Yxo&xhV+Sh%y0!;?=5Bjwqf}`BOezGv~`~!9Eb7c6K}Q7Aat}$My;ka=KI!0X)n6Es1qsP z5g{Qh9ZaJq!d?QjBi#%89F$UmP{%a9a*GzFvPxSk24txRa%>OG9()EcxHee3HU;Z< zP%LeG#^y_6SQp61WbQIGHZCR0Hg>cXMppjIf%gNI*Z09x_!1X%HjgU?8|1wCgapji}n=yDu!~kPZ zq$yCQ;UXHSs-W>AZ;|vX2N9N1ZHwKe;*^`9udlzt$h|;t+_*fyp`Ym64+w95{7DX? 
z>5yarq_w2t0EaBCG9ap`oy86=jEbXS-v=3yeVa954|1^Ot$eA{tCPj&r0-)}ZNf#C zU^13N0Zi+ARKthkDFmSD$@oGI@?MbcM*QnRvHKa)13stkIhTR!&O#SD2`A7R>@mTR zNxO7+jkB^20Agnn97fVe+6uu2R@&TbLu@@*vp>wdQEJf`%LGHJRc|mhGn0ioVjkyL zs|_eXBnb@NhFX45C3Va{A+T!IgUtHs)7ZCzjIPZhu9w%xa%03&H zStuW1Z8E<-3QHw?>x%Hq)#1xbc0lH#xgo|nY@C4TbB;hlvIos&or#IX?Hp9#bOaK+ z3d{i9F(Jo~AD0?=iL)s*E;e+3eQo{>nDSTN#z2z*WCSG7R)Ntv^3nNi-=0X9F$C6TE}H z?5th_NEPZ*iVV64M_gtm5O80$CV=`+_VoNn+$j7Tj80hjiC+)rUm!Kix(+8(!7`wY=|=M z0i$1ZnT!>-u1;9OU+7wjqi57%P-r8V8l*6**f+po_J-fWoWrX>+#=P+uMWij^;qZ zMJGXNNuaSMcF)$+kntx@z%4X3oYA3K*|K;(4*4!8g|Vlz zk{_RH(}xFtfk}%+IviIpKBYa^$5V*?`4lCUk+Z~MGvF3&FCOkU1>xKgzXX=@bZ`fb zVFge@NBtD`_~>*E1=zyS6(6N!8@|heG!JqFY88JHBqP89UvwL6q&5*Lrti@q*A=$z zU5HPkOttI&GDR}Vfj-Rnbm42!UBa+n2%<5pVMJbw*AGxY5orjsSnwll2D{ s>{y-qx1z(?@BKgcR<8flO-3hJ`-@C{F-=Vg-+RUw8*VhXvc^8>pAVFp_W%F@ literal 0 HcmV?d00001 From e80e5a05f6e532c763ec80110bcd8e2d7a7cb063 Mon Sep 17 00:00:00 2001 From: Mahdi Date: Mon, 15 Apr 2024 00:12:31 -0400 Subject: [PATCH 20/29] add plot notebooks --- .../fedpft/docs/viz_and_plot_results.ipynb | 88 ++++++------------- 1 file changed, 25 insertions(+), 63 deletions(-) diff --git a/baselines/fedpft/docs/viz_and_plot_results.ipynb b/baselines/fedpft/docs/viz_and_plot_results.ipynb index 866ffb5d8c7..68077f7b59c 100644 --- a/baselines/fedpft/docs/viz_and_plot_results.ipynb +++ b/baselines/fedpft/docs/viz_and_plot_results.ipynb @@ -2,22 +2,10 @@ "cells": [ { "cell_type": "code", - "execution_count": 2, + "execution_count": 16, "id": "5e0cf2a9-b782-48de-ac45-128726a26e64", "metadata": {}, - "outputs": [ - { - "ename": "ModuleNotFoundError", - "evalue": "No module named 'matplotlib'", - "output_type": "error", - "traceback": [ - "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[1;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", - "Cell \u001b[1;32mIn[2], line 7\u001b[0m\n\u001b[0;32m 4\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m 
\u001b[38;5;21;01mos\u001b[39;00m\n\u001b[0;32m 6\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mnumpy\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mnp\u001b[39;00m\n\u001b[1;32m----> 7\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mmatplotlib\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mpyplot\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mplt\u001b[39;00m\n", - "\u001b[1;31mModuleNotFoundError\u001b[0m: No module named 'matplotlib'" - ] - } - ], + "outputs": [], "source": [ "import pickle\n", "import yaml\n", @@ -30,7 +18,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 17, "id": "7ea3e149-ce6f-4ba0-aa41-e0501a04efe3", "metadata": {}, "outputs": [], @@ -52,7 +40,7 @@ }, { "cell_type": "code", - "execution_count": 32, + "execution_count": 18, "id": "4b010856-0d99-4d81-8fb0-7a927f10eeaf", "metadata": {}, "outputs": [], @@ -61,13 +49,13 @@ "path_fedpft_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n", "path_fedpft_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-44-20')\n", "\n", - "path_fedavg_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','18-16-41')\n", - "path_fedavg_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','16-36-16')\n" + "path_fedavg_resutls_cifar100 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','23-24-25')\n", + "path_fedavg_resutls_caltech101 = os.path.join(os.path.realpath('..'),'outputs','2024-04-14','22-32-11')\n" ] }, { "cell_type": "code", - "execution_count": 28, + "execution_count": 19, "id": "2e3e165c-1ce6-4efa-a4e1-1372586e436e", "metadata": {}, "outputs": [], @@ -84,7 +72,7 @@ }, { "cell_type": "code", - "execution_count": 33, + "execution_count": 20, "id": "77b70c73", "metadata": {}, "outputs": [], @@ -97,49 +85,13 @@ }, { "cell_type": "code", - "execution_count": 2, - 
"id": "6f4c87ad", - "metadata": {}, - "outputs": [], - "source": [ - "fedavg_cifar = [(1, 0.06924765515865097),\n", - " (2, 0.1315106765116743),\n", - " (3, 0.16773099181800039),\n", - " (4, 0.1946717222111355),\n", - " (5, 0.2171223308720814),\n", - " (6, 0.2375773298742766),\n", - " (7, 0.2597285970864099),\n", - " (8, 0.276092596288166),\n", - " (9, 0.290560766314109),\n", - " (10, 0.3036320095789264),\n", - " (11, 0.3128118140091798),\n", - " (12, 0.3261823987228098),\n", - " (13, 0.33745759329475156),\n", - " (14, 0.3477349830373179),\n", - " (15, 0.35831171422869684),\n", - " (16, 0.36679305527838757),\n", - " (17, 0.37407703053282776),\n", - " (18, 0.3817601277190182),\n", - " (19, 0.38824585910995807),\n", - " (20, 0.3942326880862103)]" - ] - }, - { - "cell_type": "code", - "execution_count": 59, + "execution_count": 21, "id": "e1a678de", "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "No artists with labels found to put in legend. Note that artists whose label start with an underscore are ignored when legend() is called with no argument.\n" - ] - }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "

" ] @@ -149,13 +101,23 @@ } ], "source": [ + "color1 = 'blue'\n", + "color2 = 'red'\n", + "\n", "def viz():\n", " fig, axs = plt.subplots(figsize=(10, 2), nrows=1, ncols=2)\n", " \n", - " # cifar100 - fedavg\n", - " axs[0].plot([r for r, _ in fedavg_cifar], [a for _, a in fedavg_cifar], label='FedAvg', linewidth=2.0)\n", - " \n", + " # cifar100\n", + " axs[0].plot([r for r, _ in fedavg_cifar], [a for _, a in fedavg_cifar], label='FedAvg', color=color1, linewidth=2.0)\n", + " axs[0].scatter([r for r, _ in fedpft_cifar], [a for _, a in fedpft_cifar], label='FedPFT', color=color2, marker='x', s=100)\n", " axs[0].set_title('CIFAR100 - ResNet50')\n", + " axs[0].set_ylim(0, 0.7)\n", + " \n", + " # caltech101\n", + " axs[1].plot([r for r, _ in fedavg_caltech], [a for _, a in fedavg_caltech], label='FedAvg', color=color1, linewidth=2.0)\n", + " axs[1].scatter([r for r, _ in fedpft_caltech], [a for _, a in fedpft_caltech], label='FedPFT', color=color2, marker='x', s=100)\n", + " axs[1].set_title('Caltech101 - Clip/ViT-B')\n", + " axs[1].set_ylim(0.2, 1)\n", " \n", " for ax in axs:\n", " ax.set_xticks([1, 5, 10 , 15, 20])\n", @@ -171,12 +133,12 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 22, "id": "92460065", "metadata": {}, "outputs": [], "source": [ - "saveFig(\"FedProx_mnist.png\", f)" + "saveFig(\"FedPft.png\", f)" ] } ], From 9964e770e90a228e68980f0269c55f6374f8fd31 Mon Sep 17 00:00:00 2001 From: mahdi Date: Mon, 15 Apr 2024 15:08:56 +0000 Subject: [PATCH 21/29] remove empty line --- baselines/fedpft/fedpft/models.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py index 7ebc9beed4a..b4594cb986a 100644 --- a/baselines/fedpft/fedpft/models.py +++ b/baselines/fedpft/fedpft/models.py @@ -103,7 +103,7 @@ def extract_features( 2D array containing labels of `features`. 
""" feature_extractor.to(device) - + features, labels = [], [] for dict in dataloader: batch_samples = dict["img"].to(device) @@ -164,7 +164,7 @@ def test( total += samples.shape[0] running_loss = nn.CrossEntropyLoss()(output, labels) loss += running_loss - + return loss.cpu().item(), correct / total From af4277759c020655c7f4a3f60ce35208ce617994 Mon Sep 17 00:00:00 2001 From: mahdi Date: Mon, 15 Apr 2024 15:12:52 +0000 Subject: [PATCH 22/29] removed extended_readme --- baselines/fedpft/EXTENDED_README.md | 123 ---------------------------- 1 file changed, 123 deletions(-) delete mode 100644 baselines/fedpft/EXTENDED_README.md diff --git a/baselines/fedpft/EXTENDED_README.md b/baselines/fedpft/EXTENDED_README.md deleted file mode 100644 index 9c8f5bc72fa..00000000000 --- a/baselines/fedpft/EXTENDED_README.md +++ /dev/null @@ -1,123 +0,0 @@ - -# Extended Readme - -> The baselines are expected to run in a machine running Ubuntu 22.04 - -While `README.md` should include information about the baseline you implement and how to run it, this _extended_ readme provides info on what's the expected directory structure for a new baseline and more generally the instructions to follow before your baseline can be merged into the Flower repository. Please follow closely these instructions. It is likely that you have already completed steps 1-2. - -1. Fork the Flower repository and clone it. -2. Navigate to the `baselines/` directory and from there run: - ```bash - # This will create a new directory with the same structure as this `baseline_template` directory. - ./dev/create-baseline.sh - ``` -3. All your code and configs should go into a sub-directory with the same name as the name of your baseline. - * The sub-directory contains a series of Python scripts that you can edit. Please stick to these files and consult with us if you need additional ones. - * There is also a basic config structure in `/conf` ready be parsed by [Hydra](https://hydra.cc/) when executing your `main.py`. 
-4. Therefore, the directory structure in your baseline should look like: - ```bash - baselines/ - ├── README.md # describes your baseline and everything needed to use it - ├── EXTENDED_README.md # to remove before creating your PR - ├── pyproject.toml # details your Python environment - └── - ├── *.py # several .py files including main.py and __init__.py - └── conf - └── *.yaml # one or more Hydra config files - - ``` -> :warning: Make sure the variable `name` in `pyproject.toml` is set to the name of the sub-directory containing all your code. - -5. Add your dependencies to the `pyproject.toml` (see below a few examples on how to do it). Read more about Poetry below in this `EXTENDED_README.md`. -6. Regularly check that your coding style and the documentation you add follow good coding practices. To test whether your code meets the requirements, please run the following: - ```bash - # After activating your environment and from your baseline's directory - cd .. # to go to the top-level directory of all baselines - ./dev/test-baseline.sh - ./dev/test-baseline-structure.sh - ``` - Both `test-baseline.sh` and `test-baseline-structure.sh` will also be automatically run when you create a PR, and both tests need to pass for the baseline to be merged. - To automatically solve some formatting issues and apply easy fixes, please run the formatting script: - ```bash - # After activating your environment and from your baseline's directory - cd .. # to go to the top-level directory of all baselines - ./dev/format-baseline.sh - ``` -7. Ensure that the Python environment for your baseline can be created without errors by simply running `poetry install` and that this is properly described later when you complete the `Environment Setup` section in `README.md`. This is specially important if your environment requires additional steps after doing `poetry install`. -8. Ensure that your baseline runs with default arguments by running `poetry run python -m .main`. 
Then, describe this and other forms of running your code in the `Running the Experiments` section in `README.md`. -9. Once your code is ready and you have checked: - * that following the instructions in your `README.md` the Python environment can be created correctly - - * that running the code following your instructions can reproduce the experiments in the paper - - , then you just need to create a Pull Request (PR) to kickstart the process of merging your baseline into the Flower repository. - -> Once you are happy to merge your baseline contribution, please delete this `EXTENDED_README.md` file. - - -## About Poetry - -We use Poetry to manage the Python environment for each individual baseline. You can follow the instructions [here](https://python-poetry.org/docs/) to install Poetry in your machine. - - -### Specifying a Python Version (optional) -By default, Poetry will use the Python version in your system. In some settings, you might want to specify a particular version of Python to use inside your Poetry environment. You can do so with [`pyenv`](https://github.com/pyenv/pyenv). Check the documentation for the different ways of installing `pyenv`, but one easy way is using the [automatic installer](https://github.com/pyenv/pyenv-installer): -```bash -curl https://pyenv.run | bash # then, don't forget links to your .bashrc/.zshrc -``` - -You can then install any Python version with `pyenv install ` (e.g. `pyenv install 3.9.17`). Then, in order to use that version for your baseline, you'd do the following: - -```bash -# cd to your baseline directory (i.e. 
where the `pyproject.toml` is) -pyenv local - -# set that version for poetry -poetry env use - -# then you can install your Poetry environment (see the next setp) -``` - -### Installing Your Environment -With the Poetry tool already installed, you can create an environment for this baseline with commands: -```bash -# run this from the same directory as the `pyproject.toml` file is -poetry install -``` - -This will create a basic Python environment with just Flower and additional packages, including those needed for simulation. Next, you should add the dependencies for your code. It is **critical** that you fix the version of the packages you use using a `=` not a `=^`. You can do so via [`poetry add`](https://python-poetry.org/docs/cli/#add). Below are some examples: - -```bash -# For instance, if you want to install tqdm -poetry add tqdm==4.65.0 - -# If you already have a requirements.txt, you can add all those packages (but ensure you have fixed the version) in one go as follows: -poetry add $( cat requirements.txt ) -``` -With each `poetry add` command, the `pyproject.toml` gets automatically updated so you don't need to keep that `requirements.txt` as part of this baseline. - - -More critically however, is adding your ML framework of choice to the list of dependencies. For some frameworks you might be able to do so with the `poetry add` command. Check [the Poetry documentation](https://python-poetry.org/docs/cli/#add) for how to add packages in various ways. For instance, let's say you want to use PyTorch: - -```bash -# with plain `pip` you'd run a command such as: -pip install torch==1.13.1+cu117 torchvision==0.14.1+cu117 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu117 - -# to add the same 3 dependencies to your Poetry environment you'd need to add the URL to the wheel that the above pip command auto-resolves for you. -# You can find those wheels in `https://download.pytorch.org/whl/cu117`. 
Copy the link and paste it after the `poetry add` command. -# For instance to add `torch==1.13.1+cu117` and a x86 Linux system with Python3.8 you'd: -poetry add https://download.pytorch.org/whl/cu117/torch-1.13.1%2Bcu117-cp38-cp38-linux_x86_64.whl -# you'll need to repeat this for both `torchvision` and `torchaudio` -``` -The above is just an example of how you can add these dependencies. Please refer to the Poetry documentation to extra reference. - -If all attempts fail, you can still install packages via standard `pip`. You'd first need to source/activate your Poetry environment. -```bash -# first ensure you have created your environment -# and installed the base packages provided in the template -poetry install - -# then activate it -poetry shell -``` -Now you are inside your environment (pretty much as when you use `virtualenv` or `conda`) so you can install further packages with `pip`. Please note that, unlike with `poetry add`, these extra requirements won't be captured by `pyproject.toml`. Therefore, please ensure that you provide all instructions needed to: (1) create the base environment with Poetry and (2) install any additional dependencies via `pip` when you complete your `README.md`. \ No newline at end of file From b600ed32df04a1850fbab50b7372bb2e96c6f58d Mon Sep 17 00:00:00 2001 From: jafermarq Date: Tue, 23 Apr 2024 08:14:10 +0000 Subject: [PATCH 23/29] minor changes --- baselines/fedpft/README.md | 6 +++--- baselines/fedpft/pyproject.toml | 1 + 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index c25f6de8f71..45eee5954d7 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -1,8 +1,8 @@ --- title: Parametric Feature Transfer, One-shot Federated Learning with Foundation Models url: https://arxiv.org/abs/2402.01862 -labels: [foundation-models, pre-trained, one-shot, one-round] # please add between 4 and 10 single-word (maybe two-words) labels (e.g. 
system heterogeneity, image classification, asynchronous, weight sharing, cross-silo). Do not use "" -dataset: [CIFAR100, Caltech101] # list of datasets you include in your baseline. Do not use "" +labels: [foundation-models, pre-trained, one-shot, one-round] +dataset: [CIFAR-100, Caltech101] --- # FedPFT: One-shot Federated Learning with Foundation Models @@ -109,4 +109,4 @@ python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=cli The above commands would generate results that you can plot and would look like the plot shown below. This plot was generated using the jupyter notebook in the `docs/` directory of this baseline after running the commands above. -![](_static/FedPft.png) \ No newline at end of file +![](_static/FedPft.png) diff --git a/baselines/fedpft/pyproject.toml b/baselines/fedpft/pyproject.toml index 30e47defbda..11bbddd0e17 100644 --- a/baselines/fedpft/pyproject.toml +++ b/baselines/fedpft/pyproject.toml @@ -58,6 +58,7 @@ pytest = "==6.2.4" pytest-watch = "==4.2.0" ruff = "==0.0.272" types-requests = "==2.27.7" +virtualenv = "==20.21.0" [tool.isort] line_length = 88 From 8732803d767634c66b49dd9242bdb9c6df637433 Mon Sep 17 00:00:00 2001 From: jafermarq Date: Tue, 23 Apr 2024 09:14:46 +0000 Subject: [PATCH 24/29] minor fix --- baselines/fedpft/fedpft/models.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py index b4594cb986a..b9b85d4c4cd 100644 --- a/baselines/fedpft/fedpft/models.py +++ b/baselines/fedpft/fedpft/models.py @@ -126,7 +126,7 @@ def test( feature_extractor: torch.nn.Module, device: torch.device, ) -> Tuple[float, float]: - """"Evaluates the `classifier_head` on the dataset. + """Evaluates the `classifier_head` on the dataset. 
Parameters ---------- From 6a9bb2b07b0f723e36300b3d780d1eec1f2f21f3 Mon Sep 17 00:00:00 2001 From: mahdi Date: Wed, 24 Apr 2024 00:24:19 +0000 Subject: [PATCH 25/29] fix formating --- baselines/fedpft/README.md | 14 +++---- baselines/fedpft/fedpft/client.py | 4 +- baselines/fedpft/fedpft/dataset.py | 5 ++- baselines/fedpft/fedpft/main.py | 1 + baselines/fedpft/fedpft/models.py | 59 +++++++++++++++-------------- baselines/fedpft/fedpft/server.py | 10 +++-- baselines/fedpft/fedpft/strategy.py | 4 +- baselines/fedpft/fedpft/utils.py | 37 +++++++++--------- 8 files changed, 74 insertions(+), 60 deletions(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index dc02d60a76a..1856223ba45 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -18,11 +18,11 @@ dataset: [CIFAR-100, Caltech101] ## About this baseline -**What’s implemented:** The code in this directory replicates the centralized experiments in *Parametric Feature Transfer, One-shot Federated Learning with Foundation Models* (Beitollahi et al., 2024) for CIFAR100 and Caltech101 datasets, which proposed the FedPFT algorithm. Concretely, it replicates the results in Section 5.2. +**What’s implemented:** The code in this directory replicates the centralized experiments in *Parametric Feature Transfer, One-shot Federated Learning with Foundation Models* (Beitollahi et al., 2024) for CIFAR-100 and Caltech101 datasets, which proposed the FedPFT algorithm. Concretely, it replicates the results in Section 5.2. -**Datasets:** CIFAR100 and Caltech101 from HuggingFace +**Datasets:** CIFAR-100 and Caltech101 from HuggingFace -**Hardware Setup:** These experiments were run on a desktop machine with 8 CPU threads and Nvidia 4070 with 8Gigs of ram. +**Hardware Setup:** These experiments were run on a desktop machine with 8 CPU threads and Nvidia 4070 with 8 gigs of memory. 
**Contributors:** Mahdi Beitollahi @@ -32,14 +32,14 @@ dataset: [CIFAR-100, Caltech101] **Task:** Image classification **Model:** This directory utilizes two pre-trained, frozen models as shown in Table 1 of the paper: -* ResNet50 pre-trained on ImageNet is used for CIFAR100 dataset(see `models/resnet50`). +* ResNet50 pre-trained on ImageNet is used for CIFAR-100 dataset(see `models/resnet50`). * CLIP, ViT-B/32 pre-trained on web dataset is used for Caltech101 dataset (see `models/clip_vit`) -**Dataset:** This baseline includes the CIFAR100 and Caltech101 datasets. By default, it will be partitioned into 50 clients following a Dirichlet distribution with $\alpha$=0.1. +**Dataset:** This baseline includes the CIFAR-100 and Caltech101 datasets. By default, it will be partitioned into 50 clients following a Dirichlet distribution with $\alpha$=0.1. | Dataset | #classes | #partitions | partitioning method | partition settings | | :------ | :---: | :---: | :---: | :---: | -| CIFAR100 | 100 | 50 | Dirichlet distribution | $\alpha$=0.1 | +| CIFAR-100 | 100 | 50 | Dirichlet distribution | $\alpha$=0.1 | | Caltech101 | 101 | 50 | Dirichlet distribution | $\alpha$=0.1 | **Training Hyperparameters:** The following table shows the main hyperparameters for this baseline with their default value (i.e. 
the value used if you run `python main.py` directly) @@ -75,7 +75,7 @@ poetry install ## Running the Experiments -To run this FedPFT with CIFAR100 baseline, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: +To run this FedPFT with CIFAR-100 baseline, first ensure you have activated your Poetry environment (execute `poetry shell` from this directory), then: ```bash python -m fedpft.main # this will run using the default settings in the `conf/config.yaml` diff --git a/baselines/fedpft/fedpft/client.py b/baselines/fedpft/fedpft/client.py index 434055808f8..c20aefe9236 100644 --- a/baselines/fedpft/fedpft/client.py +++ b/baselines/fedpft/fedpft/client.py @@ -22,6 +22,7 @@ class FedPFTClient(fl.client.NumPyClient): """Flower FedPFTClient.""" + # pylint: disable=too-many-arguments def __init__( self, trainloader: DataLoader, @@ -83,7 +84,7 @@ def fit( features=features, labels=labels, n_mixtures=int(config["n_mixtures"]), - cov_type=config["cov_type"], + cov_type=str(config["cov_type"]), seed=int(config["seed"]), tol=float(config["tol"]), max_iter=int(config["max_iter"]), @@ -130,6 +131,7 @@ def fit( return self.get_parameters(config={}), len(self.trainloader.dataset), {} +# pylint: disable=too-many-arguments def generate_client_fn( client_cfg: DictConfig, trainloaders: List[DataLoader], diff --git a/baselines/fedpft/fedpft/dataset.py b/baselines/fedpft/fedpft/dataset.py index 733234074ef..df41d10996a 100644 --- a/baselines/fedpft/fedpft/dataset.py +++ b/baselines/fedpft/fedpft/dataset.py @@ -8,9 +8,11 @@ from torchvision import transforms +# pylint: disable=too-many-instance-attributes class Dataset: """Dataset class.""" + # pylint: disable=too-many-locals, too-many-arguments def __init__( self, dataset: str, @@ -30,7 +32,7 @@ def __init__( Parameters ---------- dataset : str - Name of dataset to be downloaded from HuggingFace. + Name or path of the dataset to be downloaded from HuggingFace. 
num_clients: int Number of clients. batch_size: int @@ -60,6 +62,7 @@ def __init__( self.seed = seed self.split_size = split_size self.image_column_name = image_column_name + self.kwargs = kwargs def get_loaders(self): """Partition the datasets and return a list of dataloaders.""" diff --git a/baselines/fedpft/fedpft/main.py b/baselines/fedpft/fedpft/main.py index 9860b1232bf..debc4b35f52 100644 --- a/baselines/fedpft/fedpft/main.py +++ b/baselines/fedpft/fedpft/main.py @@ -13,6 +13,7 @@ from fedpft.client import generate_client_fn +# pylint: disable=too-many-locals @hydra.main(config_path="conf", config_name="base", version_base=None) def main(cfg: DictConfig) -> None: """Run federated learning with frozen, pre-trained models. diff --git a/baselines/fedpft/fedpft/models.py b/baselines/fedpft/fedpft/models.py index b9b85d4c4cd..3a57cf52141 100644 --- a/baselines/fedpft/fedpft/models.py +++ b/baselines/fedpft/fedpft/models.py @@ -8,6 +8,7 @@ import torch.utils import torchvision.transforms as transforms from flwr.common.logger import log +from numpy.typing import NDArray from torch import nn from torch.utils.data import DataLoader from torchvision import models @@ -16,17 +17,17 @@ def resnet50() -> torch.nn.modules: """Return ResNet-50 model as feature extractor.""" - resnet50 = models.resnet50(weights=models.ResNet50_Weights.DEFAULT) + resnet50_model = models.resnet50(weights=models.ResNet50_Weights.DEFAULT) # Remove last layer and flatten outputs - resnet50 = torch.nn.Sequential( - *(list(resnet50.children())[:-1]), torch.nn.Flatten() + resnet50_model = torch.nn.Sequential( + *(list(resnet50_model.children())[:-1]), torch.nn.Flatten() ) # Set the hidden_dimension - resnet50.hidden_dimension = 2048 + resnet50_model.hidden_dimension = 2048 - return resnet50 + return resnet50_model def clip_vit(name: str) -> torch.nn.modules: @@ -47,9 +48,10 @@ def __init__(self, vision_model): self.vision_model = vision_model self.hidden_dimension = vision_model.config.hidden_size - 
def forward(self, input): - output = self.vision_model(input) - return output[1] # return pooled_output (CLS token) + def forward(self, x): + """Return pooled output (CLS token).""" + output = self.vision_model(x) + return output[1] vision_model = CLIPModel.from_pretrained(name).vision_model @@ -71,18 +73,18 @@ def transform(mean: List, std: List) -> transforms.Compose: transforms.Compose Transform function for normalizing images """ - tr = transforms.Compose( + transform_comp = transforms.Compose( [ transforms.ToTensor(), transforms.Normalize(mean, std), ] ) - return tr + return transform_comp def extract_features( dataloader: DataLoader, feature_extractor: torch.nn.Module, device: torch.device -) -> Tuple[np.array, np.array]: +) -> Tuple[NDArray, NDArray]: """Extract features and labels from images using feature extractor. Parameters @@ -97,27 +99,27 @@ def extract_features( Returns ------- - features : np.array + features : NDArray 2D array containing features extracted from `feature_extractor`. - labels : np.array + labels : NDArray 2D array containing labels of `features`. 
""" feature_extractor.to(device) features, labels = [], [] - for dict in dataloader: - batch_samples = dict["img"].to(device) - batch_label = dict["label"].to(device) + for sample in dataloader: + batch_samples = sample["img"].to(device) + batch_label = sample["label"].to(device) with torch.no_grad(): feature = feature_extractor(batch_samples) features.append(feature.cpu().detach().numpy()) labels.append(batch_label.cpu().detach().numpy()) # reshape feauturs and labels into a single numpy array - features = np.concatenate(features, axis=0, dtype=np.float64) - labels = np.concatenate(labels, dtype=int) + features_np = np.concatenate(features, axis=0).astype("float64") + labels_np = np.concatenate(labels) - return features, labels + return features_np, labels_np def test( @@ -153,9 +155,9 @@ def test( feature_extractor.to(device) correct, total, loss = 0, 0, 0 - for dict in dataloader: - samples = dict["img"].to(device) - labels = dict["label"].to(device) + for sample in dataloader: + samples = sample["img"].to(device) + labels = sample["label"].to(device) with torch.no_grad(): feature = feature_extractor(samples) output = classifier_head(feature) @@ -163,11 +165,12 @@ def test( correct += (pred == labels).sum().item() total += samples.shape[0] running_loss = nn.CrossEntropyLoss()(output, labels) - loss += running_loss + loss += running_loss.cpu().item() - return loss.cpu().item(), correct / total + return loss, correct / total +# pylint: disable=too-many-locals, too-many-arguments def train( classifier_head: torch.nn.Linear, dataloader: DataLoader, @@ -204,10 +207,10 @@ def train( for epoch in range(num_epochs): correct, total, loss = 0, 0, 0 - for _, dict in enumerate(dataloader): + for _, batch in enumerate(dataloader): classifier_head.zero_grad() - samples = dict["img"].to(device) - labels = dict["label"].to(device) + samples = batch["img"].to(device) + labels = batch["label"].to(device) if feature_extractor: with torch.no_grad(): samples = 
feature_extractor(samples) @@ -220,4 +223,4 @@ def train( running_loss.backward() opt.step() if verbose: - log(logging.INFO, f"Epoch:{epoch+1} --- Accuracy: {correct/total}") + log(logging.INFO, "Epoch: %s --- Accuracy: %s", epoch + 1, correct / total) diff --git a/baselines/fedpft/fedpft/server.py b/baselines/fedpft/fedpft/server.py index 00d88360e9f..9c6c605884d 100644 --- a/baselines/fedpft/fedpft/server.py +++ b/baselines/fedpft/fedpft/server.py @@ -29,6 +29,7 @@ def fedpft_get_on_fit_config_fn( Function to return a config with the `lr` and `num_epochs` """ + # pylint: disable=unused-argument def fit_config(server_round: int) -> Dict[str, str]: """Return a configuration for training Gaussian Mixtures.""" config = { @@ -44,14 +45,14 @@ def fit_config(server_round: int) -> Dict[str, str]: def fedavg_get_on_fit_config_fn( - lr: float, + learning_rate: float, num_epochs: int, ) -> Callable[[int], Dict[str, str]]: """Return a function which returns FedAvg training configurations. Parameters ---------- - lr : float + learning_rate : float Client's learning rate num_epochs : int Number of epochs for local learning of clients @@ -59,13 +60,14 @@ def fedavg_get_on_fit_config_fn( Returns ------- Callable[[int], Dict[str, str]] - Function to return a config with the `lr` and `num_epochs` + Function to return a config with the `learning_rate` and `num_epochs` """ + # pylint: disable=unused-argument def fit_config(server_round: int) -> Dict[str, str]: """Return a configuration number of epochs and learning rate.""" config = { - "lr": str(lr), + "lr": str(learning_rate), "num_epochs": str(num_epochs), } return config diff --git a/baselines/fedpft/fedpft/strategy.py b/baselines/fedpft/fedpft/strategy.py index f9546140124..2e4302bde45 100644 --- a/baselines/fedpft/fedpft/strategy.py +++ b/baselines/fedpft/fedpft/strategy.py @@ -68,6 +68,7 @@ def __init__( self.num_epochs = num_epochs self.device = device + # pylint: disable=too-many-locals def aggregate_fit( self, 
server_round: int, @@ -79,10 +80,11 @@ def aggregate_fit( if not self.accept_failures and failures: raise Exception("there are failures and failures are not accepted") + assert self.on_fit_config_fn is not None config = self.on_fit_config_fn(server_round) # Sample from the GMMs to create synthetic feature dataset - synthetic_features_dataset = [] + synthetic_features_dataset: List[Union[Dict, Tuple]] = [] for _, fit_res in results: # Convert byte parameters into ndarrays and GMMParameters ndarray = parameters_to_ndarrays(fit_res.parameters) diff --git a/baselines/fedpft/fedpft/utils.py b/baselines/fedpft/fedpft/utils.py index c1a27c14647..b7812d556d0 100644 --- a/baselines/fedpft/fedpft/utils.py +++ b/baselines/fedpft/fedpft/utils.py @@ -4,7 +4,7 @@ from typing import List import numpy as np -from flwr.common import NDArrays +from numpy.typing import NDArray from sklearn.mixture import GaussianMixture @@ -12,19 +12,19 @@ class GMMParameters: """GMM parameters.""" - label: int - means: NDArrays - weights: NDArrays - covariances: NDArrays - num_samples: int + label: NDArray + means: NDArray + weights: NDArray + covariances: NDArray + num_samples: NDArray -def gmmparam_to_ndarrays(gmm: GMMParameters) -> NDArrays: +def gmmparam_to_ndarrays(gmm: GMMParameters) -> List[NDArray]: """Convert gmm object to NumPy ndarrays.""" return [gmm.label, gmm.means, gmm.weights, gmm.covariances, gmm.num_samples] -def ndarrays_to_gmmparam(ndarrays: NDArrays) -> GMMParameters: +def ndarrays_to_gmmparam(ndarrays: NDArray) -> GMMParameters: """Convert NumPy ndarray to GMM object.""" return GMMParameters( label=ndarrays[0], @@ -35,9 +35,10 @@ def ndarrays_to_gmmparam(ndarrays: NDArrays) -> GMMParameters: ) +# pylint: disable=too-many-arguments def learn_gmm( - features: np.array, - labels: np.array, + features: NDArray, + labels: NDArray, n_mixtures: int, cov_type: str, seed: int, @@ -48,10 +49,10 @@ def learn_gmm( Parameters ---------- - features : np.array + features : NDArray A 2-d array 
with size (n_samples, feature_dimension) containing extracted features for all the samples. - labels : np.array + labels : NDArray An array with size (n_samples) containing labels associated for each sample in `features`. n_mixtures : int @@ -86,17 +87,17 @@ def learn_gmm( gmm.fit(cond_features) gmm_list.append( GMMParameters( - label=label, + label=np.array(label), means=gmm.means_.astype("float16"), weights=gmm.weights_.astype("float16"), covariances=gmm.covariances_.astype("float16"), - num_samples=len(cond_features), + num_samples=np.array(len(cond_features)), ) ) return gmm_list -def chunks(lst, n): - """Yield successive n-sized chunks from lst.""" - for i in range(0, len(lst), n): - yield lst[i : i + n] +def chunks(lst, chunk_size): + """Yield successive chunk_size-sized chunks from lst.""" + for i in range(0, len(lst), chunk_size): + yield lst[i : i + chunk_size] From ffc3d8c7307f6f6819a95bd8dcd6368a32712663 Mon Sep 17 00:00:00 2001 From: mahdi Date: Wed, 24 Apr 2024 17:23:18 +0000 Subject: [PATCH 26/29] add email address --- baselines/fedpft/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index 1856223ba45..cad603d124e 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -24,7 +24,7 @@ dataset: [CIFAR-100, Caltech101] **Hardware Setup:** These experiments were run on a desktop machine with 8 CPU threads and Nvidia 4070 with 8 gigs of memory. -**Contributors:** Mahdi Beitollahi +**Contributors:** Mahdi Beitollahi (mahdi.beitollahi@queensu.ca). 
## Experimental Setup From ffb2be665ead2f0e379421e96271e8dfe1dd9261 Mon Sep 17 00:00:00 2001 From: jafermarq Date: Wed, 24 Apr 2024 21:08:50 +0000 Subject: [PATCH 27/29] minor update --- baselines/fedpft/README.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index cad603d124e..8b0fb3d5752 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -22,7 +22,7 @@ dataset: [CIFAR-100, Caltech101] **Datasets:** CIFAR-100 and Caltech101 from HuggingFace -**Hardware Setup:** These experiments were run on a desktop machine with 8 CPU threads and Nvidia 4070 with 8 gigs of memory. +**Hardware Setup:** These experiments were run on a desktop machine with 8 CPU threads and Nvidia 4070 with 8GB of VRAM. **Contributors:** Mahdi Beitollahi (mahdi.beitollahi@queensu.ca). @@ -35,7 +35,7 @@ dataset: [CIFAR-100, Caltech101] * ResNet50 pre-trained on ImageNet is used for CIFAR-100 dataset(see `models/resnet50`). * CLIP, ViT-B/32 pre-trained on web dataset is used for Caltech101 dataset (see `models/clip_vit`) -**Dataset:** This baseline includes the CIFAR-100 and Caltech101 datasets. By default, it will be partitioned into 50 clients following a Dirichlet distribution with $\alpha$=0.1. +**Dataset:** This baseline includes the CIFAR-100 and Caltech101 datasets via [flwr-datasets](https://flower.ai/docs/datasets/). By default, it will be partitioned into 50 clients following a Dirichlet distribution with $\alpha$=0.1. 
| Dataset | #classes | #partitions | partitioning method | partition settings | | :------ | :---: | :---: | :---: | :---: | From 1ef9430660dc70802e5cbe5b9b396242c61f6c41 Mon Sep 17 00:00:00 2001 From: Mahdi Beitollahi <96784135+mahdibeit@users.noreply.github.com> Date: Thu, 25 Apr 2024 13:05:02 -0400 Subject: [PATCH 28/29] Update baselines/fedpft/README.md update readme Co-authored-by: Javier --- baselines/fedpft/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/baselines/fedpft/README.md b/baselines/fedpft/README.md index 8b0fb3d5752..45bddfda610 100644 --- a/baselines/fedpft/README.md +++ b/baselines/fedpft/README.md @@ -103,7 +103,7 @@ python -m fedpft.main dataset=CIFAR100 model=resnet50 python -m fedpft.main dataset=Caltech101 model=clip # FedAvg with pre-trained, frozen models -python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 strategy.on_fit_config_fn.num_epochs=1=1 num_gpus=0.5 +python -m fedpft.main strategy=fedavg client=fedavg dataset=CIFAR100 model=resnet50 num_rounds=20 strategy.on_fit_config_fn.num_epochs=1 num_gpus=0.5 python -m fedpft.main strategy=fedavg client=fedavg dataset=Caltech101 model=clip num_rounds=20 num_gpus=0.2 ``` From 2f6d66de0009b7f153b80b62b82990a048fbce83 Mon Sep 17 00:00:00 2001 From: Mahdi Beitollahi <96784135+mahdibeit@users.noreply.github.com> Date: Thu, 25 Apr 2024 13:05:51 -0400 Subject: [PATCH 29/29] Update baselines/fedpft/fedpft/conf/strategy/fedavg.yaml fix config arg Co-authored-by: Javier --- baselines/fedpft/fedpft/conf/strategy/fedavg.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml index 166bcd10aef..b7703e78eb6 100644 --- a/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml +++ b/baselines/fedpft/fedpft/conf/strategy/fedavg.yaml @@ -5,7 +5,7 @@ fraction_evaluate: 1 accept_failures: False on_fit_config_fn: _target_: 
fedpft.server.fedavg_get_on_fit_config_fn - lr: 0.01 + learning_rate: 0.01 num_epochs: 10 evaluate_metrics_aggregation_fn: _target_: fedpft.server.weighted_average