scaleoutsystems · ahellander · Mar 24, 2024 · Feb 5, 2024 · Mar 2, 2024 · Mar 5, 2024
diff --git a/examples/async-simulation/.gitignore → examples/async-clients/.gitignore b/examples/async-simulation/.gitignore → examples/async-clients/.gitignore
@@ -2,5 +2,6 @@ data
 *.npz
 *.tgz
 *.tar.gz
+*.log
 .async-simulation
 client.yaml
diff --git a/examples/async-clients/Experiment.ipynb b/examples/async-clients/Experiment.ipynb
diff --git a/examples/async-clients/README.md b/examples/async-clients/README.md
@@ -0,0 +1,77 @@
+# ASYNC CLIENTS 
+This example shows how to experiment with intermittent and asynchronous client workflows.     
+
+## Prerequisites
+- [Python 3.8, 3.9 or 3.10](https://www.python.org/downloads)
+- [Docker](https://docs.docker.com/get-docker)
+- [Docker Compose](https://docs.docker.com/compose/install)
+
+## Running the example (pseudo-distributed, single host)
+
+First, make sure that FEDn is installed (we recommend using a virtual environment)
+
+Clone FEDn
+```sh
+git clone https://github.com/scaleoutsystems/fedn.git
+```
+
+Install FEDn and dependencies
+
+```
+pip install fedn
+```
+
+Or from source, standing in the folder 'fedn/fedn'
+
+```
+pip install .
+```
+
+### Prepare the example environment, the compute package and seed model
+
+Standing in the folder fedn/examples/async-clients
+```
+pip install -r requirements.txt
+```
+
+Create the compute package and seed model:
+```
+tar -czvf package.tgz client
+```
+
+```
+python client/entrypoint.py init_seed
+```
+
+You will now have a file 'seed.npz' in the directory.
+
+### Running a simulation
+
+Deploy FEDn on localhost. Standing in the FEDn root directory:
+
+```
+docker-compose up 
+```
+
+Initialize FEDn with the compute package and seed model
+
+```
+python init_fedn.py
+```
+
+Start simulating clients
+```
+python run_clients.py
+```
+
+Start the experiment / training sessions: 
+
+```
+python run_experiment.py
+```
+
+Once global models start being produced, you can start analyzing results using the API client; refer to the notebook "Experiment.ipynb" for instructions.
+
+
+
+
diff --git a/examples/async-clients/client/entrypoint.py b/examples/async-clients/client/entrypoint.py
@@ -0,0 +1,142 @@
+# /bin/python
+import fire
+import numpy as np
+from sklearn.datasets import make_classification
+from sklearn.metrics import accuracy_score
+from sklearn.model_selection import train_test_split
+from sklearn.neural_network import MLPClassifier
+
+from fedn.utils.helpers.helpers import get_helper, save_metadata, save_metrics
+
+# Name of the FEDn helper module, passed to get_helper() when saving/loading parameters.
+HELPER_MODULE = 'numpyhelper'
+# NOTE(review): not referenced anywhere in the visible part of this file - confirm it is still needed.
+ARRAY_SIZE = 10000
+
+
+def compile_model(max_iter=1):
+    """ Build an MLPClassifier and fit it once on freshly generated data.
+
+    The single fit call only serves to create the fitted attributes that
+    predict() relies on; the weights and biases are overwritten during
+    FL training.
+
+    :param max_iter: Passed on as ``max_iter`` to MLPClassifier.
+    :type max_iter: int
+    :return: The fitted classifier.
+    :rtype: sklearn.neural_network.MLPClassifier
+    """
+    features, labels, _, _ = make_data()
+    classifier = MLPClassifier(max_iter=max_iter)
+    classifier.fit(features, labels)
+    return classifier
+
+
+def save_parameters(model, out_path):
+    """ Write the model's weights and biases to disk.
+
+    The list of weight matrices (``coefs_``) is concatenated with the list
+    of bias vectors (``intercepts_``) and saved through the FEDn helper.
+
+    :param model: Fitted model exposing ``coefs_`` and ``intercepts_``.
+    :type model: sklearn.neural_network.MLPClassifier
+    :param out_path: The path to save to.
+    :type out_path: str
+    """
+    numpy_helper = get_helper(HELPER_MODULE)
+    numpy_helper.save(model.coefs_ + model.intercepts_, out_path)
+
+
+def load_parameters(model_path):
+    """ Read saved model parameters from disk.
+
+    :param model_path: The path to load from.
+    :type model_path: str
+    :return: The parameters as returned by the helper's ``load``.
+    """
+    return get_helper(HELPER_MODULE).load(model_path)
+
+
+def init_seed(out_path='seed.npz'):
+    """ Create the seed model and store its parameters.
+
+    :param out_path: The path to save the seed model to.
+    :type out_path: str
+    """
+    save_parameters(compile_model(), out_path)
+
+
+def make_data(n_min=50, n_max=100):
+    """ Simulate a local dataset with a random number n of training points.
+
+    A fixed synthetic classification problem (random_state=42) is generated
+    and split 80/20 into train and test parts. n is drawn with
+    np.random.randint(n_min, n_max) and n training rows are then picked
+    with np.random.choice; the test part is returned in full.
+
+    :param n_min: Lower bound passed to np.random.randint.
+    :type n_min: int
+    :param n_max: Upper bound passed to np.random.randint.
+    :type n_max: int
+    :return: X_train, y_train, X_test, y_test
+    :rtype: tuple
+    """
+    features, labels = make_classification(n_samples=100000, n_features=4, n_informative=4,
+                                           n_redundant=0, random_state=42)
+    X_train, X_test, y_train, y_test = train_test_split(features, labels, test_size=0.2, random_state=42)
+
+    sample_size = np.random.randint(n_min, n_max, 1)[0]
+    picked = np.random.choice(len(X_train), sample_size)
+    return X_train[picked, :], y_train[picked], X_test, y_test
+
+
+def train(in_model_path, out_model_path):
+    """ Run local training starting from a saved model and write the update.
+
+    :param in_model_path: Path of the parameters to start from.
+    :type in_model_path: str
+    :param out_model_path: Path the updated parameters and metadata are saved to.
+    :type out_model_path: str
+    """
+    # Restore the model: the first half of the list holds the weight
+    # matrices, the second half the bias vectors (see save_parameters)
+    parameters = load_parameters(in_model_path)
+    model = compile_model()
+    half = len(parameters)//2
+    model.coefs_, model.intercepts_ = parameters[:half], parameters[half:]
+
+    # Repeated partial_fit passes over the local data
+    X_train, y_train, _, _ = make_data()
+    epochs = 10
+    for _ in range(epochs):
+        model.partial_fit(X_train, y_train)
+
+    # Metadata needed for aggregation server side, saved as JSON
+    save_metadata({'num_examples': len(X_train)}, out_model_path)
+
+    # Save model update
+    save_parameters(model, out_model_path)
+
+
+def validate(in_model_path, out_json_path):
+    """ Score a saved model on the test split and write the metrics.
+
+    :param in_model_path: The path to the input model.
+    :type in_model_path: str
+    :param out_json_path: The path to save the output JSON to.
+    :type out_json_path: str
+    """
+    parameters = load_parameters(in_model_path)
+    model = compile_model()
+    half = len(parameters)//2
+    model.coefs_, model.intercepts_ = parameters[:half], parameters[half:]
+
+    # Only the test split is needed here
+    _, _, X_test, y_test = make_data()
+    predictions = model.predict(X_test)
+
+    # JSON schema
+    report = {"accuracy_score": accuracy_score(y_test, predictions)}
+
+    # Save JSON
+    save_metrics(report, out_json_path)
+
+
+if __name__ == '__main__':
+    # Expose the entry points as sub-commands on the command line
+    commands = {
+        'init_seed': init_seed,
+        'train': train,
+        'validate': validate,
+    }
+    fire.Fire(commands)
diff --git a/examples/async-clients/client/fedn.yaml b/examples/async-clients/client/fedn.yaml
@@ -0,0 +1,5 @@
+entry_points:
+  train:
+    command: python entrypoint.py train $ENTRYPOINT_OPTS
+  validate: 
+    command: python entrypoint.py validate $ENTRYPOINT_OPTS
diff --git a/examples/async-clients/img/async-clients.png b/examples/async-clients/img/async-clients.png
diff --git a/examples/async-simulation/init_fedn.py → examples/async-clients/init_fedn.py b/examples/async-simulation/init_fedn.py → examples/async-clients/init_fedn.py
@@ -4,5 +4,5 @@
 DISCOVER_PORT = 8092
 
 client = APIClient(DISCOVER_HOST, DISCOVER_PORT)
-client.set_package('package.tgz', 'numpyhelper')
-client.set_initial_model('seed.npz')
+client.set_active_package('package.tgz', 'numpyhelper')
+client.set_active_model('seed.npz')
diff --git a/examples/async-clients/requirements.txt b/examples/async-clients/requirements.txt
@@ -0,0 +1,3 @@
+fire==0.3.1
+numpy
+scikit-learn
diff --git a/examples/async-clients/run_clients.py b/examples/async-clients/run_clients.py
@@ -0,0 +1,77 @@
+"""This script starts N_CLIENTS using the SDK.
+
+
+
+
+
+If you are running with a local deploy of FEDn
+using docker compose, you need to make sure that clients
+are able to resolve the name "combiner" to 127.0.0.1
+
+One way to accomplish this is to edit your /etc/hosts,
+adding the line:
+
+127.0.0.1    combiner
+
+(this requires root privileges)
+"""
+
+import copy
+import time
+from multiprocessing import Process
+
+import numpy as np
+
+from fedn.network.clients.client import Client
+
+# Simulation settings.
+# DISCOVER_HOST / DISCOVER_PORT: copied into client_config below.
+# N_CLIENTS: number of client processes started in the main block.
+# N_CYCLES: number of connect/disconnect cycles each client runs.
+# CLIENTS_MAX_DELAY: exclusive upper bound (seconds) for the random start delay.
+# CLIENTS_ONLINE_FOR_SECONDS: passed to run_client as 'online_for'.
+settings = {
+    'DISCOVER_HOST': '127.0.0.1',
+    'DISCOVER_PORT': 8092,
+    'N_CLIENTS': 10,
+    'N_CYCLES': 100,
+    'CLIENTS_MAX_DELAY': 10,
+    'CLIENTS_ONLINE_FOR_SECONDS': 120
+}
+
+# Configuration dict handed to Client(); run_client overrides 'name' on its own copy.
+client_config = {'discover_host': settings['DISCOVER_HOST'], 'discover_port': settings['DISCOVER_PORT'], 'token': None, 'name': 'testclient',
+                 'client_id': 1, 'remote_compute_context': True, 'force_ssl': False, 'dry_run': False, 'secure': False,
+                 'preshared_cert': False, 'verify': False, 'preferred_combiner': False,
+                 'validator': True, 'trainer': True, 'init': None, 'logfile': 'test.log', 'heartbeat_interval': 2,
+                 'reconnect_after_missed_heartbeat': 30}
+
+
+def run_client(online_for=120, name='client'):
+    """ Simulates a client that starts and stops
+    at random intervals.
+
+    The client starts after a random delay drawn uniformly from
+    [0, CLIENTS_MAX_DELAY) seconds, stays online for 'online_for'
+    seconds (deterministic), then disconnects.
+
+    This is repeated for N_CYCLES.
+
+    :param online_for: Seconds to stay connected in each cycle.
+    :type online_for: int
+    :param name: The client name, set as 'name' in the client config.
+    :type name: str
+    """
+
+    conf = copy.deepcopy(client_config)
+    conf['name'] = name
+
+    # Use a generator seeded from OS entropy in this process. The global
+    # np.random state is copied into every forked child, which would make
+    # all clients draw the same sequence of delays.
+    rng = np.random.default_rng()
+
+    for _ in range(settings['N_CYCLES']):
+        # Sample a delay until the client starts
+        t_start = int(rng.integers(0, settings['CLIENTS_MAX_DELAY']))
+        time.sleep(t_start)
+        fl_client = Client(conf)
+        try:
+            time.sleep(online_for)
+        finally:
+            # Disconnect even if the wait is interrupted
+            fl_client.disconnect()
+
+
+if __name__ == '__main__':
+
+    # One independent process per simulated client
+    online_for = settings['CLIENTS_ONLINE_FOR_SECONDS']
+    processes = []
+    for idx in range(settings['N_CLIENTS']):
+        worker = Process(target=run_client, args=(online_for, f'client{idx}'))
+        processes.append(worker)
+        worker.start()
+
+    # Block until every client process has exited
+    for worker in processes:
+        worker.join()
diff --git a/examples/async-clients/run_experiment.py b/examples/async-clients/run_experiment.py
@@ -0,0 +1,34 @@
+import time
+import uuid
+
+from fedn import APIClient
+
+DISCOVER_HOST = '127.0.0.1'
+DISCOVER_PORT = 8092
+# API client used below to start sessions and poll their status
+client = APIClient(DISCOVER_HOST, DISCOVER_PORT)
+
+if __name__ == '__main__':
+
+    # Run six sessions, each with 100 rounds.
+    num_sessions = 6
+    for _ in range(num_sessions):
+
+        # A fresh UUID per session so each one can be polled by its own id
+        session_config = {
+            "helper": "numpyhelper",
+            "id": str(uuid.uuid4()),
+            "aggregator": "fedopt",
+            "round_timeout": 20,
+            "rounds": 100,
+            "validate": False,
+        }
+
+        session = client.start_session(**session_config)
+        if session['success'] is False:
+            print(session['message'])
+            # Report the failure with a non-zero exit status; raising
+            # SystemExit also avoids relying on the site-provided exit().
+            raise SystemExit(1)
+
+        print("Started session: {}".format(session))
+
+        # Wait for session to finish
+        while not client.session_is_finished(session_config['id']):
+            time.sleep(2)