From 4df578ee525d39e98118f2c43bbd37d275b371ec Mon Sep 17 00:00:00 2001
From: Jin Hanyu <48324756+Hanyu-Jin@users.noreply.github.com>
Date: Mon, 22 Aug 2022 23:46:08 +0800
Subject: [PATCH] Enable FL Server in SGX (#5396)

* add assembly

* Enable FL Sever in SGX

* Change the url in tutorial.md

* Add start-fl-server.py to Docker Image

* rm ppml-assebly.xml

* Add start-python-fl-server-sgx.sh to Docker Image

* Put start-fl-server.py into assembly

* Update 3.1.2 Start FL Server in SGX in pytorch-nn-lr-tutorial.md

* Change the location of start-fl-server.py

* Correct the path in start-python-fl-server-sgx.sh

* Delete -r in cp command

Co-authored-by: Jiaming <litchy233@gmail.com>
---
 .../python/docker-graphene/Dockerfile         |  4 +-
 .../start-python-fl-server-sgx.sh             | 25 ++++++++
 .../pytorch_nn_lr/pytorch-nn-lr-tutorial.md   | 18 ++----
 .../example/pytorch_nn_lr/pytorch_nn_lr_1.py  |  2 +-
 .../example/pytorch_nn_lr/pytorch_nn_lr_2.py  |  2 +-
 python/ppml/scripts/ppml-conf.yaml            |  9 +++
 python/ppml/scripts/setup-env.sh              |  5 ++
 python/ppml/scripts/start-fgboost-server.py   | 23 +++++++
 python/ppml/scripts/start-fl-server.py        | 62 +++++++++++++++++++
 python/ppml/src/bigdl/ppml/fl/nn/fl_server.py |  6 +-
 .../nn/generated/fgboost_service_pb2_grpc.py  | 16 +++--
 .../fl/nn/generated/psi_service_pb2_grpc.py   |  7 +--
 scala/assembly/src/main/assembly/assembly.xml |  8 +++
 13 files changed, 156 insertions(+), 31 deletions(-)
 create mode 100644 ppml/trusted-big-data-ml/python/docker-graphene/start-scripts/start-python-fl-server-sgx.sh
 create mode 100644 python/ppml/scripts/ppml-conf.yaml
 create mode 100644 python/ppml/scripts/setup-env.sh
 create mode 100644 python/ppml/scripts/start-fgboost-server.py
 create mode 100644 python/ppml/scripts/start-fl-server.py

diff --git a/ppml/trusted-big-data-ml/python/docker-graphene/Dockerfile b/ppml/trusted-big-data-ml/python/docker-graphene/Dockerfile
index 91ed7406db4..72c6ef44654 100644
--- a/ppml/trusted-big-data-ml/python/docker-graphene/Dockerfile
+++ b/ppml/trusted-big-data-ml/python/docker-graphene/Dockerfile
@@ -165,7 +165,8 @@ RUN apt-get update --fix-missing && \
 RUN wget https://raw.githubusercontent.com/intel-analytics/analytics-zoo/bigdl-2.0/docker/hyperzoo/download-bigdl.sh && \
     chmod a+x ./download-bigdl.sh
 RUN ./download-bigdl.sh && \
-    rm bigdl*.zip
+    rm bigdl*.zip && \
+    cp ${BIGDL_HOME}/python/start-fl-server.py /ppml/trusted-big-data-ml/fl
 
 # stage.4 ppml
 FROM ubuntu:20.04
@@ -323,3 +324,4 @@ ADD azure /ppml/trusted-big-data-ml/azure
 WORKDIR /ppml/trusted-big-data-ml
 
 ENTRYPOINT [ "/opt/entrypoint.sh" ]
+
diff --git a/ppml/trusted-big-data-ml/python/docker-graphene/start-scripts/start-python-fl-server-sgx.sh b/ppml/trusted-big-data-ml/python/docker-graphene/start-scripts/start-python-fl-server-sgx.sh
new file mode 100644
index 00000000000..b03f5edea42
--- /dev/null
+++ b/ppml/trusted-big-data-ml/python/docker-graphene/start-scripts/start-python-fl-server-sgx.sh
@@ -0,0 +1,25 @@
+#!/bin/bash
+
+port=8980
+client_num=2
+
+while getopts "p:c:" opt
+do
+    case $opt in
+        p)
+            port=$OPTARG
+        ;;
+        c)
+            client_num=$OPTARG
+        ;;
+    esac
+done
+cd /ppml/trusted-big-data-ml
+/graphene/Tools/argv_serializer bash -c " /opt/jdk8/bin/java\
+        -cp '/ppml/trusted-big-data-ml/work/spark-3.1.2/conf/:/ppml/trusted-big-data-ml/work/spark-3.1.2/jars/*'\
+        -Xmx10g org.apache.spark.deploy.SparkSubmit\
+        --master 'local[4]'\
+        /ppml/trusted-big-data-ml/fl/start-fl-server.py -p $port -c $client_num" > /ppml/trusted-big-data-ml/secured-argvs
+./init.sh
+SGX=1 ./pal_loader bash 2>&1 | tee fl-server-sgx.log
+
diff --git a/python/ppml/example/pytorch_nn_lr/pytorch-nn-lr-tutorial.md b/python/ppml/example/pytorch_nn_lr/pytorch-nn-lr-tutorial.md
index 9637378635a..86a6c844da0 100644
--- a/python/ppml/example/pytorch_nn_lr/pytorch-nn-lr-tutorial.md
+++ b/python/ppml/example/pytorch_nn_lr/pytorch-nn-lr-tutorial.md
@@ -96,20 +96,14 @@ result = ppl.predict(x)
 ## 3 Run FGBoost
 FL Server is required before running any federated applications. Check [Start FL Server]() section for details.
 ### 3.1 Start FL Server in SGX
-// TODO: add this section after running FL Server in SGX succesfully in this example.
-
-Modify the config file `ppml-conf.yaml`
-```yaml
-# the port server gRPC uses
-serverPort: 8980
-
-# the number of clients in this federated learning application
-clientNum: 2
-```
-Then start the FL Server
+#### 3.1.1 Start the container
+Before running FL Server in SGX, please prepaer keys and start the BigDL PPML container first. Check  [3.1 BigDL PPML Hello World](https://github.com/intel-analytics/BigDL/tree/main/ppml#31-bigdl-ppml-hello-world) for details.
+#### 3.1.2 Run FL Server in SGX
+You can run FL Server in SGX with the following command:
 ```bash
-python BigDL/python/ppml/src/bigdl/ppml/fl/nn/fl_server.py
+bash start-python-fl-server-sgx.sh -p 8980 -c 2
 ```
+You can set port with `-p` and set client number with `-c`  while the default settings are `port=8980` and `client-num=2`.
 ### 3.2 Start FGBoost Clients
 Modify the config file `ppml-conf.yaml`
 ```yaml
diff --git a/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_1.py b/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_1.py
index b69522174c9..98b7a4aa446 100644
--- a/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_1.py
+++ b/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_1.py
@@ -52,7 +52,7 @@ def forward(self, x: List[Tensor]):
     # fl_server = FLServer(2)
     # fl_server.build()
     # fl_server.start()
-    df_train = pd.read_csv('./python/ppml/example/pytorch_nn_lr/data/diabetes-vfl-1.csv')    
+    df_train = pd.read_csv('.data/diabetes-vfl-1.csv')    
     
     # this should wait for the merge of 2 FLServer (Py4J Java gRPC and Python gRPC)
     # df_train['ID'] = df_train['ID'].astype(str)
diff --git a/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_2.py b/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_2.py
index e3aa9c2dc29..f8b4004a3ab 100644
--- a/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_2.py
+++ b/python/ppml/example/pytorch_nn_lr/pytorch_nn_lr_2.py
@@ -35,7 +35,7 @@ def forward(self, x):
 
 
 if __name__ == '__main__':
-    df_train = pd.read_csv('./python/ppml/example/pytorch_nn_lr/data/diabetes-vfl-2.csv')
+    df_train = pd.read_csv('.data/diabetes-vfl-2.csv')
 
     # this should wait for the merge of 2 FLServer (Py4J Java gRPC and Python gRPC)
     # df_train['ID'] = df_train['ID'].astype(str)
diff --git a/python/ppml/scripts/ppml-conf.yaml b/python/ppml/scripts/ppml-conf.yaml
new file mode 100644
index 00000000000..4b6113fbe1d
--- /dev/null
+++ b/python/ppml/scripts/ppml-conf.yaml
@@ -0,0 +1,9 @@
+##### Server property
+# clientNum: 2
+# privateKeyFilePath: /ppml/trusted-big-data-ml/work/keys/server.pem
+# certChainFilePath:  /ppml/trusted-big-data-ml/work/keys/server.crt
+# serverPort:
+
+##### Client property
+# clientTarget:
+# taskID:
diff --git a/python/ppml/scripts/setup-env.sh b/python/ppml/scripts/setup-env.sh
new file mode 100644
index 00000000000..31491792774
--- /dev/null
+++ b/python/ppml/scripts/setup-env.sh
@@ -0,0 +1,5 @@
+PYTHON_ZIP=$(find lib -name *-python-api.zip)
+JAR=$(find lib -name *-jar-with-dependencies.jar)
+export PYTHONPATH=$PYTHONPATH:$(pwd)/$PYTHON_ZIP
+export PYTHONPATH=$PYTHONPATH:$(pwd)/$PYTHON_ZIP/bigdl/ppml/fl/nn/generated
+export BIGDL_CLASSPATH=$JAR
\ No newline at end of file
diff --git a/python/ppml/scripts/start-fgboost-server.py b/python/ppml/scripts/start-fgboost-server.py
new file mode 100644
index 00000000000..3d69a108ea9
--- /dev/null
+++ b/python/ppml/scripts/start-fgboost-server.py
@@ -0,0 +1,23 @@
+#
+# Copyright 2016 The BigDL Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+from bigdl.ppml.fl.fl_server import FLServer
+
+if __name__ == '__main__':
+    fl_server = FLServer()
+    fl_server.build()
+    fl_server.start()
+    fl_server.wait_for_termination()
\ No newline at end of file
diff --git a/python/ppml/scripts/start-fl-server.py b/python/ppml/scripts/start-fl-server.py
new file mode 100644
index 00000000000..c72ac47ec34
--- /dev/null
+++ b/python/ppml/scripts/start-fl-server.py
@@ -0,0 +1,62 @@
+#
+# Copyright 2016 The BigDL Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import sys
+import os
+import fnmatch
+import getopt
+
+for files in os.listdir('/ppml/trusted-big-data-ml/work/bigdl-2.1.0-SNAPSHOT/python/'):
+    if fnmatch.fnmatch(files, 'bigdl-ppml-*-python-api.zip'):
+        sys.path.append('/ppml/trusted-big-data-ml/work/bigdl-2.1.0-SNAPSHOT/python/' + files)
+        sys.path.append('/ppml/trusted-big-data-ml/work/bigdl-2.1.0-SNAPSHOT/python/' + files + '/bigdl/ppml/fl/nn/generated')
+
+if '/usr/lib/python3.6' in sys.path:
+    sys.path.remove('/usr/lib/python3.6')
+if '/usr/lib/python3.6/lib-dynload' in sys.path:
+    sys.path.remove('/usr/lib/python3.6/lib-dynload')
+if '/usr/local/lib/python3.6/dist-packages' in sys.path:
+    sys.path.remove('/usr/local/lib/python3.6/dist-packages')
+if '/usr/lib/python3/dist-packages' in sys.path:
+    sys.path.remove('/usr/lib/python3/dist-packages')
+
+from bigdl.ppml.fl.nn.fl_server import FLServer
+
+if __name__ == '__main__':
+
+    client_num = 2
+    port = 8980
+    
+    try:
+        opts, args = getopt.getopt(sys.argv[1:], "hc:p:", ["client-num=", "port="])
+    except getopt.GetoptError:
+        print("start_fl_server.py -c <client-num> -p <port>")
+        sys.exit(2)
+    
+    for opt, arg in opts:
+        if opt == '-h':
+            print("start_fl_server.py -c <client-num> -p <port>")
+        elif opt in ("-c", "--client-num"):
+            client_num = arg
+        elif opt in ("-p", "--port"):
+            port = arg
+
+    fl_server = FLServer(client_num)
+    fl_server.set_port(port)
+    fl_server.build()
+    fl_server.start()
+
+    fl_server.wait_for_termination()
diff --git a/python/ppml/src/bigdl/ppml/fl/nn/fl_server.py b/python/ppml/src/bigdl/ppml/fl/nn/fl_server.py
index 18bd70b0b17..a62a2a7962e 100644
--- a/python/ppml/src/bigdl/ppml/fl/nn/fl_server.py
+++ b/python/ppml/src/bigdl/ppml/fl/nn/fl_server.py
@@ -20,13 +20,13 @@
 from bigdl.ppml.fl.nn.generated.nn_service_pb2_grpc import *
 from bigdl.ppml.fl.nn.nn_service import NNServiceImpl
 import yaml
-
+import logging
 
 
 class FLServer(object):
     def __init__(self, client_num=1):
         self.server = grpc.server(futures.ThreadPoolExecutor(max_workers=5))
-        self.port = 8980 # TODO: set from config file
+        self.port = 8980
         self.client_num = client_num
         self.secure = False
         self.load_config()
@@ -79,4 +79,4 @@ def wait_for_termination(self):
     fl_server = FLServer(2)
     fl_server.build()
     fl_server.start()
-    fl_server.wait_for_termination()
\ No newline at end of file
+    fl_server.wait_for_termination()
diff --git a/python/ppml/src/bigdl/ppml/fl/nn/generated/fgboost_service_pb2_grpc.py b/python/ppml/src/bigdl/ppml/fl/nn/generated/fgboost_service_pb2_grpc.py
index 7c8546245b5..ddfcf12c06c 100644
--- a/python/ppml/src/bigdl/ppml/fl/nn/generated/fgboost_service_pb2_grpc.py
+++ b/python/ppml/src/bigdl/ppml/fl/nn/generated/fgboost_service_pb2_grpc.py
@@ -3,8 +3,6 @@
 import grpc
 
 import fgboost_service_pb2 as fgboost__service__pb2
-from bigdl.dllib.utils.log4Error import invalidInputError
-
 
 class FGBoostServiceStub(object):
     """Missing associated documentation comment in .proto file."""
@@ -59,43 +57,43 @@ def uploadLabel(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def downloadLabel(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def split(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def register(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def uploadTreeLeaf(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def evaluate(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def predict(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
 
 def add_FGBoostServiceServicer_to_server(servicer, server):
diff --git a/python/ppml/src/bigdl/ppml/fl/nn/generated/psi_service_pb2_grpc.py b/python/ppml/src/bigdl/ppml/fl/nn/generated/psi_service_pb2_grpc.py
index 226393cba35..9916c0356fb 100644
--- a/python/ppml/src/bigdl/ppml/fl/nn/generated/psi_service_pb2_grpc.py
+++ b/python/ppml/src/bigdl/ppml/fl/nn/generated/psi_service_pb2_grpc.py
@@ -3,7 +3,6 @@
 import grpc
 
 import psi_service_pb2 as psi__service__pb2
-from bigdl.dllib.utils.log4Error import invalidInputError
 
 
 class PSIServiceStub(object):
@@ -40,19 +39,19 @@ def getSalt(self, request, context):
         """
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def uploadSet(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
     def downloadIntersection(self, request, context):
         """Missing associated documentation comment in .proto file."""
         context.set_code(grpc.StatusCode.UNIMPLEMENTED)
         context.set_details('Method not implemented!')
-        invalidInputError(False, 'Method not implemented!')
+        raise NotImplementedError('Method not implemented!')
 
 
 def add_PSIServiceServicer_to_server(servicer, server):
diff --git a/scala/assembly/src/main/assembly/assembly.xml b/scala/assembly/src/main/assembly/assembly.xml
index 8ba18cc45cc..c229c50fc7c 100644
--- a/scala/assembly/src/main/assembly/assembly.xml
+++ b/scala/assembly/src/main/assembly/assembly.xml
@@ -148,6 +148,13 @@
           <include>bigdl-ppml*-jar-with-dependencies.jar</include>
       </includes>
     </fileSet>
+    <fileSet>
+      <outputDirectory>/python</outputDirectory>
+      <directory>${project.parent.basedir}/../../../../../python/ppml/scripts</directory>
+      <includes>
+          <include>start-fl-server.py</include>
+      </includes>
+    </fileSet>
   </fileSets>
   <dependencySets>
     <dependencySet>
@@ -176,3 +183,4 @@
     </dependencySet>
   </dependencySets>
 </assembly>
+