
Commit

Merge pull request #43 from FederatedAI/develop
v1.2.0
huttuh authored Feb 21, 2020
2 parents 9d0347d + 1dc25d4 commit 299c79a
Showing 267 changed files with 6,761 additions and 7,950 deletions.
18 changes: 18 additions & 0 deletions .gitignore
@@ -0,0 +1,18 @@
# common file patterns
.DS_STORE
.idea
*.iml
*.pyc
__pycache__
*.jar
*.class
.project
*.prefs

# excluded paths
/fate-serving/federatedml/target/
/fate-serving/serving-server/target/
/fate-serving/target/
/fate-serving/fate-serving-core/target/
.idea/*
.vscode/*
186 changes: 2 additions & 184 deletions README.md
@@ -4,203 +4,21 @@

## Introduction

FATE-Serving is a high-performance, industrialized serving system for federated learning models, designed for production environments. For more details, see the [WIKI](https://github.com/FederatedAI/FATE-Serving/wiki).

### FATE-Serving now supports

- High-performance online federated learning algorithms.
- A federated learning online inference pipeline.
- Dynamic loading of federated learning models.
- Serving multiple models, or multiple versions of the same model.
- A/B testing of experimental models.
- Real-time inference using federated learning models.
- Multi-level caching of remote-party federated inference results.
- Pre-processing, post-processing, and data-access adapters for production deployment.
- Service management for the gRPC interface, using ZooKeeper as the registry (optional).
- Persistence of model publish requests to local files, so published models are reloaded automatically when the application restarts.



## Federated Learning Online Inference Pipeline

![fate_serving_online_pipeline](./images/fate_serving_online_pipeline.png)



## Architecture

![fate_serving_arch](./images/fate_serving_arch.png)



## Deploy

The preparations are as follows:

1. serving-server relies on Redis, so Redis must be installed in advance.
2. All modules run in the JVM, so Java must be installed in advance.
3. Decide whether the service governance feature is required; it can be enabled in the configuration file, and if it is enabled, ZooKeeper must be installed in advance.

The ordinary deployment architecture is shown in the graph below. If you use this pattern, the IP addresses of each module must be configured manually in the configuration file.

![fate_serving_arch](./images/noZk.png)





If you want to use service management, the deployment architecture is shown here:

![fate_serving_arch](./images/useZk.png)


- serving-server: the federated learning online inference service, based on gRPC
- serving-router: routes requests to serving-server or to another party; its function is similar to the Proxy module in FATE
- Zookeeper: works as the registry center



### The data in ZooKeeper







### serving-server.properties
Key configuration item description:

| Configuration item | Configuration item meaning | Configuration item value |
| - | - | - |
| ip | listen address for FATE-Serving | default 0.0.0.0 |
| port | listen port for the grpc server of FATE-Serving | default 8000 |
| workMode | the work mode of FATE-Flow | 0 for standalone, 1 for cluster |
| inferenceWorkerThreadNum | inference worker num for async inference | default 10 |
| standaloneStoragePath | the storage path of standalone EggRoll | generally is PYTHONPATH/data |
| remoteModelInferenceResultCacheSwitch | switch of remote model inference result cache storage | default true |
| proxy | the address of proxy | custom configuration |
| roll | the address of roll | custom configuration |
| OnlineDataAccessAdapter | data access adapter class for obtaining host feature data | default TestFile, which reads host feature data from ``host_data.csv`` in the serving-server root directory |
| InferencePostProcessingAdapter| inference post-processing adapter class for dealing result after model inference | default PassPostProcessing |
| InferencePreProcessingAdapter | inference pre-processing adapter class for dealing guest feature data before model inference | default PassPreProcessing |
| useRegister | Register interface to registry or not | default false |
| useZkRouter | route request by the interface info which is registered into zookeeper | default false |
| zk.url | zookeeper url, e.g. zookeeper://localhost:2181?backup=localhost:2182,localhost:2183 | default zookeeper://localhost:2181 |
| coordinator | The party id for serving | default webank |
| serviceRoleName | The federated roles model name | default serving |
| modelCacheAccessTTL | TTL after last access for the model cache | default 12 |
| modelCacheMaxSize | The maximum size of the model cache | default 50 |
| remoteModelInferenceResultCacheTTL | TTL after last access for the remote model inference result cache | default 300 |
| remoteModelInferenceResultCacheMaxSize | The maximum size of the remote model inference result cache | default 10000 |
| inferenceResultCacheTTL | TTL after last access for the inference result cache | default 30 |
| inferenceResultCacheCacheMaxSize | The maximum size of the inference result cache | default 1000 |
| redis.ip | The redis connection host | default 127.0.0.1 |
| redis.port | Accept redis connections on the specified port | default 6379 |
| redis.password | The redis connection password | default fate_dev |
| redis.timeout | Close the connection after a client is idle for N seconds | default 10 |
| redis.maxTotal | The maximum number of objects that can be allocated by the pool | default 100 |
| redis.maxIdle | The maximum number of "idle" instances that can be held in the pool, or a negative value if there is no limit | default 100 |
| external.remoteModelInferenceResultCacheTTL | TTL after last access for the remote model inference result cache in the external cache | default 86400 |
| external.remoteModelInferenceResultCacheDBIndex | The redis DB index for the external remote model inference result cache | default 0 |
| external.inferenceResultCacheTTL | TTL after last access for the inference result cache in the external cache | default 300 |
| external.inferenceResultCacheDBIndex | The redis DB index for the external inference result cache | default 0 |
| external.processCacheDBIndex | The redis DB index for the external process cache | default 0 |
| canCacheRetcode | Cache results with these return codes | default 0,102 |
| acl.username | Zookeeper acl authentication user name | |
| acl.password | Zookeeper acl authentication user password | |
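To make the table concrete, here is a small sketch that reads a few of these keys with `java.util.Properties`. The key names and defaults come from the table above; the server's actual configuration loader may differ, and the file path is assumed to be relative to the unzipped serving-server directory.

```java
import java.io.FileInputStream;
import java.util.Properties;

public class ServingConfigPeek {
    public static void main(String[] args) throws Exception {
        Properties p = new Properties();
        // Assumed location: conf/ under the unzipped serving-server directory.
        try (FileInputStream in = new FileInputStream("conf/serving-server.properties")) {
            p.load(in);
        }
        // Defaults mirror the table above.
        String ip = p.getProperty("ip", "0.0.0.0");
        int port = Integer.parseInt(p.getProperty("port", "8000"));
        boolean useZkRouter = Boolean.parseBoolean(p.getProperty("useZkRouter", "false"));
        System.out.printf("listen %s:%d, zk routing: %b%n", ip, port, useZkRouter);
    }
}
```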

### proxy.properties
Key configuration item description:

| Configuration item | Configuration item meaning | Configuration item value |
| - | - | - |
| ip | listen address for FATE-Serving-Router | default 0.0.0.0 |
| port | listen port for the FATE-Serving-Router | default 9370 |
| coordinator | The party id for serving | default webank |
| zk.url | zookeeper url, same as serving configuration | default zookeeper://localhost:2181 |
| useRegister | Register interface to registry or not | default false |
| useZkRouter | route request by the interface info which is registered into zookeeper | default false |
| route.table | router table configuration file absolute path | default /data/projects/fate/serving-router/conf/route_table.json |
| acl.username | Zookeeper acl authentication user name | |
| acl.password | Zookeeper acl authentication user password | |

### Deploy Serving-Server
Here are the key steps:

1. `git clone https://github.com/FederatedAI/FATE-Serving.git`
2. `cd FATE-Serving`
3. `mvn clean package`
4. Copy `serving-server/target/fate-serving-server-1.1.2-release.zip` to your deploy location and unzip it.
5. Modify the configuration file `conf/serving-server.properties` according to your own requirements.
6. Confirm that Java is installed; you can check with the `java -version` command.
7. `sh service.sh restart`




### Deploy Serving-Router

Here are the key steps:

1. Same as serving-server deploy steps 1-3; if they have already been executed, you can skip them.
2. Copy `router/target/fate-serving-router-1.1.2-release.zip` to your deploy location and unzip it.
3. Modify the configuration files `conf/proxy.properties` and `conf/route_table.json` according to your own requirements.
4. Confirm that Java is installed; you can check with the `java -version` command.
5. `sh service.sh restart`










## Usage
FATE-Serving provides model publishing and online inference APIs.

### Publish Model

Please use the FATE-Flow Client included in fate-flow; refer to the **Online Inference** guide at [fate_flow_readme](https://github.com/FederatedAI/FATE/blob/master/fate_flow/README.md).



### Inference

Serving currently supports three inference-related interfaces, all using the gRPC protocol.

- inference: initiate an inference request and get the result
- startInferenceJob: initiate an inference request task without getting the result
- getInferenceResult: get the result of an inference by caseid

Please refer to this script for inference; a rough client sketch follows.
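As an illustration of calling the `inference` interface, here is a minimal Java client sketch. The stub and message class names (`InferenceServiceGrpc`, `InferenceMessage`), the service id, and the JSON request layout are assumptions based on typical FATE-Serving clients rather than a copy of the referenced script; take the exact names from the generated proto classes in your build.

```java
import com.google.protobuf.ByteString;
import io.grpc.ManagedChannel;
import io.grpc.ManagedChannelBuilder;

public class InferenceClientSketch {
    public static void main(String[] args) throws Exception {
        // Assumed serving-server address; matches the ip/port defaults
        // in serving-server.properties.
        ManagedChannel channel = ManagedChannelBuilder
                .forAddress("127.0.0.1", 8000)
                .usePlaintext()
                .build();

        // InferenceServiceGrpc / InferenceMessage are assumed generated
        // proto classes; check your build for the exact names.
        InferenceServiceGrpc.InferenceServiceBlockingStub stub =
                InferenceServiceGrpc.newBlockingStub(channel);

        // The request body is JSON: a head with routing info and a body
        // with guest features plus ids forwarded to the host for lookup.
        String json = "{"
                + "\"head\":{\"serviceId\":\"my-service-id\"},"
                + "\"body\":{"
                +   "\"featureData\":{\"x0\":1.0,\"x1\":0.5},"
                +   "\"sendToRemoteFeatureData\":{\"device_id\":\"8910\"}"
                + "}}";
        InferenceMessage request = InferenceMessage.newBuilder()
                .setBody(ByteString.copyFromUtf8(json))
                .build();

        // Blocking unary call; startInferenceJob and getInferenceResult
        // use the same message shape.
        InferenceMessage response = stub.inference(request);
        System.out.println(response.getBody().toStringUtf8());
        channel.shutdown();
    }
}
```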



### Adapter

Serving supports pre-processing, post-processing and data-access adapters for actual production deployments.

- pre-processing: data pre-processing before model computation
- post-processing: data post-processing after model computation
- data-access: fetching features from the party's own system

At the current stage, you need to add your Java code and recompile; dynamically loading adapter jars from a release will be supported later.

For now:

- put your pre-processing and post-processing adapter code under fate-serving/serving-server/src/main/java/com/webank/ai/fate/serving/adapter/processing and modify the InferencePreProcessingAdapter/InferencePostProcessingAdapter configuration parameters.
- put your data-access adapter code under fate-serving/serving-server/src/main/java/com/webank/ai/fate/serving/adapter/dataaccess and modify the OnlineDataAccessAdapter configuration parameters.

Please refer to the PassPostProcessing, PassPreProcessing and TestFile adapters.
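As a hedged sketch of what a data-access adapter can look like — the class name, method signature, and lookup key below are illustrative assumptions, so copy the real interface from the TestFile source before implementing:

```java
import java.util.HashMap;
import java.util.Map;

// Illustrative only: the real adapter interface lives under
// com.webank.ai.fate.serving.adapter.dataaccess (see TestFile for the
// actual signature); this class mirrors its likely shape.
public class FeatureStoreAdapterSketch {

    /**
     * Fetch host-side features for the ids the guest sent along with the
     * inference request. A production adapter would query the party's own
     * feature system (HTTP service, HBase, Redis, ...) here.
     */
    public Map<String, Object> getData(Map<String, Object> featureIds) {
        Map<String, Object> features = new HashMap<>();
        // "device_id" is an assumed lookup key; the values are placeholders.
        Object deviceId = featureIds.get("device_id");
        features.put("x0", 1.0);
        features.put("x1", 0.5);
        return features;
    }
}
```

After recompiling serving-server with the new class, point the OnlineDataAccessAdapter configuration parameter at it.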



### Remote party multi-level cache

For federated learning, a single inference must be computed by multiple parties. In production environments the parties are deployed in different IDCs, so network communication between them is one of the bottlenecks.

Therefore, FATE-Serving can cache remote-party model inference results on the initiator, but it never caches feature data. The cache is controlled by the remoteModelInferenceResultCacheSwitch option in the configuration.
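Below is a minimal sketch of the lookup order such a multi-level cache implies — an in-process cache first, then an external Redis — using the TTL and size defaults from serving-server.properties. It is an illustration of the idea, not FATE-Serving's actual cache code.

```java
import com.google.common.cache.Cache;
import com.google.common.cache.CacheBuilder;
import redis.clients.jedis.Jedis;

import java.util.concurrent.TimeUnit;

public class RemoteResultCacheSketch {
    // Level 1: in-process cache, sized and expired like
    // remoteModelInferenceResultCacheMaxSize / ...CacheTTL.
    private final Cache<String, String> local = CacheBuilder.newBuilder()
            .maximumSize(10_000)
            .expireAfterAccess(300, TimeUnit.SECONDS)
            .build();

    // Level 2: external Redis cache (redis.ip / redis.port).
    private final Jedis redis = new Jedis("127.0.0.1", 6379);

    public String get(String caseId) {
        String hit = local.getIfPresent(caseId);
        if (hit != null) {
            return hit;                    // level-1 hit: no network hop
        }
        String remote = redis.get(caseId); // level-2 hit: local Redis only
        if (remote != null) {
            local.put(caseId, remote);     // promote into the in-process cache
        }
        return remote;                     // null: fall through to the federated call
    }

    public void put(String caseId, String resultJson) {
        local.put(caseId, resultJson);
        // external.remoteModelInferenceResultCacheTTL default is 86400 s.
        redis.setex(caseId, 86_400, resultJson);
    }
}
```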
7 changes: 7 additions & 0 deletions RELEASE.md
@@ -1,8 +1,15 @@
# Release 1.2.0
## Major Features and Improvements
* Replace serving-router with a brand new service called serving-proxy, which supports authentication and inference requests over HTTP or gRPC
* Decouple FATE-Serving and Eggroll; models are now read directly from FATE-Flow
* Fixed a bug in fetching the remote inference result cache

# Release 1.1.2
## Major Features and Improvements
* Using metrics components and providing monitoring through JMX
* Host supports binding the gRPC interface with model information and registering it in ZooKeeper, and supports routing to different instances through model information.
* Guest adds a gRPC interface for model binding: a model can be bound to a service id and registered in ZooKeeper, so callers can route to different instances through the service id. The service id is specified by fate_flow and uniquely identifies a model.

# Release 1.1.1
## Major Features and Improvements
* Support indicating partial columns in Onehot Encoder
75 changes: 75 additions & 0 deletions bin/common.sh
@@ -0,0 +1,75 @@
#!/bin/bash
set -e
# Resolve the running pid for ${module} from ./bin/${module}.pid; if the
# recorded process is no longer alive, remove the stale pid file.
getpid() {
    if [ -e "./bin/${module}.pid" ]; then
        pid=$(cat ./bin/${module}.pid)
    fi
    if [[ -n ${pid} ]]; then
        count=$(ps -ef | grep $pid | grep -v "grep" | wc -l)
        if [[ ${count} -eq 0 ]]; then
            rm ./bin/${module}.pid
            unset pid
        fi
    fi
}

# Create the logs directory on first start.
mklogsdir() {
    if [[ ! -d "logs" ]]; then
        mkdir logs
    fi
}

# Launch the module in the background, record its pid, and verify it came up.
start() {
    echo "try to start ${module}"
    getpid
    if [[ ! -n ${pid} ]]; then
        mklogsdir
        if [[ ! -e "fate-${module}.jar" ]]; then
            ln -s fate-${module}-${module_version}.jar fate-${module}.jar
        fi
        if [ ${module} = "serving-server" ]; then
            java -cp "conf/:lib/*:fate-${module}.jar" ${main_class} -c conf/${module}.properties >>logs/console.log 2>>logs/error.log &
        elif [ ${module} = "serving-proxy" ]; then
            java -Dspring.config.location=${configpath}/application.properties -cp "conf/:lib/*:fate-${module}.jar" ${main_class} -c conf/application.properties >>logs/console.log 2>>logs/error.log &
        else
            echo "usage: ${module} {serving-server|serving-proxy}"
        fi
        sleep 5
        id=$(ps -p $! | awk '{print $1}' | sed -n '2p')
        if [[ ${#id} -ne 0 ]]; then
            echo $! >./bin/${module}.pid
            getpid
            echo "service start successfully. pid: ${pid}"
        else
            echo "service start failed"
        fi
    else
        echo "service already started. pid: ${pid}"
    fi
}

# Report whether the module is running; exit 0 if up, 1 otherwise.
status() {
    getpid
    if [[ -n ${pid} ]]; then
        echo "status: $(ps -f -p ${pid})"
        exit 0
    else
        echo "service not running"
        exit 1
    fi
}

# Stop the process recorded in the pid file.
stop() {
    getpid
    if [[ -n ${pid} ]]; then
        echo "killing: $(ps -p ${pid})"
        kill ${pid}
        if [[ $? -eq 0 ]]; then
            echo "killed"
        else
            echo "kill error"
        fi
    else
        echo "service not running"
    fi
}
serving-server.properties
@@ -13,15 +13,10 @@
# See the License for the specific language governing permissions and
# limitations under the License.
#
coordinator=webank
ip=127.0.0.1
port=8000
workMode=0
serviceRoleName=serving
inferenceWorkerThreadNum=10
#storage
# maybe python/data/
standaloneStoragePath=
# cache
remoteModelInferenceResultCacheSwitch=true
# in-process cache
@@ -45,7 +40,6 @@ external.inferenceResultCacheDBIndex=0
canCacheRetcode=0,102
external.processCacheDBIndex=0
# federation
party.id=9999
# adapter
OnlineDataAccessAdapter=TestFile
InferencePostProcessingAdapter=PassPostProcessing
@@ -57,5 +51,3 @@ roll=127.0.0.1:8011
zk.url=zookeeper://localhost:2181
useRegister=false
useZkRouter=false
useJMX=true
jmx.server.name=JMXServer
16 changes: 16 additions & 0 deletions fate-metrics-api/pom.xml
@@ -0,0 +1,16 @@
<?xml version="1.0" encoding="UTF-8"?>

<project xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xmlns="http://maven.apache.org/POM/4.0.0"
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
<parent>
<artifactId>fate-serving</artifactId>
<groupId>com.webank.ai.fate</groupId>
<version>${fate.version}</version>
</parent>
<modelVersion>4.0.0</modelVersion>

<artifactId>fate-metrics-api</artifactId>
<packaging>jar</packaging>

</project>
