use exchange from mysql and neo4j (#805)
izhuxiaoqing authored Oct 15, 2021
1 parent c91846d commit 7ad29c6
Showing 2 changed files with 77 additions and 82 deletions.
78 changes: 39 additions & 39 deletions docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-mysql.md
@@ -52,31 +52,31 @@ This example is done on macOS. Here is the environment configuration information:

- Hardware specifications:
- CPU: 1.7 GHz Quad-Core Intel Core i7
- - memory: 16 GB
+ - Memory: 16 GB

- - Spark: 2.4.7, Stand-alone
+ - Spark: 2.4.7, stand-alone

- - Hadoop: 2.9.2, Pseudo-distributed deployment
+ - Hadoop: 2.9.2, pseudo-distributed deployment

- MySQL: 8.0.23

- - Nebula Graph: {{nebula.release}} ([Deploy Nebula Graph with Docker Compose](../../4.deployment-and-installation/2.compile-and-install-nebula-graph/3.deploy-nebula-graph-with-docker-compose.md))
+ - Nebula Graph: {{nebula.release}}. [Deploy Nebula Graph with Docker Compose](../../4.deployment-and-installation/2.compile-and-install-nebula-graph/3.deploy-nebula-graph-with-docker-compose.md).

## Prerequisites

Before importing data, you need to confirm the following information:

- Nebula Graph has been [installed](../../4.deployment-and-installation/2.compile-and-install-nebula-graph/2.install-nebula-graph-by-rpm-or-deb.md) and deployed with the following information:

- - IP address and port of Graph and Meta services.
+ - IP addresses and ports of Graph and Meta services.

- - User name and password with Nebula Graph write permission.
+ - The user name and password with write permission to Nebula Graph.

- Exchange has been [compiled](../ex-ug-compile.md), or the compiled `.jar` file has been [downloaded](https://repo1.maven.org/maven2/com/vesoft/nebula-exchange/) directly.

- Spark has been installed.

- - Learn about the Schema created in Nebula Graph, including Tag and Edge type names, properties, and more.
+ - Learn about the Schema created in Nebula Graph, including names and properties of Tags and Edge types, and more.

- The Hadoop service has been installed and started.
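
To double-check the prerequisites above, you can run a quick sanity check such as the sketch below. It assumes Hadoop and Spark are installed on the local machine, that `SPARK_HOME` is set, and that the JDK's `jps` tool is on the `PATH`; adjust it to your own environment.

```bash
# Rough sanity check of the prerequisites (illustrative only).
jps                                        # A pseudo-distributed Hadoop should list NameNode, DataNode, and so on.
${SPARK_HOME}/bin/spark-submit --version   # Should report the installed Spark version (2.4.7 in this example).
```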

@@ -88,7 +88,7 @@ Analyze the data to create a Schema in Nebula Graph by following these steps:

1. Identify the Schema elements. The Schema elements in the Nebula Graph are shown in the following table.

- | Element | name | property |
+ | Element | Name | Property |
| :--- | :--- | :--- |
| Tag | `player` | `name string, age int` |
| Tag | `team` | `name string` |
@@ -98,33 +98,33 @@ Analyze the data to create a Schema in Nebula Graph by following these steps:
2. Create a graph space **basketballplayer** in the Nebula Graph and create a Schema as shown below.

```ngql
- ## create graph space
+ ## Create a graph space.
nebula> CREATE SPACE basketballplayer \
(partition_num = 10, \
replica_factor = 1, \
vid_type = FIXED_STRING(30));
- ## use the graph space basketballplayer
+ ## Use the graph space basketballplayer.
nebula> USE basketballplayer;
- ## create Tag player
+ ## Create the Tag player.
nebula> CREATE TAG player(name string, age int);
- ## create Tag team
+ ## Create the Tag team.
nebula> CREATE TAG team(name string);
- ## create Edge type follow
+ ## Create the Edge type follow.
nebula> CREATE EDGE follow(degree int);
- ## create Edge type serve
+ ## Create the Edge type serve.
nebula> CREATE EDGE serve(start_year int, end_year int);
```
For more information, see [Quick start workflow](../../2.quick-start/1.quick-start-workflow.md).
- ### Step 2: Modify configuration file
+ ### Step 2: Modify configuration files
- After Exchange is compiled, copy the conf file `target/classes/application.conf` settings MySQL data source configuration. In this case, the copied file is called `mysql_application.conf`. For details on each configuration item, see [Parameters in the configuration file](../parameter-reference/ex-ug-parameter.md).
+ After Exchange is compiled, copy the conf file `target/classes/application.conf` to set MySQL data source configuration. In this case, the copied file is called `mysql_application.conf`. For details on each configuration item, see [Parameters in the configuration file](../parameter-reference/ex-ug-parameter.md).
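
As a concrete illustration of the copy step, a minimal sketch is shown below. It assumes Exchange was compiled under `/root/nebula-spark-utils/nebula-exchange`, the same path used in the commands in Step 3; adjust the path if your layout differs.

```bash
# Copy the template configuration and edit the copy for the MySQL data source.
cd /root/nebula-spark-utils/nebula-exchange
cp target/classes/application.conf target/classes/mysql_application.conf
```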
```conf
{
@@ -145,7 +145,7 @@
# Nebula Graph configuration
nebula: {
address:{
- # Specify the IP addresses and ports for Graph and all Meta services.
+ # Specify the IP addresses and ports for Graph and Meta services.
# If there are multiple addresses, the format is "ip1:port","ip2:port","ip3:port".
# Addresses are separated by commas.
graph:["127.0.0.1:9669"]
@@ -172,16 +172,16 @@
timeout: 1000
}
}
- # Processing vertex
+ # Processing vertexes
tags: [
- # Set information about Tag player.
+ # Set the information about the Tag player.
{
# The Tag name in Nebula Graph.
name: player
type: {
- # Specify the data source file format, set to MySQL.
+ # Specify the data source file format to MySQL.
source: mysql
- # Specifies how to import the data into Nebula Graph: Client or SST.
+ # Specify how to import the data into Nebula Graph: Client or SST.
sink: client
}
@@ -199,18 +199,18 @@
fields: [age,name]
nebula.fields: [age,name]
- # Specify a column of data in the table as the source of vertex VID in the Nebula Graph.
+ # Specify a column of data in the table as the source of VIDs in the Nebula Graph.
vertex: {
field:playerid
}
- # Number of pieces of data written to Nebula Graph in a single batch.
+ # The number of data written to Nebula Graph in a single batch.
batch: 256
- # Number of Spark partitions
+ # The number of Spark partitions.
partition: 32
}
- # Set Tag Team information.
+ # Set the information about the Tag Team.
{
name: team
type: {
@@ -237,18 +237,19 @@
]
- # Processing edge
+ # Processing edges
edges: [
- # Set information about Edge Type follow
+ # Set the information about the Edge Type follow.
{
# The corresponding Edge Type name in Nebula Graph.
name: follow
type: {
- # Specify the data source file format, set to MySQL.
+ # Specify the data source file format to MySQL.
source: mysql
- # Specifies how to import the data into Nebula Graph: Client or SST.
+ # Specify how to import the Edge type data into Nebula Graph.
+ # Specify how to import the data into Nebula Graph: Client or SST.
sink: client
}
@@ -260,31 +260,30 @@
password:"123456"
sentence:"select src_player,dst_player,degree from basketball.follow order by src_player;"
- # Specify the column names in the follow table in Fields, and their corresponding values are specified as properties in the Nebula Graph.
+ # Specify the column names in the follow table in fields, and their corresponding values are specified as properties in the Nebula Graph.
# The sequence of fields and nebula.fields must correspond to each other.
# If multiple column names need to be specified, separate them by commas.
fields: [degree]
nebula.fields: [degree]
- # In source, use a column in the follow table as the source of the edge's starting vertex.
+ # In source, use a column in the follow table as the source of the edge's source vertex.
+ # In target, use a column in the follow table as the source of the edge's destination vertex.
source: {
field: src_player
}
- # In target, use a column in the follow table as the source of the edge's destination vertex.
target: {
field: dst_player
}
- # Number of pieces of data written to Nebula Graph in a single batch.
+ # The number of data written to Nebula Graph in a single batch.
batch: 256
- # Number of Spark partitions
+ # The number of Spark partitions.
partition: 32
}
- # Set information about Edge Type serve
+ # Set the information about the Edge Type serve.
{
name: serve
type: {
@@ -326,17 +326,17 @@

JAR packages are available in two ways: [compile them yourself](../ex-ug-compile.md), or [download](https://repo1.maven.org/maven2/com/vesoft/nebula-exchange/) the compiled `.jar` file directly.
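
If you download the JAR instead of compiling it, the command might look like the sketch below. The path layout under the Maven repository and the version placeholder are assumptions; browse the repository page linked above and substitute an actual released version.

```bash
# Hypothetical download of a released Exchange JAR; replace {{exchange.release}} with a real version number.
wget https://repo1.maven.org/maven2/com/vesoft/nebula-exchange/{{exchange.release}}/nebula-exchange-{{exchange.release}}.jar
```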

- Example:
+ For example:

```bash
${SPARK_HOME}/bin/spark-submit --master "local" --class com.vesoft.nebula.exchange.Exchange /root/nebula-spark-utils/nebula-exchange/target/nebula-exchange-{{exchange.release}}.jar -c /root/nebula-spark-utils/nebula-exchange/target/classes/mysql_application.conf
```

You can search for `batchSuccess.<tag_name/edge_name>` in the command output to check the number of successes. For example, `batchSuccess.follow: 300`.
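
One way to capture those counters, assuming you save the command output to a log file, is sketched below; it simply reruns the command above and filters the saved output.

```bash
# Illustrative only: save the spark-submit output and filter for the success counters.
${SPARK_HOME}/bin/spark-submit --master "local" --class com.vesoft.nebula.exchange.Exchange \
    /root/nebula-spark-utils/nebula-exchange/target/nebula-exchange-{{exchange.release}}.jar \
    -c /root/nebula-spark-utils/nebula-exchange/target/classes/mysql_application.conf 2>&1 | tee exchange.log
grep "batchSuccess" exchange.log
```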

- ### Step 4: (optional) Validation data
+ ### Step 4: (optional) Validate data

- Users can verify that data has been imported by executing a query in the Nebula Graph client (for example, Nebula Graph Studio). Such as:
+ Users can verify that data has been imported by executing a query in the Nebula Graph client (for example, Nebula Graph Studio). For example:

```ngql
GO FROM "player100" OVER follow;
