From 17a9fe219ff6f8226cc92d0efa38f0d5c43645aa Mon Sep 17 00:00:00 2001 From: cooper-lzy <78672629+cooper-lzy@users.noreply.github.com> Date: Thu, 10 Aug 2023 10:34:41 +0800 Subject: [PATCH] exchange supports batch update and delete (#2213) --- .../parameter-reference/ex-ug-parameter.md | 3 +++ .../use-exchange/ex-ug-import-from-clickhouse.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-csv.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-hbase.md | 8 ++++++++ .../use-exchange/ex-ug-import-from-hive.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-jdbc.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-json.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-kafka.md | 8 ++++++++ .../use-exchange/ex-ug-import-from-maxcompute.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-mysql.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-neo4j.md | 11 +++++++++++ .../use-exchange/ex-ug-import-from-oracle.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-orc.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-parquet.md | 9 +++++++++ .../use-exchange/ex-ug-import-from-pulsar.md | 8 ++++++++ 15 files changed, 128 insertions(+) diff --git a/docs-2.0/nebula-exchange/parameter-reference/ex-ug-parameter.md b/docs-2.0/nebula-exchange/parameter-reference/ex-ug-parameter.md index 0a4b3c3bc35..2ba04af1988 100644 --- a/docs-2.0/nebula-exchange/parameter-reference/ex-ug-parameter.md +++ b/docs-2.0/nebula-exchange/parameter-reference/ex-ug-parameter.md @@ -98,6 +98,8 @@ For different data sources, the vertex configurations are different. There are m |`tags.name`|string|-|Yes|The tag name defined in NebulaGraph.| |`tags.type.source`|string|-|Yes|Specify a data source. For example, `csv`.| |`tags.type.sink`|string|`client`|Yes|Specify an import method. Optional values are `client` and `SST`.| +|`tags.writeMode`|string|`INSERT`|No|Types of batch operations on data, including batch inserts, updates, and deletes. Optional values are `INSERT`, `UPDATE`, `DELETE`.| +|`tags.deleteEdge`|string|`false`|No|Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `tags.writeMode` is `DELETE`.| |`tags.fields`|list\[string\]|-|Yes|The header or column name of the column corresponding to properties. If there is a header or a column name, please use that name directly. If a CSV file does not have a header, use the form of `[_c0, _c1, _c2]` to represent the first column, the second column, the third column, and so on.| |`tags.nebula.fields`|list\[string\]|-|Yes|Property names defined in NebulaGraph, the order of which must correspond to `tags.fields`. For example, `[_c1, _c2]` corresponds to `[name, age]`, which means that values in the second column are the values of the property `name`, and values in the third column are the values of the property `age`.| |`tags.vertex.field`|string|-|Yes|The column of vertex IDs. For example, when a CSV file has no header, users can use `_c0` to indicate values in the first column are vertex IDs.| @@ -245,6 +247,7 @@ For the specific parameters of different data sources for edge configurations, p |`edges.name`| string|-|Yes|The edge type name defined in NebulaGraph.| |`edges.type.source`|string|-|Yes|The data source of edges. For example, `csv`.| |`edges.type.sink`|string|`client`|Yes|The method specified to import data. Optional values are `client` and `SST`.| +|`edges.writeMode`|string|`INSERT`|No|Types of batch operations on data, including batch inserts, updates, and deletes. Optional values are `INSERT`, `UPDATE`, `DELETE`.| |`edges.fields`|list\[string\]|-|Yes|The header or column name of the column corresponding to properties. If there is a header or column name, please use that name directly. If a CSV file does not have a header, use the form of `[_c0, _c1, _c2]` to represent the first column, the second column, the third column, and so on.| |`edges.nebula.fields`|list\[string\]|-|Yes|Edge names defined in NebulaGraph, the order of which must correspond to `edges.fields`. For example, `[_c2, _c3]` corresponds to `[start_year, end_year]`, which means that values in the third column are the values of the start year, and values in the fourth column are the values of the end year.| |`edges.source.field`|string|-|Yes|The column of source vertices of edges. For example, `_c0` indicates a value in the first column that is used as the source vertex of an edge.| diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-clickhouse.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-clickhouse.md index 8474265621d..d1a0a6fa05c 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-clickhouse.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-clickhouse.md @@ -170,6 +170,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # policy:hash } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -254,6 +260,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-csv.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-csv.md index d45dc35c5a4..77ae084e96f 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-csv.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-csv.md @@ -202,6 +202,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # If the CSV file does not have a header, set the header to false. The default value is false. header: false + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -317,6 +323,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # If the CSV file does not have a header, set the header to false. The default value is false. header: false + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hbase.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hbase.md index 7f0639a2485..ccfd5015cd7 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hbase.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hbase.md @@ -203,6 +203,11 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false # Number of pieces of data written to NebulaGraph in a single batch. batch: 256 @@ -283,6 +288,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hive.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hive.md index b5688e4731b..04055fd5809 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hive.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-hive.md @@ -245,6 +245,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -318,6 +324,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-jdbc.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-jdbc.md index afb903c98d1..83a2ebf0dee 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-jdbc.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-jdbc.md @@ -234,6 +234,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -337,6 +343,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-json.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-json.md index ed511ef024c..d1c907d3b56 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-json.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-json.md @@ -222,6 +222,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -323,6 +329,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-kafka.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-kafka.md index e8fb00f6c75..15d65aa2e90 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-kafka.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-kafka.md @@ -188,6 +188,11 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false # The number of data written to NebulaGraph in a single batch. batch: 10 @@ -254,6 +259,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # # (Optional) Specify a column as the source of the rank. # #ranking: rank + # # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + # #writeMode: INSERT + # # The number of data written to NebulaGraph in a single batch. # batch: 10 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-maxcompute.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-maxcompute.md index e46a337a861..dd07e90f3e7 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-maxcompute.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-maxcompute.md @@ -179,6 +179,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -277,6 +283,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of Spark partitions. partition:10 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-mysql.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-mysql.md index 87732db09c0..bc20dd91377 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-mysql.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-mysql.md @@ -223,6 +223,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -317,6 +323,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-neo4j.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-neo4j.md index da2f3724fcb..8f6afbbb93a 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-neo4j.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-neo4j.md @@ -190,6 +190,13 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # newColName:new-field # } } + + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + partition: 10 batch: 1000 check_point_path: /tmp/test @@ -250,6 +257,10 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } #ranking: rank + + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + partition: 10 batch: 1000 check_point_path: /tmp/test diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-oracle.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-oracle.md index 9fc0a8ab9e7..deb35e76fa4 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-oracle.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-oracle.md @@ -218,6 +218,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -310,6 +316,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-orc.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-orc.md index 191030c067a..ad4fccdbb9e 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-orc.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-orc.md @@ -189,6 +189,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -290,6 +296,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-parquet.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-parquet.md index fd3b73609b3..a7a3bde70c0 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-parquet.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-parquet.md @@ -190,6 +190,12 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false + # The number of data written to NebulaGraph in a single batch. batch: 256 @@ -290,6 +296,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 256 diff --git a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-pulsar.md b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-pulsar.md index ec347253d8f..c58676a2212 100644 --- a/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-pulsar.md +++ b/docs-2.0/nebula-exchange/use-exchange/ex-ug-import-from-pulsar.md @@ -172,6 +172,11 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # } } + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + + # Whether or not to delete the related incoming and outgoing edges of the vertices when performing a batch delete operation. This parameter takes effect when `writeMode` is `DELETE`. + #deleteEdge: false # The number of data written to NebulaGraph in a single batch. batch: 10 @@ -259,6 +264,9 @@ After Exchange is compiled, copy the conf file `target/classes/application.conf` # (Optional) Specify a column as the source of the rank. #ranking: rank + # Batch operation types, including INSERT, UPDATE, and DELETE. defaults to INSERT. + #writeMode: INSERT + # The number of data written to NebulaGraph in a single batch. batch: 10