(incubator-graphar-testing) branch main updated: change import config file (#27)

weibin Wed, 30 Oct 2024 16:36:22 -0700

This is an automated email from the ASF dual-hosted git repository.

weibin pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/incubator-graphar-testing.git



The following commit(s) were added to refs/heads/main by this push:
     new 955596c  change import config file (#27)
955596c is described below

commit 955596c325ceba7b607e285738e3dd0ce4ff424e
Author: Liu Jiajun <[email protected]>
AuthorDate: Thu Oct 31 07:26:16 2024 +0800

    change import config file (#27)
    
    * add import config file
    
    * change import  config file
---
 neo4j/data/import.full.json | 214 --------------------------------------------
 neo4j/data/import.full.yml  | 138 ++++++++++++++++++++++++++++
 neo4j/data/import.mini.json | 130 ---------------------------
 neo4j/data/import.mini.yml  |  71 +++++++++++++++
 4 files changed, 209 insertions(+), 344 deletions(-)

diff --git a/neo4j/data/import.full.json b/neo4j/data/import.full.json
deleted file mode 100644
index 479c508..0000000
--- a/neo4j/data/import.full.json
+++ /dev/null
@@ -1,214 +0,0 @@
-{
-    "graphar": {
-        "path": "/workspaces/incubator-graphar/graphar/movie",
-        "name": "MovieGraph",
-        "vertex_chunk_size": 100,
-        "edge_chunk_size": 1024,
-        "file_type": "parquet",
-        "adj_list_type": "ordered_by_source",
-        "validate_level": "weak",
-        "version": "gar/v1"
-    },
-    "import_schema": {
-        "vertices": [
-            {
-                "type": "Person",
-                "labels": [
-                    "Person"
-                ],
-                "chunk_size": 100,
-                "validate_level": "no",
-                "prefix": "vertex/Person/",
-                "property_groups": [
-                    {
-                        "file_type": "parquet",
-                        "properties": [
-                            {
-                                "name": "name",
-                                "data_type": "string",
-                                "is_primary": true,
-                                "nullable": false
-                            },
-                            {
-                                "name": "born",
-                                "data_type": "int64",
-                                "is_primary": false,
-                                "nullable": true
-                            }
-                        ]
-                    }
-                ],
-                "sources": [
-                    {
-                        "file_type": "parquet",
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person.parquet",
-                        "columns": {
-                            "name": "name",
-                            "born": "born"
-                        }
-                    }
-                ]
-            },
-            {
-                "type": "Movie",
-                "labels": [
-                    "Movie"
-                ],
-                "chunk_size": 100,
-                "validate_level": "no",
-                "prefix": "vertex/Movie/",
-                "property_groups": [
-                    {
-                        "file_type": "parquet",
-                        "properties": [
-                            {
-                                "name": "title",
-                                "data_type": "string",
-                                "is_primary": true,
-                                "nullable": false
-                            },
-                            {
-                                "name": "tagline",
-                                "data_type": "string",
-                                "is_primary": false,
-                                "nullable": true
-                            }
-                        ]
-                    }
-                ],
-                "sources": [
-                    {
-                        "file_type": "orc",
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Movie.orc",
-                        "columns": {
-                            "title": "title",
-                            "tagline": "tagline"
-                        }
-                    }
-                ]
-            }
-        ],
-        "edges": [
-            {
-                "edge_type": "WROTE",
-                "src_type": "Person",
-                "src_prop": "name",
-                "dst_type": "Movie",
-                "dst_prop": "title",
-                "chunk_size": 1024,
-                "validate_level": "no",
-                "prefix": "edge/Person_WROTE_Movie/",
-                "adj_lists": [
-                    {
-                        "ordered": true,
-                        "aligned_by": "src",
-                        "file_type": "parquet"
-                    },
-                    {
-                        "ordered": true,
-                        "aligned_by": "dst",
-                        "file_type": "parquet"
-                    }
-                ],
-                "sources": [
-                    {
-                        "file_type": "csv",
-                        "delimiter": ",",
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person_WROTE_Movie.csv",
-                        "columns": {
-                            "name": "name",
-                            "title": "title"
-                        }
-                    }
-                ]
-            },
-            {
-                "edge_type": "ACTED_IN",
-                "src_type": "Person",
-                "src_prop": "name",
-                "dst_type": "Movie",
-                "dst_prop": "title",
-                "validate_level": "no",
-                "chunk_size": 1024,
-                "prefix": "edge/Person_ACTED_IN_Movie/",
-                "adj_lists": [
-                    {
-                        "ordered": true,
-                        "aligned_by": "src",
-                        "file_type": "parquet"
-                    },
-                    {
-                        "ordered": true,
-                        "aligned_by": "dst",
-                        "file_type": "parquet"
-                    }
-                ],
-                "sources": [
-                    {
-                        "file_type": "json",
-                        "delimiter": ",",
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person_ACTED_IN_Movie.json",
-                        "columns": {
-                            "name": "name",
-                            "title": "title"
-                        }
-                    }
-                ]
-            },
-            {
-                "edge_type": "REVIEWED",
-                "src_type": "Person",
-                "src_prop": "name",
-                "dst_type": "Movie",
-                "dst_prop": "title",
-                "chunk_size": 1024,
-                "validate_level": "no",
-                "prefix": "edge/Person_REVIEWED_Movie/",
-                "property_groups": [
-                    {
-                        "file_type": "parquet",
-                        "properties": [
-                            {
-                                "name": "rating",
-                                "data_type": "int64",
-                                "is_primary": false,
-                                "nullable": true
-                            },
-                            {
-                                "name": "summary",
-                                "data_type": "string",
-                                "is_primary": false,
-                                "nullable": true
-                            }
-                        ]
-                    }
-                ],
-                "adj_lists": [
-                    {
-                        "ordered": true,
-                        "aligned_by": "src",
-                        "file_type": "parquet"
-                    },
-                    {
-                        "ordered": true,
-                        "aligned_by": "dst",
-                        "file_type": "parquet"
-                    }
-                ],
-                "sources": [
-                    {
-                        "file_type": "csv",
-                        "delimiter": ",",
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person_REVIEWED_Movie.csv",
-                        "columns": {
-                            "name": "name",
-                            "title": "title",
-                            "summary": "summary",
-                            "rating": "rating"
-                        }
-                    }
-                ]
-            }
-        ]
-    }
-}
\ No newline at end of file
diff --git a/neo4j/data/import.full.yml b/neo4j/data/import.full.yml
new file mode 100644
index 0000000..a4dbd71
--- /dev/null
+++ b/neo4j/data/import.full.yml
@@ -0,0 +1,138 @@
+graphar:                                              # Global configuration of imported data
+  path: /tmp/graphar/movie                            # (Required) Path to the graphar directory
+  name: MovieGraph                                    # (Required) Name of the graph
+  vertex_chunk_size: 100                              # Number of vertices per chunk
+  edge_chunk_size: 1024                               # Number of edges per chunk
+  file_type: parquet                                  # Default file type for vertices and edges, can be "parquet", "orc", "csv", "json"
+  adj_list_type: ordered_by_source                    # Default adjacency list type, can be "ordered_by_source", "ordered_by_dest", "unordered_by_source", "unordered_by_dest"
+  validate_level: weak                                # Default validation level for vertices and edges, can be "no", "weak", "strong"
+  version: gar/v1                                     # Version of the graphar schema
+
+import_schema:
+  vertices:
+    - type: Person
+      labels:
+        - Person
+      chunk_size: 100
+      validate_level: "no"
+      prefix: vertex/Person/
+      property_groups:
+        - file_type: parquet
+          properties:
+            - name: name
+              data_type: string
+              is_primary: true
+              nullable: false
+            - name: born
+              data_type: int64
+              is_primary: false
+              nullable: true
+      sources:
+        - file_type: parquet
+          path: ../testing/neo4j/data/Person.parquet
+          columns:
+            name: name
+            born: born
+    - type: Movie
+      labels:
+        - Movie
+      chunk_size: 100
+      validate_level: "no"
+      prefix: vertex/Movie/
+      property_groups:
+        - file_type: parquet
+          properties:
+            - name: title
+              data_type: string
+              is_primary: true
+              nullable: false
+            - name: tagline
+              data_type: string
+              is_primary: false
+              nullable: true
+      sources:
+        - file_type: orc
+          path: ../testing/neo4j/data/Movie.orc
+          columns:
+            title: title
+            tagline: tagline
+  edges:
+    - edge_type: WROTE
+      src_type: Person
+      src_prop: name
+      dst_type: Movie
+      dst_prop: title
+      chunk_size: 1024
+      validate_level: "no"
+      prefix: edge/Person_WROTE_Movie/
+      adj_lists:
+        - ordered: true
+          aligned_by: src
+          file_type: parquet
+        - ordered: true
+          aligned_by: dst
+          file_type: parquet
+      sources:
+        - file_type: csv
+          delimiter: ","
+          path: ../testing/neo4j/data/Person_WROTE_Movie.csv
+          columns:
+            name: name
+            title: title
+    - edge_type: ACTED_IN
+      src_type: Person
+      src_prop: name
+      dst_type: Movie
+      dst_prop: title
+      validate_level: "no"
+      chunk_size: 1024
+      prefix: edge/Person_ACTED_IN_Movie/
+      adj_lists:
+        - ordered: true
+          aligned_by: src
+          file_type: parquet
+        - ordered: true
+          aligned_by: dst
+          file_type: parquet
+      sources:
+        - file_type: json
+          delimiter: ","    # will be ignored
+          path: ../testing/neo4j/data/Person_ACTED_IN_Movie.json
+          columns:
+            name: name
+            title: title
+    - edge_type: REVIEWED
+      src_type: Person
+      src_prop: name
+      dst_type: Movie
+      dst_prop: title
+      chunk_size: 1024
+      validate_level: "no"
+      prefix: edge/Person_REVIEWED_Movie/
+      property_groups:
+        - file_type: parquet
+          properties:
+            - name: rating
+              data_type: int64
+              is_primary: false
+              nullable: true
+            - name: summary
+              data_type: string
+              is_primary: false
+              nullable: true
+      adj_lists:
+        - ordered: true
+          aligned_by: src
+          file_type: parquet
+        - ordered: true
+          aligned_by: dst
+          file_type: parquet
+      sources:
+        - file_type: csv
+          delimiter: ","
+          path: ../testing/neo4j/data/Person_REVIEWED_Movie.csv
+          columns:
+            name: name
+            title: title
+            summary: summary
+            rating: rating
diff --git a/neo4j/data/import.mini.json b/neo4j/data/import.mini.json
deleted file mode 100644
index 8d85c77..0000000
--- a/neo4j/data/import.mini.json
+++ /dev/null
@@ -1,130 +0,0 @@
-{
-    "graphar": {
-        "path": "/workspaces/incubator-graphar/graphar/movie",
-        "name": "MovieGraph"
-    },
-    "import_schema": {
-        "vertices": [
-            {
-                "type": "Person",
-                "property_groups": [
-                    {
-                        "properties": [
-                            {
-                                "name": "name",
-                                "data_type": "string",
-                                "is_primary": true
-                            },
-                            {
-                                "name": "born",
-                                "data_type": "int64"
-                            }
-                        ]
-                    }
-                ],
-                "sources": [
-                    {
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person.parquet",
-                        "columns": {
-                            "name": "name",
-                            "born": "born"
-                        }
-                    }
-                ]
-            },
-            {
-                "type": "Movie",
-                "property_groups": [
-                    {
-                        "properties": [
-                            {
-                                "name": "title",
-                                "data_type": "string",
-                                "is_primary": true
-                            },
-                            {
-                                "name": "tagline",
-                                "data_type": "string"
-                            }
-                        ]
-                    }
-                ],
-                "sources": [
-                    {
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Movie.orc",
-                        "columns": {
-                            "title": "title",
-                            "tagline": "tagline"
-                        }
-                    }
-                ]
-            }
-        ],
-        "edges": [
-            {
-                "edge_type": "WROTE",
-                "src_type": "Person",
-                "src_prop": "name",
-                "dst_type": "Movie",
-                "dst_prop": "title",
-                "sources": [
-                    {
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person_WROTE_Movie.csv",
-                        "columns": {
-                            "name": "name",
-                            "title": "title"
-                        }
-                    }
-                ]
-            },
-            {
-                "edge_type": "ACTED_IN",
-                "src_type": "Person",
-                "src_prop": "name",
-                "dst_type": "Movie",
-                "dst_prop": "title",
-                "sources": [
-                    {
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person_ACTED_IN_Movie.csv",
-                        "columns": {
-                            "name": "name",
-                            "title": "title"
-                        }
-                    }
-                ]
-            },
-            {
-                "edge_type": "REVIEWED",
-                "src_type": "Person",
-                "src_prop": "name",
-                "dst_type": "Movie",
-                "dst_prop": "title",
-                "property_groups": [
-                    {
-                        "properties": [
-                            {
-                                "name": "rating",
-                                "data_type": "int64"
-                            },
-                            {
-                                "name": "summary",
-                                "data_type": "string"
-                            }
-                        ]
-                    }
-                ],
-                "sources": [
-                    {
-                        "path": "/workspaces/incubator-graphar/testing/neo4j/data/Person_REVIEWED_Movie.csv",
-                        "columns": {
-                            "name": "name",
-                            "title": "title",
-                            "summary": "summary",
-                            "rating": "rating"
-                        }
-                    }
-                ]
-            }
-        ]
-    }
-}
\ No newline at end of file
diff --git a/neo4j/data/import.mini.yml b/neo4j/data/import.mini.yml
new file mode 100644
index 0000000..86cf92f
--- /dev/null
+++ b/neo4j/data/import.mini.yml
@@ -0,0 +1,71 @@
+graphar:
+  path: /tmp/graphar/movie
+  name: MovieGraph
+
+import_schema:
+  vertices:
+    - type: Person
+      property_groups:
+        - properties:
+            - name: name
+              data_type: string
+              is_primary: true
+            - name: born
+              data_type: int64
+      sources:
+        - path: ../testing/neo4j/data/Person.parquet
+          columns:
+            name: name
+            born: born
+    - type: Movie
+      property_groups:
+        - properties:
+            - name: title
+              data_type: string
+              is_primary: true
+            - name: tagline
+              data_type: string
+      sources:
+        - path: ../testing/neo4j/data/Movie.orc
+          columns:
+            title: title
+            tagline: tagline
+  edges:
+    - edge_type: WROTE
+      src_type: Person
+      src_prop: name
+      dst_type: Movie
+      dst_prop: title
+      sources:
+        - path: ../testing/neo4j/data/Person_WROTE_Movie.csv
+          columns:
+            name: name
+            title: title
+    - edge_type: ACTED_IN
+      src_type: Person
+      src_prop: name
+      dst_type: Movie
+      dst_prop: title
+      sources:
+        - path: ../testing/neo4j/data/Person_ACTED_IN_Movie.json
+          columns:
+            name: name
+            title: title
+    - edge_type: REVIEWED
+      src_type: Person
+      src_prop: name
+      dst_type: Movie
+      dst_prop: title
+      property_groups:
+        - properties:
+          - name: rating
+            data_type: int64
+          - name: summary
+            data_type: string
+      sources:
+        - path: ../testing/neo4j/data/Person_REVIEWED_Movie.csv
+          columns:
+            name: name
+            title: title
+            summary: summary
+            rating: rating


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

(incubator-graphar-testing) branch main updated: change import config file (#27)

Reply via email to