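# YAML import-job configuration (sections: client, manager, log, sources).
# NOTE(review): the layout matches a NebulaGraph Importer config - confirm.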
# Connection settings for the graph database client.
client:
  version: v3
  # Comma-separated list of host:port endpoints.
  address: "172.16.20.2:9669,172.16.20.4:9669,172.16.20.5:9669"
  user: root
  # Quoted so that an all-digit password is always read as a string, not an integer.
  # NOTE(review): a root credential is hard-coded in this file; consider injecting it
  # from a secret store or environment at deploy time and rotating this value.
  password: "123456"
  concurrencyPerAddress: 10
  reconnectInitialInterval: 1s
  retry: 3
  retryInitialInterval: 1s

# Import job settings: target space, batching, concurrency and pre-import hooks.
manager:
  spaceName: Y24_1206
  batch: 128
  readerConcurrency: 50
  importerConcurrency: 512
  statsInterval: 10s
  hooks:
    before:
      # Statements listed here are part of the "before" hook; `wait` is the
      # pause configured alongside them.
      - statements:
          - |
            USE Y24_1206;
        wait: 10s

# Logging: INFO level, echoed to the console.
log:
  level: INFO
  console: true

# Data sources. Each list item maps one pipe-delimited CSV file (with a header
# row) onto either vertex tags (`tags`) or edges (`edges`).
sources:
# Vertex source: `user` tag from user-0s.csv.
- path: /data/y4/tools/data/user-0s.csv
  csv:
    delimiter: "|"
    withHeader: true
  tags:
    - name: user
      mode: INSERT
      id:
        type: "STRING"
        index: 12  # the id column is used as the VID
      props:
        - name: "friends_count"
          type: "INT"
          index: 0
        - name: "listed_count"
          type: "INT"
          index: 1
        - name: "favourites_count"
          type: "INT"
          index: 2
        - name: "verified"
          type: "STRING"
          index: 3
        - name: "label"
          type: "STRING"
          index: 4
        - name: "platform"
          type: "STRING"
          index: 5
        - name: "url"
          type: "STRING"
          index: 6
        - name: "gather_time"
          type: "STRING"
          index: 7
        - name: "screen_name"
          type: "STRING"
          index: 8
        - name: "followers_count"
          type: "INT"
          index: 9
        - name: "name"
          type: "STRING"
          index: 10
        - name: "standpoint"
          type: "STRING"
          index: 11
        # Column 12 is skipped here because it is the VID column above.
        - name: "position"
          type: "STRING"
          index: 13
        - name: "region"
          type: "STRING"
          index: 14
        - name: "register_location"
          type: "STRING"
          index: 15
        - name: "party"
          type: "STRING"
          index: 16

# Vertex source: `post` tag from post-0s.csv.
- path: /data/y4/tools/data/post-0s.csv
  csv:
    delimiter: "|"
    withHeader: true
  tags:
    - name: post
      mode: INSERT
      id:
        type: "STRING"
        index: 11  # the id column is used as the VID
      props:
        - name: "comment_count"
          type: "INT"
          index: 0
        - name: "author_name"
          type: "STRING"
          index: 1
        - name: "repost_count"
          type: "INT"
          index: 2
        - name: "like_count"
          type: "INT"
          index: 3
        - name: "keywords"
          type: "STRING"
          index: 4
        - name: "platform"
          type: "STRING"
          index: 5
        - name: "url"
          type: "STRING"
          index: 6
        - name: "gather_time"
          type: "STRING"
          index: 7
        - name: "post_relationship"
          type: "STRING"
          index: 8
        - name: "publish_time"
          type: "STRING"
          index: 9
        - name: "root_mid"
          type: "STRING"
          index: 10
        # Column 11 is skipped here because it is the VID column above.
        - name: "author_id"
          type: "STRING"
          index: 12
        - name: "source_task"
          type: "STRING"
          index: 13
        - name: "view_count"
          type: "INT"
          index: 14

# Vertex source: `group` tag from group-0s.csv.
- path: /data/y4/tools/data/group-0s.csv
  csv:
    delimiter: "|"
    withHeader: true
  tags:
    - name: group
      mode: INSERT
      id:
        type: "STRING"
        index: 1  # the id column is used as the VID
      props:
        - name: "name"
          type: "STRING"
          index: 0
        - name: "member_count"
          type: "INT"
          index: 2
        - name: "platform"
          type: "STRING"
          index: 3

# Vertex source: `organization` tag from organization-0s.csv.
- path: /data/y4/tools/data/organization-0s.csv
  csv:
    delimiter: "|"
    withHeader: true
  tags:
    - name: organization
      mode: INSERT
      id:
        type: "STRING"
        index: 2  # the id column is used as the VID
      props:
        - name: "name"
          type: "STRING"
          index: 0
        - name: "industry"
          type: "STRING"
          index: 1
        # NOTE(review): `member_count` is STRING here but INT on the `group` tag;
        # confirm this matches the tag schema in the target space.
        - name: "member_count"
          type: "STRING"
          index: 3
        - name: "platform"
          type: "STRING"
          index: 4

# Vertex source: `task` tag from task-0s.csv.
- path: /data/y4/tools/data/task-0s.csv
  csv:
    delimiter: "|"
    withHeader: true
  tags:
    - name: task
      mode: INSERT
      id:
        type: "STRING"
        index: 2  # the id column is used as the VID
      props:
        - name: "keywords"
          type: "STRING"
          index: 0
        - name: "name"
          type: "STRING"
          index: 1

# Edge data
# Edge source: `user_follow_user` edges from user_follow_user-0.csv.
- path: /data/y4/tools/data/user_follow_user-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: user_follow_user
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `user_follower_user` edges from user_follower_user-0.csv.
- path: /data/y4/tools/data/user_follower_user-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: user_follower_user
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `user_friend_user` edges from user_friend_user-0.csv.
- path: /data/y4/tools/data/user_friend_user-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: user_friend_user
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `user_have_post` edges from user_have_post-0.csv.
- path: /data/y4/tools/data/user_have_post-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: user_have_post
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `post_repost_post` edges from post_repost_post-0.csv.
- path: /data/y4/tools/data/post_repost_post-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: post_repost_post
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `post_cite_post` edges from post_cite_post-0.csv.
- path: /data/y4/tools/data/post_cite_post-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: post_cite_post
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Disabled edge source (kept commented out for reference):
# - path: /data/y4/tools/data/user_post_post-0.csv
#   csv:
#     delimiter: "|"
#     withHeader: true
#   edges:
#     - name: user_post_post
#       mode: INSERT
#       src:
#         id:
#           type: "STRING"
#           index: 2 # src
#       dst:
#         id:
#           type: "STRING"
#           index: 1 # dst
#       props:
#         - name: "extra_prop"
#           type: "STRING"
#           index: 0

# Edge source: `user_comment_user` edges from user_comment_user-0.csv.
- path: /data/y4/tools/data/user_comment_user-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: user_comment_user
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `post_comment_post` edges from post_comment_post-0.csv.
- path: /data/y4/tools/data/post_comment_post-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: post_comment_post
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `post_multicomment_post` edges from post_multicomment_post-0.csv.
- path: /data/y4/tools/data/post_multicomment_post-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: post_multicomment_post
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `user_join_group` edges from user_join_group-0.csv.
- path: /data/y4/tools/data/user_join_group-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: user_join_group
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `group_include_user` edges from group_include_user-0.csv.
- path: /data/y4/tools/data/group_include_user-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: group_include_user
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `user_participate_task` edges from user_participate_task-0.csv.
- path: /data/y4/tools/data/user_participate_task-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: user_participate_task
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `task_include_user` edges from task_include_user-0.csv.
- path: /data/y4/tools/data/task_include_user-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: task_include_user
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `post_in_task` edges from post_in_task-0.csv.
- path: /data/y4/tools/data/post_in_task-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: post_in_task
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `task_include_post` edges from task_include_post-0.csv.
- path: /data/y4/tools/data/task_include_post-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: task_include_post
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Edge source: `organization_include_user` edges from organization_include_user-0.csv.
- path: /data/y4/tools/data/organization_include_user-0.csv
  csv:
    delimiter: "|"
    withHeader: true
  edges:
    - name: organization_include_user
      mode: INSERT
      src:
        id:
          type: "STRING"
          index: 2  # source vertex ID column
      dst:
        id:
          type: "STRING"
          index: 1  # destination vertex ID column
      props:
        - name: "extra_prop"
          type: "STRING"
          index: 0

# Disabled edge source (kept commented out for reference):
# - path: /data/y4/tools/data/user_join_organization-0.csv
#   csv:
#     delimiter: "|"
#     withHeader: true
#   edges:
#     - name: user_join_organization
#       mode: INSERT
#       src:
#         id:
#           type: "STRING"
#           index: 2 # src
#       dst:
#         id:
#           type: "STRING"
#           index: 1 # dst
#       props:
#         - name: "extra_prop"
#           type: "STRING"
#           index: 0