-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathconfig.ini
116 lines (99 loc) · 2.33 KB
/
config.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
[base]
; Shared endpoints: the es, hbase, redis and mongo keys all point at the same
; host address. Despite the "_url" suffix, only es_url is a full URL; the
; other three hold a bare host address and take their port from the matching
; "_port" key.
es_url = http://10.30.89.124:9200/
hbase_url = 10.30.89.124
redis_url = 10.30.89.124
mongo_url = 10.30.89.124
redis_port = 6379
hbase_port = 9090
; NOTE(review): [mongo].url uses port 27013 while this value is 27011 --
; confirm the two are meant to differ.
mongo_port = 27011
mongo_db = zhihu_new
[recall]
; Recall settings. The es/hbase/redis endpoint values below are identical to
; the ones in [base].
es_url = http://10.30.89.124:9200/
index_name = articles
hbase_url = 10.30.89.124
redis_url = 10.30.89.124
redis_port = 6379
hbase_port = 9090
; Per-field recall counts -- presumably how many candidates are fetched for
; each field; verify against the consumer.
title_recall_nums = 10
summary_recall_nums = 10
content_recall_nums = 3
text_recall_nums = 60
; Same value as index_name above.
default_index_name = articles
; Relative directory path, trailing slash included.
vector_dir = recall/vector_data/
; NOTE(review): the value is not a filesystem-looking path; presumably a model
; identifier resolved by the loader -- confirm.
bert_model_path = bert-base-chinese
[sampler]
; Sizing and data location for the sampler. The three counts are presumably
; the number of users, the maximum searches per user and the number of test
; rows -- confirm against the consumer.
user_nums = 100000
user_search_max_nums = 200
test_data_nums = 50000
; Relative directory path, trailing slash included.
data_path = dataset/data/
[mongo]
; MongoDB connection URL, database, collection and batch size.
name = load data
; NOTE(review): port 27013 here differs from mongo_port = 27011 in [base] --
; confirm which one is current.
url = mongodb://10.30.89.124:27013/
db = zhihu_new
collection = articles
batch_size = 64
[document_hbase]
; HBase host/port and table name, presumably for document features -- confirm.
name = noname
host = 10.30.89.124
port = 9090
; NOTE(review): this table ends in "test4" while [document_feature_api],
; [hbase_to_csv] and [hbase_to_hive] use document_features_test3 -- confirm
; the difference is intended.
h_table_name = document_features_test4
; NOTE(review): possibly meant "consumers" (a worker count); the key name is
; left unchanged because readers look it up by this spelling -- confirm.
num_customers = 4
[search_info_hbase]
; HBase host/port and table name paired with a search-information CSV file.
; Whether the CSV is the input or the output is not visible here.
host = 10.30.89.124
port = 9090
; Relative file path.
data_path = data/search_information.csv
h_table_name = searchinfo_features_test1
[user_hbase]
; HBase host/port and table name paired with a user-data CSV file.
; Whether the CSV is the input or the output is not visible here.
host = 10.30.89.124
port = 9090
; Relative file path.
data_path = data/user_data.csv
h_table_name = user_features_test1
[document_feature_api]
; Host, port and table name for the document feature API. Keys are listed
; port-first here; the other sections list host first.
port = 9090
host = 10.30.89.124
; Same table name as in [hbase_to_csv] and [hbase_to_hive].
table_name = document_features_test3
[hbase_to_csv]
; Export settings: source table, host/port, batch size and output file.
table_name = document_features_test3
host = 10.30.89.124
port = 9090
batch_size = 64
output_file_path = document_features.txt
; Comma-separated list of "prefix:name" fields, one per line (presumably
; HBase family:qualifier columns -- confirm).
; The continuation lines are indented on purpose: at column 0, a parser that
; accepts ":" as a key/value delimiter (e.g. Python configparser) reads each
; line as a separate "author" / "comment" / "document" key, so field_name
; would keep only its first entry and the repeated keys would be rejected in
; strict mode. Assumes the consumer supports indented continuation lines --
; TODO confirm.
field_name = author:avatar_url,
    author:description,
    author:gender,
    author:headline,
    author:id,
    author:is_advertiser,
    author:name,
    author:url,
    author:url_token,
    author:user_type,
    comment:avatar_url_list,
    comment:comment_count,
    comment:content_list,
    comment:created_time_list,
    comment:name_list,
    comment:url_token_list,
    comment:vote_count_list,
    comment:voteup_count,
    document:clean_content,
    document:clean_content_vector,
    document:created,
    document:entity,
    document:excerpt,
    document:excerpt_vector,
    document:has_column,
    document:id,
    document:image_url,
    document:title,
    document:title_vector,
    document:tokens,
    document:top5words,
    document:type,
    document:updated
[hbase_to_hive]
; Source table, queue name, batch size and host.
; NOTE(review): there is no port key here, unlike the other HBase-related
; sections (which use 9090) -- confirm the consumer supplies a default.
table_name = document_features_test3
queue = queue
batch_size = 64
host = 10.30.89.124
; NOTE(review): possibly meant "consumers" (a worker count); the key name is
; left unchanged because readers look it up by this spelling -- confirm.
num_customers = 6