-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathesmon_install.conf
211 lines (211 loc) · 7.02 KB
/
esmon_install.conf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
#
# Configuration file of ESPerfMon from DDN
#
# This file is automatically generated by esmon_config command. To update this
# file, please run esmon_config command.
#
# Configuration Guide:
#
# 1. agents
# This list includes the information of the ES PERFMON agents.
# Default value: [{'host_id': 'localhost'}]
#
# 1.1 enable_disk
# This option determines whether to collect disk metrics from this agent.
# Default value: False
#
# 1.2 host_id
# This option is the ID of the host. The ID of a host is a unique value to
# identify the host.
#
# 1.3 ime
# This option determines whether to enable IME metrics collection on this
# ES PERFMON agent.
# Default value: False
#
# 1.4 infiniband
# This option determines whether to enable Infiniband metrics collection on this
# ES PERFMON agent.
# Default value: False
#
# 1.5 lustre_mds
# This option determines whether to enable Lustre MDS metrics collection on
# this ES PERFMON agent.
# Default value: True
#
# 1.6 lustre_oss
# This option determines whether to enable Lustre OSS metrics collection on this
# ES PERFMON agent.
# Default value: True
#
# 1.7 sfas
# This list includes the information of SFAs on this ES PERFMON agent.
# Default value: []
#
# 1.7.1 controller0_host
# This option is the hostname/IP of the controller 0 of this SFA.
# Default value: controller0_host
#
# 1.7.2 controller1_host
# This option is the hostname/IP of the controller 1 of this SFA.
# Default value: controller1_host
#
# 1.7.3 name
# This option is the unique name of this controller. This value will be used as
# the value of "fqdn" tag for metrics of this SFA. Thus, two SFAs shouldn't have
# the same name.
#
# 2. agents_reinstall
# This option determines whether to reinstall ESMON agents or not.
# Default value: True
#
# 3. collect_interval
# This option determines the interval seconds to collect datapoint.
# Default value: 60
#
# 4. continuous_query_periods
# This option determines the interval of continuous queries. ES PERFMON uses
# continuous queries of Influxdb to aggregate data. To calculate the interval
# seconds of continuous queries, please multiply this number by the value of
# the "collect_interval" option. If this number is "1", the interval of
# continous queries would be "collect_interval" seconds. Usually, in order to
# downsample the data and reduce performance impact, this value should be
# larger than "1".
# Default value: 4
#
# 5. iso_path
# This option is the path of ES PERFMON ISO.
# Default value: /root/esmon.iso
#
# 6. lustre_default_version
# This option determines the default Lustre version to use, if the Lustre
# RPMs installed on the ES PERFMON agent is not with the supported version.
# Default value: es3
#
# 7. lustre_exp_mdt
# This option determines whether ES PERFMON agents collect exp_md_stats_*
# metrics from Lustre MDT. If there are too many Lustre clients on the system,
# this option should be disabled to avoid performance issues.
# Default value: False
#
# 8. lustre_exp_ost
# This option determines whether ES PERFMON agents collect exp_ost_stats_[read|
# write] metrics from Lustre OST or not. If there are too many Lustre clients on
# the system, this option should be disabled to avoid performance issues.
# Default value: False
#
# 9. server
# This group of options include the information about the ES PERFMON server.
# Default value: {'host_id': 'localhost'}
#
# 9.1 drop_database
# This option determines whether to drop existing ES PERFMON database of
# Influxdb.
# Important: This option should ONLY be set to "True" if the data/metadata in
# ES PERFMON database of Influxdb is not needed any more.
# Default value: False
#
# 9.2 erase_influxdb
# This option determines whether to erase all data and metadata of Influxdb.
# Important: This option should ONLY be set to "True" if the data/metadata of
# Influxdb is not needed any more. When Influxdb is totally
# corrupted, please enable this option to erase and fix. And please
# double check the influxdb_path option is properly configured before
# enabling this option.
# Default value: False
#
# 9.3 host_id
# This option is the ID of the host. The ID of a host is a unique value to
# identify the host.
#
# 9.4 influxdb_path
# This option is Influxdb directory path on ES PERFMON server node.
# Important: Please do not put any other files/directries under this directory of
# ES PERFMON server node, because, with "erase_influxdb" option
# enabled, all of the files/directries under that directory will be
# removed.
# Default value: /esmon/influxdb
#
# 9.5 reinstall
# This option determines whether to reinstall the ES PERFMON server.
# Default value: True
#
# 9.6 auto_open_ports_on_firewall
# This option determines whether ES PERFMON installation process will open
# the ports on monitoring server node automatically or not. If this options is
# enabled, firewall-cmd will be run on the server node to open ports in the
# firewall. If the option is disabled, administrator need to make sure the ports
# are opened or the firewall is disabled, otherwise there might be access failure
# becaused of banned ports (e.g. 3000, 4242, 8086, 8088, 25826).
# Default value: False
#
# 10. ssh_hosts
# This list includes the informations about how to login into the hosts using
# SSH connections.
# Default value: [{'local_host': True, 'host_id': 'localhost', 'hostname': 'localhost'}]
#
# 10.1 host_id
# This option is the ID of the host. The ID of a host is a unique value to
# identify the host.
#
# 10.2 hostname
# This option is the hostname or IP of the host. "ssh" command will use this
# hostname/IP to login into the host. If the host is the ES PERFMON server, this
# hostname/IP will be used as the server host in the write_tsdb plugin of
# ES PERFMON agent.
#
# 10.3 ssh_identity_file
# This option is the SSH key file used when using SSH command to login into
# the host. If the default SSH identity file works, this option can be set to
# "None".
# Default value: None
#
# 10.4 local_host
# This option determines whether this host is local host.
# Default value: False
#
# 11. jobid_var
# This option determines the job ID var used by the file system, which can
# be read by command "lctl get_param jobid_var"
# Default value: unknown
#
agents:
- enable_disk: false
host_id: Agent1
ime: false
infiniband: false
lustre_mds: true
lustre_oss: true
sfas:
- controller0_host: 10.0.0.1
controller1_host: 10.0.0.2
name: SFA1
- controller0_host: 10.0.0.3
controller1_host: 10.0.0.4
name: SFA2
- host_id: Agent2
sfas: []
agents_reinstall: true
collect_interval: 60
continuous_query_periods: 4
iso_path: /root/esmon.iso
jobid_var: unknown
lustre_default_version: es3
lustre_exp_mdt: false
lustre_exp_ost: false
server:
auto_open_ports_on_firewall: false
drop_database: false
erase_influxdb: false
host_id: Server
influxdb_path: /esmon/influxdb
reinstall: true
ssh_hosts:
- host_id: Agent1
hostname: Agent1
local_host: false
ssh_identity_file: None
- host_id: Agent2
hostname: Agent2
- host_id: Server
hostname: Server