author | Mahlon E. Smith <mahlon@martini.nu> |
Mon, 19 Nov 2018 12:05:47 -0800 | |
changeset 17 | 96b8799a565a |
parent 16 | fce5b4150c09 |
child 19 | 1f09cfb560e0 |
permissions | -rw-r--r-- |
8 | 1 |
# vim: set et nosta sw=4 ts=4 : |
0 | 2 |
# |
3 |
# Copyright (c) 2018, Mahlon E. Smith <mahlon@martini.nu> |
|
4 |
# All rights reserved. |
|
5 |
# Redistribution and use in source and binary forms, with or without |
|
6 |
# modification, are permitted provided that the following conditions are met: |
|
7 |
# |
|
8 |
# * Redistributions of source code must retain the above copyright |
|
9 |
# notice, this list of conditions and the following disclaimer. |
|
10 |
# |
|
11 |
# * Redistributions in binary form must reproduce the above copyright |
|
12 |
# notice, this list of conditions and the following disclaimer in the |
|
13 |
# documentation and/or other materials provided with the distribution. |
|
14 |
# |
|
15 |
# * Neither the name of Mahlon E. Smith nor the names of his |
|
16 |
# contributors may be used to endorse or promote products derived |
|
17 |
# from this software without specific prior written permission. |
|
18 |
# |
|
19 |
# THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND ANY |
|
20 |
# EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |
|
21 |
# WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE |
|
22 |
# DISCLAIMED. IN NO EVENT SHALL THE REGENTS AND CONTRIBUTORS BE LIABLE FOR ANY |
|
23 |
# DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |
|
24 |
# (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
|
25 |
# LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |
|
26 |
# ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
|
27 |
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
|
28 |
# SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
29 |
||
30 |
||
31 |
import |
|
32 |
db_postgres, |
|
33 |
json, |
|
5 | 34 |
math, |
0 | 35 |
nativesockets, |
36 |
net, |
|
5 | 37 |
os, |
16 | 38 |
parseopt, |
8 | 39 |
posix, |
0 | 40 |
strutils, |
41 |
tables, |
|
5 | 42 |
terminal, |
8 | 43 |
times |
0 | 44 |
|
45 |
||
46 |
const
    # Release version, printed by -v/--version.
    VERSION = "v0.2.0"

    # Help text printed by -h/--help.  Options that carry a value must have
    # it attached with '=' or ':' (parseopt syntax), so the synopsis spells
    # that out for -t and -T instead of listing them as bare flags.
    USAGE = """
./netdata_tsrelay [-d][-h][-q][-t=MS][-T=TABLE][-v] --dbopts="[PostgreSQL connection string]" --listen-port=14866 --listen-addr=0.0.0.0

  -q: Quiet mode. No output at all. Ignored if -d is supplied.
  -d: Debug: Show incoming and parsed data.
  -v: Display version number.
  -T: Change the destination table name from the default 'netdata'. (-T=TABLE)
  -t: Alter the maximum time (in ms) an open socket waits for data. Default: 500ms. (-t=MS)
  -a: Short form of --listen-addr. (-a=ADDRESS)
  -p: Short form of --listen-port. (-p=PORT)
  -h: Help. You're lookin' at it.

The default connection string is:
  "host=localhost dbname=netdata application_name=netdata-tsrelay"
    """

    # Insert statement template.  '$1' is replaced with the destination
    # table name (strutils `%`); the '?' placeholders are bound per row
    # when the statement is executed.
    INSERT_SQL = """
    INSERT INTO $1
        ( time, host, metrics )
    VALUES
        ( 'epoch'::timestamptz + ? * '1 second'::interval, ?, ? )
    """
|
67 |
||
68 |
||
5 | 69 |
type
    Config = object of RootObj
        # PostgreSQL connection parameters, in libpq format.
        # (See https://www.postgresql.org/docs/current/static/libpq-connect.html)
        dbopts: string

        # Name of the table that samples are written to.
        dbtable: string

        # TCP port to listen on for incoming connections.
        listen_port: int

        # IP address to listen on for incoming connections.
        listen_addr: string

        # Emit informational output.
        verbose: bool

        # Emit raw incoming data as well.
        debug: bool

        # The SQL insert statement, after the table name has been
        # interpolated into it.
        insertsql: string

        # How long to block while waiting on connection data.
        timeout: int


# Program-wide settings.  Assigned from the parsed command line when
# this file is run as the main module.
var conf: Config
|
0 | 82 |
|
9
aa9d537f7067
Properly reap child processes.
Mahlon E. Smith <mahlon@laika.com>
parents:
8
diff
changeset
|
83 |
|
5 | 84 |
proc hl( msg: string, fg: ForegroundColor, bright=false ): string =
    ## Return +msg+ wrapped in the ANSI escape sequence for the +fg+
    ## color (the bright variant when +bright+ is set).  The 'terminal'
    ## module only writes colors to stdout directly, hence this helper.
    ## When stdout is not a tty, +msg+ is returned untouched.
    if isatty( stdout ):
        # Bright foreground codes sit 60 above their normal counterparts.
        let code: BiggestInt = ord( fg ) + ( if bright: 60 else: 0 )
        result = "\e[" & $code & 'm' & msg & "\e[0m"
    else:
        result = msg
|
92 |
||
93 |
||
0 | 94 |
proc fetch_data( client: Socket ): string =
    ## Read line-oriented data from +client+ and return it as one string,
    ## each received line terminated by "\n".
    ##
    ## The Netdata JSON backend doesn't send a length, so lines are read
    ## until the stream stays quiet for conf.timeout milliseconds
    ## (readLine raises TimeoutError), which is taken as the end of a
    ## "sample".  Reading also stops as soon as the peer disconnects.
    var buf = ""
    try:
        while true:
            client.readline( buf, timeout=conf.timeout )

            # readLine() yields an empty string only when the socket has
            # been disconnected (a bare newline comes back as "\r\L").
            # A closed connection never raises TimeoutError, so without
            # this check the loop would spin forever.
            if buf == "": break

            result.add( buf )
            result.add( "\n" )
    except TimeoutError:
        return
0 | 104 |
|
105 |
||
8 | 106 |
proc parse_data( data: string ): seq[ JsonNode ] =
    ## Given a raw +data+ string of newline separated JSON documents,
    ## return a sequence of JSON samples.  Netdata can buffer multiple
    ## samples in one batch, so rows are pivoted by their "timestamp":
    ## each returned object carries "hostname", "timestamp", and one
    ## "<chart_id>.<id>" => value entry per row seen for that timestamp.
    ##
    ## Lines that are empty, unparseable, not a JSON object, or missing
    ## a required key are skipped.
    result = @[]
    if data == "": return

    # Hash of sample timeperiods to pivoted json data
    var pivoted_data = init_table[ BiggestInt, JsonNode ]()

    for sample in split_lines( data ):
        if sample == "": continue
        if conf.debug: echo sample.hl( fgBlack, bright=true )

        var parsed: JsonNode
        try:
            parsed = sample.parse_json
        except JsonParsingError:
            if conf.debug: echo hl( "Unable to parse sample line: " & sample.hl(fgRed, bright=true), fgRed )
            continue

        # Treat a well-formed but non-object line like any other bad
        # line: skip it, rather than throwing away the rows that were
        # already collected from this batch.
        if parsed.kind != JObject: continue

        try:
            # Pull out every required field up front.  A missing key
            # raises before the pivot table is touched, so an incomplete
            # row can never leave a half-populated entry behind.
            let
                stamp    = parsed[ "timestamp" ]
                key      = stamp.get_int
                name     = parsed[ "chart_id" ].get_str & "." & parsed[ "id" ].get_str
                hostname = parsed[ "hostname" ]
                value    = parsed[ "value" ]

            # Create or use existing Json object for modded data.
            var pivot: JsonNode
            if pivoted_data.has_key( key ):
                pivot = pivoted_data[ key ]
            else:
                pivot = newJObject()
                pivoted_data[ key ] = pivot

            pivot[ "hostname" ] = hostname
            pivot[ "timestamp" ] = stamp
            pivot[ name ] = value
        except CatchableError:
            continue

    for timestamp, sample in pivoted_data:
        result.add( sample )
|
0 | 148 |
|
149 |
||
8 | 150 |
proc write_to_database( samples: seq[ JsonNode ] ): void =
    ## Given a sequence of json samples, write them to the database
    ## inside a single transaction, using the connection parameters and
    ## insert statement from the global configuration.
    ##
    ## Each sample's "timestamp" and "hostname" keys are removed from the
    ## node (the caller's JsonNode is modified) and written to their own
    ## columns; the remaining object is stored as the metrics value.
    ## Hostnames are lowercased.  Database errors are reported on stdout
    ## and otherwise ignored; the connection is always closed.
    if samples.len == 0: return

    let db = open( "", "", "", conf.dbopts )

    try:
        db.exec sql( "BEGIN" )
        for sample in samples:
            # A sample without its identifying keys cannot be stored;
            # skip it instead of failing the whole batch.
            if not ( sample.has_key( "timestamp" ) and sample.has_key( "hostname" ) ):
                continue

            let
                timestamp = sample[ "timestamp" ].get_int
                host = sample[ "hostname" ].get_str.to_lowerascii
            sample.delete( "timestamp" )
            sample.delete( "hostname" )
            db.exec sql( conf.insertsql ), timestamp, host, sample
        db.exec sql( "COMMIT" )
    except CatchableError:
        let
            e = getCurrentException()
            msg = getCurrentExceptionMsg()
        echo "Got exception ", repr(e), " while writing to DB: ", msg
    finally:
        # Closing without a COMMIT abandons any open transaction.
        db.close
|
174 |
||
175 |
||
176 |
proc process( client: Socket, address: string ): void =
    ## Handle one connected +client+ (called from the forked child):
    ## read its data, close the socket, parse and store the samples,
    ## and, in verbose mode, print a one line summary that includes
    ## the peer +address+.
    let
        started = cpu_time()
        payload = fetch_data( client )

    # Netdata reconnects on its own, so the socket is released as soon
    # as the read is considered complete, freeing local resources and
    # file descriptors.  Nothing further is done if the close fails.
    try:
        close( client )
    except OSError:
        return

    # Pivot the parsed data to a single JSON blob per sample time.
    let samples = payload.parse_data
    samples.write_to_database

    if not conf.verbose: return

    let
        stamp   = $( epochTime().to_int )
        count   = $( samples.len )
        elapsed = $( round( cpu_time() - started, 3 ) )

    # (Disabled) memory usage report:
    #   " ", hl($(round((get_occupied_mem()/1024/1024),1)), fgWhite, bright=true), "MB memory used."
    echo(
        stamp.hl( fgMagenta, bright=true ),
        " ",
        count.hl( fgWhite, bright=true ),
        " sample(s) parsed from ",
        hl( address, fgYellow, bright=true ),
        " in ", elapsed.hl( fgWhite, bright=true ), " seconds."
    )
|
204 |
||
0 | 205 |
|
8 | 206 |
proc serverloop( conf: Config ): void =
    ## Check that the database is reachable, bind the listening socket
    ## described by +conf+, then accept netdata connections forever,
    ## forking a child process to handle each one.

    # Open and immediately close a connection, purely as a startup test.
    let probe = open( "", "", "", conf.dbopts )
    probe.close
    if conf.verbose:
        echo hl( "Successfully tested connection to the backend database.", fgGreen )

    # Ignore SIGCHLD so that children are properly reaped.
    var child_action: Sigaction
    child_action.sa_handler = SIG_IGN
    discard sigaction( SIGCHLD, child_action )

    # Setup listening socket.
    let server = newSocket()
    set_sock_opt( server, OptReuseAddr, true )
    bind_addr( server, Port(conf.listen_port), conf.listen_addr )
    listen( server )

    if conf.verbose:
        let shown_addr =
            if conf.listen_addr == "0.0.0.0": "*"
            else: conf.listen_addr
        echo(
            hl( "Listening for incoming connections on ", fgGreen, bright=true ),
            shown_addr.hl( fgBlue, bright=true ),
            ":",
            hl( $conf.listen_port, fgBlue, bright=true )
        )
        echo ""

    # Wait for incoming connections, fork for each client.
    while true:
        # Each incoming connection requires its own client socket.
        var
            client = new Socket
            address = ""

        # Block, waiting for new connections.
        acceptAddr( server, client, address )

        let pid = fork()
        if pid == 0:
            # Child: it has no use for the listener.  Serve the one
            # client, then exit.
            server.close
            process( client, address )
            quit( 0 )

        # Parent: the child holds its own copy of the client socket.
        client.close
        when defined( testing ): dumpNumberOfInstances()
0 | 252 |
|
253 |
||
8 | 254 |
proc parse_cmdline: Config =
    ## Populate the config object with the user's preferences.
    ##
    ## Starts from the built-in defaults, then applies each recognized
    ## command line option; unknown options and bare arguments are
    ## ignored.  -h/--help and -v/--version print and exit immediately.
    ## The insert statement is derived from the final table name, so the
    ## +dbtable+ and +insertsql+ fields always agree.

    # Config object defaults.
    #
    result = Config(
        dbopts: "host=localhost dbname=netdata application_name=netdata-tsrelay",
        dbtable: "netdata",
        listen_port: 14866,
        listen_addr: "0.0.0.0",
        verbose: true,
        debug: false,
        timeout: 500
    )

    # always set debug mode if development build.
    result.debug = defined( testing )

    for kind, key, val in getopt():
        case kind

        of cmdArgument:
            discard

        of cmdLongOption, cmdShortOption:
            case key
                of "debug", "d":
                    result.debug = true

                of "help", "h":
                    echo USAGE
                    quit( 0 )

                of "quiet", "q":
                    result.verbose = false

                of "version", "v":
                    echo hl( "netdata_tsrelay " & VERSION, fgWhite, bright=true )
                    quit( 0 )

                of "timeout", "t": result.timeout = val.parse_int

                # Record the table name itself; the insert statement is
                # built from it once all options have been seen.
                of "dbtable", "T": result.dbtable = val

                of "dbopts": result.dbopts = val

                of "listen-addr", "a": result.listen_addr = val
                of "listen-port", "p": result.listen_port = val.parse_int

                else: discard

        of cmdEnd: assert( false ) # shouldn't reach here ever

    # Interpolate the (possibly overridden) table name into the insert.
    result.insertsql = INSERT_SQL % [ result.dbtable ]
|
307 |
||
308 |
||
309 |
when isMainModule:
    # Register resetAttributes to run when the program quits.
    addQuitProc( resetAttributes )

    # Load the global configuration from the command line, show it when
    # debugging, then hand control to the accept loop.
    conf = parse_cmdline()
    if conf.debug:
        echo hl( $conf, fgYellow )
    conf.serverloop
0 | 314 |