forked from influxdata/go-syslog
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmachine.go.rl
263 lines (209 loc) · 6.32 KB
/
machine.go.rl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
package rfc3164
import (
"fmt"
"time"
"github.com/influxdata/go-syslog/v3"
"github.com/influxdata/go-syslog/v3/common"
)
var (
errPrival = "expecting a priority value in the range 1-191 or equal to 0 [col %d]"
errPri = "expecting a priority value within angle brackets [col %d]"
errTimestamp = "expecting a Stamp timestamp [col %d]"
errRFC3339 = "expecting a Stamp or a RFC3339 timestamp [col %d]"
errHostname = "expecting an hostname (from 1 to max 255 US-ASCII characters) [col %d]"
errTag = "expecting an alphanumeric tag (max 32 characters) [col %d]"
errContentStart = "expecting a content part starting with a non-alphanumeric character [col %d]"
errContent = "expecting a content part composed by visible characters only [col %d]"
errParse = "parsing error [col %d]"
)
%%{
machine rfc3164;
include common "common.rl";
# unsigned alphabet
alphtype uint8;
action mark {
m.pb = m.p
}
action set_prival {
output.priority = uint8(common.UnsafeUTF8DecimalCodePointsToInt(m.text()))
output.prioritySet = true
}
action set_timestamp {
if t, e := time.Parse(time.Stamp, string(m.text())); e != nil {
m.err = fmt.Errorf("%s [col %d]", e, m.p)
fhold;
fgoto fail;
} else {
if m.timezone != nil {
t, _ = time.ParseInLocation(time.Stamp, string(m.text()), m.timezone)
}
output.timestamp = t.AddDate(m.yyyy, 0, 0)
if m.loc != nil {
output.timestamp = output.timestamp.In(m.loc)
}
output.timestampSet = true
}
}
action set_rfc3339 {
if t, e := time.Parse(time.RFC3339, string(m.text())); e != nil {
m.err = fmt.Errorf("%s [col %d]", e, m.p)
fhold;
fgoto fail;
} else {
output.timestamp = t
output.timestampSet = true
}
}
action set_hostname {
output.hostname = string(m.text())
}
action set_tag {
output.tag = string(m.text())
}
action set_content {
output.content = string(m.text())
}
action set_message {
output.message = string(m.text())
}
action err_prival {
m.err = fmt.Errorf(errPrival, m.p)
fhold;
fgoto fail;
}
action err_pri {
m.err = fmt.Errorf(errPri, m.p)
fhold;
fgoto fail;
}
action err_timestamp {
m.err = fmt.Errorf(errTimestamp, m.p)
fhold;
fgoto fail;
}
action err_rfc3339 {
m.err = fmt.Errorf(errRFC3339, m.p)
fhold;
fgoto fail;
}
action err_hostname {
m.err = fmt.Errorf(errHostname, m.p)
fhold;
fgoto fail;
}
action err_tag {
m.err = fmt.Errorf(errTag, m.p)
fhold;
fgoto fail;
}
action err_contentstart {
m.err = fmt.Errorf(errContentStart, m.p)
fhold;
fgoto fail;
}
action err_content {
m.err = fmt.Errorf(errContent, m.p)
fhold;
fgoto fail;
}
pri = ('<' prival >mark %from(set_prival) $err(err_prival) '>') @err(err_pri);
timestamp = (datemmm sp datemday sp hhmmss) >mark %set_timestamp @err(err_timestamp);
rfc3339 = fulldate >mark 'T' hhmmss timeoffset %set_rfc3339 @err(err_rfc3339);
# note > RFC 3164 says "The Domain Name MUST NOT be included in the HOSTNAME field"
# note > this could mean that the we may need to create and to use a labelrange = graph{1,63} here if we want the parser to be stricter.
hostname = hostnamerange >mark %set_hostname $err(err_hostname);
# Section 4.1.3
# note > alnum{1,32} is too restrictive (eg., no dashes)
# note > see https://tools.ietf.org/html/rfc2234#section-2.1 for an interpretation of "ABNF alphanumeric" as stated by RFC 3164 regarding the tag
# note > while RFC3164 assumes only ABNF alphanumeric process names, many BSD-syslog contains processe names with additional characters (-, _, .)
tag = (print -- [ :\[]){1,32} >mark %set_tag @err(err_tag);
visible = print | 0x80..0xFF;
# The first not alphanumeric character starts the content (usually containing a PID) part of the message part
contentval = !alnum @err(err_contentstart) >mark print* %set_content @err(err_content);
content = '[' contentval ']'; # todo(leodido) > support ':' and ' ' too. Also they have to match?
mex = visible+ >mark %set_message;
msg = (tag content? ':' sp)? mex;
fail := (any - [\n\r])* @err{ fgoto main; };
main := pri (timestamp | (rfc3339 when { m.rfc3339 })) sp hostname sp msg;
}%%
%% write data noerror noprefix;
type machine struct {
data []byte
cs int
p, pe, eof int
pb int
err error
bestEffort bool
yyyy int
rfc3339 bool
loc *time.Location
timezone *time.Location
}
// NewMachine creates a new FSM able to parse RFC3164 syslog messages.
func NewMachine(options ...syslog.MachineOption) syslog.Machine {
m := &machine{}
for _, opt := range options {
opt(m)
}
%% access m.;
%% variable p m.p;
%% variable pe m.pe;
%% variable eof m.eof;
%% variable data m.data;
return m
}
// WithBestEffort enables best effort mode.
func (m *machine) WithBestEffort() {
m.bestEffort = true
}
// HasBestEffort tells whether the receiving machine has best effort mode on or off.
func (m *machine) HasBestEffort() bool {
return m.bestEffort
}
// WithYear sets the year for the Stamp timestamp of the RFC 3164 syslog message.
func (m *machine) WithYear(o YearOperator) {
m.yyyy = YearOperation{o}.Operate()
}
// WithTimezone sets the time zone for the Stamp timestamp of the RFC 3164 syslog message.
func (m *machine) WithTimezone(loc *time.Location) {
m.loc = loc
}
// WithLocaleTimezone sets the locale time zone for the Stamp timestamp of the RFC 3164 syslog message.
func (m *machine) WithLocaleTimezone(loc *time.Location) {
m.timezone = loc
}
// WithRFC3339 enables ability to ALSO match RFC3339 timestamps.
//
// Notice this does not disable the default and correct timestamps - ie., Stamp timestamps.
func (m *machine) WithRFC3339() {
m.rfc3339 = true
}
// Err returns the error that occurred on the last call to Parse.
//
// If the result is nil, then the line was parsed successfully.
func (m *machine) Err() error {
return m.err
}
func (m *machine) text() []byte {
return m.data[m.pb:m.p]
}
// Parse parses the input byte array as a RFC3164 syslog message.
func (m *machine) Parse(input []byte) (syslog.Message, error) {
m.data = input
m.p = 0
m.pb = 0
m.pe = len(input)
m.eof = len(input)
m.err = nil
output := &syslogMessage{}
%% write init;
%% write exec;
if m.cs < first_final || m.cs == en_fail {
if m.bestEffort && output.minimal() {
// An error occurred but partial parsing is on and partial message is minimally valid
return output.export(), m.err
}
return nil, m.err
}
return output.export(), nil
}