grok_test.go 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738
  1. package grok
  2. import (
  3. "bufio"
  4. "fmt"
  5. "strings"
  6. "testing"
  7. )
  8. func TestNew(t *testing.T) {
  9. g, _ := New()
  10. if len(g.patterns) == 0 {
  11. t.Fatal("the Grok object should have some patterns pre loaded")
  12. }
  13. g, _ = NewWithConfig(&Config{NamedCapturesOnly: true})
  14. if len(g.patterns) == 0 {
  15. t.Fatal("the Grok object should have some patterns pre loaded")
  16. }
  17. }
  18. func TestParseWithDefaultCaptureMode(t *testing.T) {
  19. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  20. if captures, err := g.Parse("%{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`); err != nil {
  21. t.Fatalf("error can not capture : %s", err.Error())
  22. } else {
  23. if captures["timestamp"] != "23/Apr/2014:22:58:32 +0200" {
  24. t.Fatalf("%s should be '%s' have '%s'", "timestamp", "23/Apr/2014:22:58:32 +0200", captures["timestamp"])
  25. }
  26. if captures["TIME"] != "" {
  27. t.Fatalf("%s should be '%s' have '%s'", "TIME", "", captures["TIME"])
  28. }
  29. }
  30. g, _ = New()
  31. if captures, err := g.Parse("%{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`); err != nil {
  32. t.Fatalf("error can not capture : %s", err.Error())
  33. } else {
  34. if captures["timestamp"] != "23/Apr/2014:22:58:32 +0200" {
  35. t.Fatalf("%s should be '%s' have '%s'", "timestamp", "23/Apr/2014:22:58:32 +0200", captures["timestamp"])
  36. }
  37. if captures["TIME"] != "22:58:32" {
  38. t.Fatalf("%s should be '%s' have '%s'", "TIME", "22:58:32", captures["TIME"])
  39. }
  40. }
  41. }
  42. func TestMultiParseWithDefaultCaptureMode(t *testing.T) {
  43. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  44. res, _ := g.ParseToMultiMap("%{COMMONAPACHELOG} %{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:23:58:32 +0200] "GET /index.php HTTP/1.1" 404 207 127.0.0.1 - - [24/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  45. if len(res["TIME"]) != 0 {
  46. t.Fatalf("DAY should be an array of 0 elements, but is '%s'", res["TIME"])
  47. }
  48. g, _ = New()
  49. res, _ = g.ParseToMultiMap("%{COMMONAPACHELOG} %{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:23:58:32 +0200] "GET /index.php HTTP/1.1" 404 207 127.0.0.1 - - [24/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  50. if len(res["TIME"]) != 2 {
  51. t.Fatalf("TIME should be an array of 2 elements, but is '%s'", res["TIME"])
  52. }
  53. if len(res["timestamp"]) != 2 {
  54. t.Fatalf("timestamp should be an array of 2 elements, but is '%s'", res["timestamp"])
  55. }
  56. }
  57. func TestNewWithNoDefaultPatterns(t *testing.T) {
  58. g, _ := NewWithConfig(&Config{SkipDefaultPatterns: true})
  59. if len(g.patterns) != 0 {
  60. t.Fatal("Using SkipDefaultPatterns the Grok object should not have any patterns pre loaded")
  61. }
  62. }
  63. func TestAddPatternErr(t *testing.T) {
  64. name := "Error"
  65. pattern := "%{ERR}"
  66. g, _ := New()
  67. err := g.addPattern(name, pattern)
  68. if err == nil {
  69. t.Fatalf("AddPattern should returns an error when path is invalid")
  70. }
  71. }
  72. func TestAddPatternsFromPathErr(t *testing.T) {
  73. g, _ := New()
  74. err := g.AddPatternsFromPath("./Lorem ipsum Minim qui in.")
  75. if err == nil {
  76. t.Fatalf("AddPatternsFromPath should returns an error when path is invalid")
  77. }
  78. }
  79. func TestConfigPatternsDir(t *testing.T) {
  80. g, err := NewWithConfig(&Config{PatternsDir: []string{"./patterns"}})
  81. if err != nil {
  82. t.Error(err)
  83. }
  84. if captures, err := g.Parse("%{SYSLOGLINE}", `Sep 12 23:19:02 docker syslog-ng[25389]: syslog-ng starting up; version='3.5.3'`); err != nil {
  85. t.Fatalf("error : %s", err.Error())
  86. } else {
  87. // pp.Print(captures)
  88. if captures["program"] != "syslog-ng" {
  89. t.Fatalf("%s should be '%s' have '%s'", "program", "syslog-ng", captures["program"])
  90. }
  91. }
  92. }
  93. func TestAddPatternsFromPathFileOpenErr(t *testing.T) {
  94. t.Skipped()
  95. }
  96. func TestAddPatternsFromPathFile(t *testing.T) {
  97. g, _ := New()
  98. err := g.AddPatternsFromPath("./patterns/grok-patterns")
  99. if err != nil {
  100. t.Fatalf("err %#v", err)
  101. }
  102. }
  103. func TestAddPattern(t *testing.T) {
  104. name := "DAYO"
  105. pattern := "(?:Mon(?:day)?|Tue(?:sday)?|Wed(?:nesday)?|Thu(?:rsday)?|Fri(?:day)?|Sat(?:urday)?|Sun(?:day)?)"
  106. g, _ := New()
  107. cPatterns := len(g.patterns)
  108. g.AddPattern(name, pattern)
  109. g.AddPattern(name+"2", pattern)
  110. if len(g.patterns) != cPatterns+2 {
  111. t.Fatalf("%d Default patterns should be available, have %d", cPatterns+2, len(g.patterns))
  112. }
  113. g, _ = NewWithConfig(&Config{NamedCapturesOnly: true})
  114. cPatterns = len(g.patterns)
  115. g.AddPattern(name, pattern)
  116. g.AddPattern(name+"2", pattern)
  117. if len(g.patterns) != cPatterns+2 {
  118. t.Fatalf("%d NamedCapture patterns should be available, have %d", cPatterns+2, len(g.patterns))
  119. }
  120. }
  121. func TestMatch(t *testing.T) {
  122. g, _ := New()
  123. g.AddPatternsFromPath("./patterns")
  124. if r, err := g.Match("%{MONTH}", "June"); !r {
  125. t.Fatalf("June should match %s: err=%s", "%{MONTH}", err.Error())
  126. }
  127. }
  128. func TestDoesNotMatch(t *testing.T) {
  129. g, _ := New()
  130. g.AddPatternsFromPath("./patterns")
  131. if r, _ := g.Match("%{MONTH}", "13"); r {
  132. t.Fatalf("13 should not match %s", "%{MONTH}")
  133. }
  134. }
  135. func TestErrorMatch(t *testing.T) {
  136. g, _ := New()
  137. if _, err := g.Match("(", "13"); err == nil {
  138. t.Fatal("Error expected")
  139. }
  140. }
  141. func TestShortName(t *testing.T) {
  142. g, _ := New()
  143. g.AddPattern("A", "a")
  144. m, err := g.Match("%{A}", "a")
  145. if err != nil {
  146. t.Fatal("a should match %%{A}: err=%s", err.Error())
  147. }
  148. if !m {
  149. t.Fatal("%%{A} didn't match 'a'")
  150. }
  151. }
  152. func TestDayCompile(t *testing.T) {
  153. g, _ := New()
  154. g.AddPattern("DAY", "(?:Mon(?:day)?|Tue(?:sday)?|Wed(?:nesday)?|Thu(?:rsday)?|Fri(?:day)?|Sat(?:urday)?|Sun(?:day)?)")
  155. pattern := "%{DAY}"
  156. _, err := g.compile(pattern)
  157. if err != nil {
  158. t.Fatal("Error:", err)
  159. }
  160. }
  161. func TestErrorCompile(t *testing.T) {
  162. g, _ := New()
  163. _, err := g.compile("(")
  164. if err == nil {
  165. t.Fatal("Error:", err)
  166. }
  167. }
  168. func TestNamedCaptures(t *testing.T) {
  169. g, _ := New()
  170. g.AddPatternsFromPath("./patterns")
  171. check := func(key, value, pattern, text string) {
  172. captures, _ := g.Parse(pattern, text)
  173. if captures[key] != value {
  174. t.Fatalf("%s should be '%s' have '%s'", key, value, captures[key])
  175. }
  176. }
  177. check("jour", "Tue",
  178. "%{DAY:jour}",
  179. "Tue May 15 11:21:42 [conn1047685] moveChunk deleted: 7157",
  180. )
  181. check("day-of.week", "Tue",
  182. "%{DAY:day-of.week}",
  183. "Tue May 15 11:21:42 [conn1047685] moveChunk deleted: 7157",
  184. )
  185. }
  186. func TestErrorCaptureUnknowPattern(t *testing.T) {
  187. g, _ := New()
  188. pattern := "%{UNKNOWPATTERN}"
  189. _, err := g.Parse(pattern, "")
  190. if err == nil {
  191. t.Fatal("Expected error not set")
  192. }
  193. }
  194. func TestParse(t *testing.T) {
  195. g, _ := New()
  196. g.AddPatternsFromPath("./patterns")
  197. res, _ := g.Parse("%{DAY}", "Tue qds")
  198. if res["DAY"] != "Tue" {
  199. t.Fatalf("DAY should be 'Tue' have '%s'", res["DAY"])
  200. }
  201. }
  202. func TestErrorParseToMultiMap(t *testing.T) {
  203. g, _ := New()
  204. pattern := "%{UNKNOWPATTERN}"
  205. _, err := g.ParseToMultiMap(pattern, "")
  206. if err == nil {
  207. t.Fatal("Expected error not set")
  208. }
  209. }
  210. func TestParseToMultiMap(t *testing.T) {
  211. g, _ := New()
  212. g.AddPatternsFromPath("./patterns")
  213. res, _ := g.ParseToMultiMap("%{COMMONAPACHELOG} %{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:23:58:32 +0200] "GET /index.php HTTP/1.1" 404 207 127.0.0.1 - - [24/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  214. if len(res["TIME"]) != 2 {
  215. t.Fatalf("DAY should be an array of 3 elements, but is '%s'", res["TIME"])
  216. }
  217. if res["TIME"][0] != "23:58:32" {
  218. t.Fatalf("TIME[0] should be '23:58:32' have '%s'", res["TIME"][0])
  219. }
  220. if res["TIME"][1] != "22:58:32" {
  221. t.Fatalf("TIME[1] should be '22:58:32' have '%s'", res["TIME"][1])
  222. }
  223. }
  224. func TestParseToMultiMapOnlyNamedCaptures(t *testing.T) {
  225. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  226. g.AddPatternsFromPath("./patterns")
  227. res, _ := g.ParseToMultiMap("%{COMMONAPACHELOG} %{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207 127.0.0.1 - - [24/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  228. if len(res["timestamp"]) != 2 {
  229. t.Fatalf("timestamp should be an array of 2 elements, but is '%s'", res["timestamp"])
  230. }
  231. if res["timestamp"][0] != "23/Apr/2014:22:58:32 +0200" {
  232. t.Fatalf("timestamp[0] should be '23/Apr/2014:22:58:32 +0200' have '%s'", res["DAY"][0])
  233. }
  234. if res["timestamp"][1] != "24/Apr/2014:22:58:32 +0200" {
  235. t.Fatalf("timestamp[1] should be '24/Apr/2014:22:58:32 +0200' have '%s'", res["DAY"][1])
  236. }
  237. }
  238. func TestCaptureAll(t *testing.T) {
  239. g, _ := New()
  240. g.AddPatternsFromPath("./patterns")
  241. check := func(key, value, pattern, text string) {
  242. if captures, err := g.Parse(pattern, text); err != nil {
  243. t.Fatalf("error can not capture : %s", err.Error())
  244. } else {
  245. if captures[key] != value {
  246. t.Fatalf("%s should be '%s' have '%s'", key, value, captures[key])
  247. }
  248. }
  249. }
  250. check("timestamp", "23/Apr/2014:22:58:32 +0200",
  251. "%{COMMONAPACHELOG}",
  252. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  253. )
  254. check("TIME", "22:58:32",
  255. "%{COMMONAPACHELOG}",
  256. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  257. )
  258. check("SECOND", `17,1599`, "%{TIMESTAMP_ISO8601}", `s d9fq4999s ../ sdf 2013-11-06 04:50:17,1599sd`)
  259. check("HOSTNAME", `google.com`, "%{HOSTPORT}", `google.com:8080`)
  260. //HOSTPORT
  261. check("POSINT", `8080`, "%{HOSTPORT}", `google.com:8080`)
  262. }
  263. func TestNamedCapture(t *testing.T) {
  264. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  265. g.AddPatternsFromPath("./patterns")
  266. check := func(key, value, pattern, text string) {
  267. if captures, err := g.Parse(pattern, text); err != nil {
  268. t.Fatalf("error can not capture : %s", err.Error())
  269. } else {
  270. if captures[key] != value {
  271. t.Fatalf("%s should be '%s' have '%s'", key, value, captures[key])
  272. }
  273. }
  274. }
  275. check("timestamp", "23/Apr/2014:22:58:32 +0200",
  276. "%{COMMONAPACHELOG}",
  277. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  278. )
  279. check("TIME", "",
  280. "%{COMMONAPACHELOG}",
  281. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  282. )
  283. check("SECOND", ``, "%{TIMESTAMP_ISO8601}", `s d9fq4999s ../ sdf 2013-11-06 04:50:17,1599sd`)
  284. check("HOSTNAME", ``, "%{HOSTPORT}", `google.com:8080`)
  285. //HOSTPORT
  286. check("POSINT", ``, "%{HOSTPORT}", `google.com:8080`)
  287. }
  288. func TestRemoveEmptyValues(t *testing.T) {
  289. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true, RemoveEmptyValues: true})
  290. capturesExists := func(key, pattern, text string) {
  291. if captures, err := g.Parse(pattern, text); err != nil {
  292. t.Fatalf("error can not capture : %s", err.Error())
  293. } else {
  294. if _, ok := captures[key]; ok {
  295. t.Fatalf("%s should be absent", key)
  296. }
  297. }
  298. }
  299. capturesExists("rawrequest", "%{COMMONAPACHELOG}",
  300. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  301. )
  302. }
  303. func TestCapturesAndNamedCapture(t *testing.T) {
  304. check := func(key, value, pattern, text string) {
  305. g, _ := New()
  306. if captures, err := g.Parse(pattern, text); err != nil {
  307. t.Fatalf("error can not capture : %s", err.Error())
  308. } else {
  309. if captures[key] != value {
  310. t.Fatalf("%s should be '%s' have '%s'", key, value, captures[key])
  311. }
  312. }
  313. }
  314. checkNamed := func(key, value, pattern, text string) {
  315. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  316. if captures, err := g.Parse(pattern, text); err != nil {
  317. t.Fatalf("error can not capture : %s", err.Error())
  318. } else {
  319. if captures[key] != value {
  320. t.Fatalf("%s should be '%s' have '%s'", key, value, captures[key])
  321. }
  322. }
  323. }
  324. check("DAY", "Tue",
  325. "%{DAY}",
  326. "Tue May 15 11:21:42 [conn1047685] moveChunk deleted: 7157",
  327. )
  328. checkNamed("jour", "Tue",
  329. "%{DAY:jour}",
  330. "Tue May 15 11:21:42 [conn1047685] moveChunk deleted: 7157",
  331. )
  332. check("clientip", "127.0.0.1",
  333. "%{COMMONAPACHELOG}",
  334. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  335. )
  336. check("verb", "GET",
  337. "%{COMMONAPACHELOG}",
  338. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  339. )
  340. check("timestamp", "23/Apr/2014:22:58:32 +0200",
  341. "%{COMMONAPACHELOG}",
  342. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  343. )
  344. check("bytes", "207",
  345. "%{COMMONAPACHELOG}",
  346. `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`,
  347. )
  348. //PATH
  349. check("WINPATH", `c:\winfows\sdf.txt`, "%{WINPATH}", `s dfqs c:\winfows\sdf.txt`)
  350. check("WINPATH", `\\sdf\winfows\sdf.txt`, "%{WINPATH}", `s dfqs \\sdf\winfows\sdf.txt`)
  351. check("UNIXPATH", `/usr/lib/`, "%{UNIXPATH}", `s dfqs /usr/lib/ sqfd`)
  352. check("UNIXPATH", `/usr/lib`, "%{UNIXPATH}", `s dfqs /usr/lib sqfd`)
  353. check("UNIXPATH", `/usr/`, "%{UNIXPATH}", `s dfqs /usr/ sqfd`)
  354. check("UNIXPATH", `/usr`, "%{UNIXPATH}", `s dfqs /usr sqfd`)
  355. check("UNIXPATH", `/`, "%{UNIXPATH}", `s dfqs / sqfd`)
  356. //YEAR
  357. check("YEAR", `4999`, "%{YEAR}", `s d9fq4999s ../ sdf`)
  358. check("YEAR", `79`, "%{YEAR}", `s d79fq4999s ../ sdf`)
  359. check("TIMESTAMP_ISO8601", `2013-11-06 04:50:17,1599`, "%{TIMESTAMP_ISO8601}", `s d9fq4999s ../ sdf 2013-11-06 04:50:17,1599sd`)
  360. //MAC
  361. check("MAC", `01:02:03:04:ab:cf`, "%{MAC}", `s d9fq4999s ../ sdf 2013- 01:02:03:04:ab:cf 11-06 04:50:17,1599sd`)
  362. check("MAC", `01-02-03-04-ab-cd`, "%{MAC}", `s d9fq4999s ../ sdf 2013- 01-02-03-04-ab-cd 11-06 04:50:17,1599sd`)
  363. //QUOTEDSTRING
  364. check("QUOTEDSTRING", `"lkj"`, "%{QUOTEDSTRING}", `qsdklfjqsd fk"lkj"mkj`)
  365. check("QUOTEDSTRING", `'lkj'`, "%{QUOTEDSTRING}", `qsdklfjqsd fk'lkj'mkj`)
  366. check("QUOTEDSTRING", `"fk'lkj'm"`, "%{QUOTEDSTRING}", `qsdklfjqsd "fk'lkj'm"kj`)
  367. check("QUOTEDSTRING", `'fk"lkj"m'`, "%{QUOTEDSTRING}", `qsdklfjqsd 'fk"lkj"m'kj`)
  368. //BASE10NUM
  369. check("BASE10NUM", `1`, "%{BASE10NUM}", `1`) // this is a nice one
  370. check("BASE10NUM", `8080`, "%{BASE10NUM}", `qsfd8080qsfd`)
  371. }
  372. // Should be run with -race
  373. func TestConcurentParse(t *testing.T) {
  374. g, _ := New()
  375. g.AddPatternsFromPath("./patterns")
  376. check := func(key, value, pattern, text string) {
  377. if captures, err := g.Parse(pattern, text); err != nil {
  378. t.Fatalf("error can not capture : %s", err.Error())
  379. } else {
  380. if captures[key] != value {
  381. t.Fatalf("%s should be '%s' have '%s'", key, value, captures[key])
  382. }
  383. }
  384. }
  385. go check("QUOTEDSTRING", `"lkj"`, "%{QUOTEDSTRING}", `qsdklfjqsd fk"lkj"mkj`)
  386. go check("QUOTEDSTRING", `'lkj'`, "%{QUOTEDSTRING}", `qsdklfjqsd fk'lkj'mkj`)
  387. go check("QUOTEDSTRING", `'lkj'`, "%{QUOTEDSTRING}", `qsdklfjqsd fk'lkj'mkj`)
  388. go check("QUOTEDSTRING", `"fk'lkj'm"`, "%{QUOTEDSTRING}", `qsdklfjqsd "fk'lkj'm"kj`)
  389. go check("QUOTEDSTRING", `'fk"lkj"m'`, "%{QUOTEDSTRING}", `qsdklfjqsd 'fk"lkj"m'kj`)
  390. }
  391. func TestPatterns(t *testing.T) {
  392. g, _ := NewWithConfig(&Config{SkipDefaultPatterns: true})
  393. if len(g.patterns) != 0 {
  394. t.Fatalf("Patterns should return 0, have '%d'", len(g.patterns))
  395. }
  396. name := "DAY0"
  397. pattern := "(?:Mon(?:day)?|Tue(?:sday)?|Wed(?:nesday)?|Thu(?:rsday)?|Fri(?:day)?|Sat(?:urday)?|Sun(?:day)?)"
  398. g.AddPattern(name, pattern)
  399. g.AddPattern(name+"1", pattern)
  400. if len(g.patterns) != 2 {
  401. t.Fatalf("Patterns should return 2, have '%d'", len(g.patterns))
  402. }
  403. }
  404. func TestParseTypedWithDefaultCaptureMode(t *testing.T) {
  405. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  406. if captures, err := g.ParseTyped("%{IPV4:ip:string} %{NUMBER:status:int} %{NUMBER:duration:float}", `127.0.0.1 200 0.8`); err != nil {
  407. t.Fatalf("error can not capture : %s", err.Error())
  408. } else {
  409. if captures["ip"] != "127.0.0.1" {
  410. t.Fatalf("%s should be '%s' have '%s'", "ip", "127.0.0.1", captures["ip"])
  411. } else {
  412. if captures["status"] != 200 {
  413. t.Fatalf("%s should be '%d' have '%d'", "status", 200, captures["status"])
  414. } else {
  415. if captures["duration"] != 0.8 {
  416. t.Fatalf("%s should be '%f' have '%f'", "duration", 0.8, captures["duration"])
  417. }
  418. }
  419. }
  420. }
  421. }
  422. func TestParseTypedWithNoTypeInfo(t *testing.T) {
  423. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  424. if captures, err := g.ParseTyped("%{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`); err != nil {
  425. t.Fatalf("error can not capture : %s", err.Error())
  426. } else {
  427. if captures["timestamp"] != "23/Apr/2014:22:58:32 +0200" {
  428. t.Fatalf("%s should be '%s' have '%s'", "timestamp", "23/Apr/2014:22:58:32 +0200", captures["timestamp"])
  429. }
  430. if captures["TIME"] != nil {
  431. t.Fatalf("%s should be nil have '%s'", "TIME", captures["TIME"])
  432. }
  433. }
  434. g, _ = New()
  435. if captures, err := g.ParseTyped("%{COMMONAPACHELOG}", `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`); err != nil {
  436. t.Fatalf("error can not capture : %s", err.Error())
  437. } else {
  438. if captures["timestamp"] != "23/Apr/2014:22:58:32 +0200" {
  439. t.Fatalf("%s should be '%s' have '%s'", "timestamp", "23/Apr/2014:22:58:32 +0200", captures["timestamp"])
  440. }
  441. if captures["TIME"] != "22:58:32" {
  442. t.Fatalf("%s should be '%s' have '%s'", "TIME", "22:58:32", captures["TIME"])
  443. }
  444. }
  445. }
  446. func TestParseTypedWithIntegerTypeCoercion(t *testing.T) {
  447. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  448. if captures, err := g.ParseTyped("%{WORD:coerced:int}", `5.75`); err != nil {
  449. t.Fatalf("error can not capture : %s", err.Error())
  450. } else {
  451. if captures["coerced"] != 5 {
  452. t.Fatalf("%s should be '%s' have '%s'", "coerced", "5", captures["coerced"])
  453. }
  454. }
  455. }
  456. func TestParseTypedWithUnknownType(t *testing.T) {
  457. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  458. if _, err := g.ParseTyped("%{WORD:word:unknown}", `hello`); err == nil {
  459. t.Fatalf("parsing an unknown type must result in a conversion error")
  460. }
  461. }
  462. func TestParseTypedErrorCaptureUnknowPattern(t *testing.T) {
  463. g, _ := New()
  464. pattern := "%{UNKNOWPATTERN}"
  465. _, err := g.ParseTyped(pattern, "")
  466. if err == nil {
  467. t.Fatal("Expected error not set")
  468. }
  469. }
  470. func TestParseTypedWithTypedParents(t *testing.T) {
  471. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  472. g.AddPattern("TESTCOMMON", `%{IPORHOST:clientip} %{USER:ident} %{USER:auth} \[%{HTTPDATE:timestamp}\] "(?:%{WORD:verb} %{NOTSPACE:request}(?: HTTP/%{NUMBER:httpversion})?|%{DATA:rawrequest})" %{NUMBER:response} (?:%{NUMBER:bytes:int}|-)`)
  473. if captures, err := g.ParseTyped("%{TESTCOMMON}", `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`); err != nil {
  474. t.Fatalf("error can not capture : %s", err.Error())
  475. } else {
  476. if captures["bytes"] != 207 {
  477. t.Fatalf("%s should be '%s' have '%s'", "bytes", "207", captures["bytes"])
  478. }
  479. }
  480. }
  481. func TestParseTypedWithSemanticHomonyms(t *testing.T) {
  482. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true, SkipDefaultPatterns: true})
  483. g.AddPattern("BASE10NUM", `([+-]?(?:[0-9]+(?:\.[0-9]+)?)|\.[0-9]+)`)
  484. g.AddPattern("NUMBER", `(?:%{BASE10NUM})`)
  485. g.AddPattern("MYNUM", `%{NUMBER:bytes:int}`)
  486. g.AddPattern("MYSTR", `%{NUMBER:bytes:string}`)
  487. if captures, err := g.ParseTyped("%{MYNUM}", `207`); err != nil {
  488. t.Fatalf("error can not scapture : %s", err.Error())
  489. } else {
  490. if captures["bytes"] != 207 {
  491. t.Fatalf("%s should be %#v have %#v", "bytes", 207, captures["bytes"])
  492. }
  493. }
  494. if captures, err := g.ParseTyped("%{MYSTR}", `207`); err != nil {
  495. t.Fatalf("error can not capture : %s", err.Error())
  496. } else {
  497. if captures["bytes"] != "207" {
  498. t.Fatalf("%s should be %#v have %#v", "bytes", "207", captures["bytes"])
  499. }
  500. }
  501. }
  502. var resultNew *Grok
  503. func BenchmarkNew(b *testing.B) {
  504. b.ReportAllocs()
  505. b.ResetTimer()
  506. var g *Grok
  507. // run the check function b.N times
  508. for n := 0; n < b.N; n++ {
  509. g, _ = NewWithConfig(&Config{NamedCapturesOnly: true})
  510. }
  511. resultNew = g
  512. }
  513. func BenchmarkCaptures(b *testing.B) {
  514. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  515. b.ReportAllocs()
  516. b.ResetTimer()
  517. // run the check function b.N times
  518. for n := 0; n < b.N; n++ {
  519. g.Parse(`%{IPORHOST:clientip} %{USER:ident} %{USER:auth} \[%{HTTPDATE:timestamp}\] "(?:%{WORD:verb} %{NOTSPACE:request}(?: HTTP/%{NUMBER:httpversion})?|%{DATA:rawrequest})" %{NUMBER:response} (?:%{NUMBER:bytes}|-)`, `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  520. }
  521. }
  522. func BenchmarkCapturesTypedFake(b *testing.B) {
  523. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  524. b.ReportAllocs()
  525. b.ResetTimer()
  526. // run the check function b.N times
  527. for n := 0; n < b.N; n++ {
  528. g.Parse(`%{IPORHOST:clientip} %{USER:ident} %{USER:auth} \[%{HTTPDATE:timestamp}\] "(?:%{WORD:verb} %{NOTSPACE:request}(?: HTTP/%{NUMBER:httpversion})?|%{DATA:rawrequest})" %{NUMBER:response} (?:%{NUMBER:bytes}|-)`, `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  529. }
  530. }
  531. func BenchmarkCapturesTypedReal(b *testing.B) {
  532. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  533. b.ReportAllocs()
  534. b.ResetTimer()
  535. // run the check function b.N times
  536. for n := 0; n < b.N; n++ {
  537. g.ParseTyped(`%{IPORHOST:clientip} %{USER:ident} %{USER:auth} \[%{HTTPDATE:timestamp}\] "(?:%{WORD:verb} %{NOTSPACE:request}(?: HTTP/%{NUMBER:httpversion:int})?|%{DATA:rawrequest})" %{NUMBER:response:int} (?:%{NUMBER:bytes:int}|-)`, `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  538. }
  539. }
  540. func BenchmarkParallelCaptures(b *testing.B) {
  541. g, _ := NewWithConfig(&Config{NamedCapturesOnly: true})
  542. b.ReportAllocs()
  543. b.ResetTimer()
  544. b.RunParallel(func(b *testing.PB) {
  545. for b.Next() {
  546. g.Parse(`%{IPORHOST:clientip} %{USER:ident} %{USER:auth} \[%{HTTPDATE:timestamp}\] "(?:%{WORD:verb} %{NOTSPACE:request}(?: HTTP/%{NUMBER:httpversion})?|%{DATA:rawrequest})" %{NUMBER:response} (?:%{NUMBER:bytes}|-)`, `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207`)
  547. }
  548. })
  549. }
  550. func TestGrok_AddPatternsFromMap_not_exist(t *testing.T) {
  551. defer func() {
  552. if r := recover(); r != nil {
  553. t.Fatalf("AddPatternsFromMap panics: %v", r)
  554. }
  555. }()
  556. g, _ := NewWithConfig(&Config{SkipDefaultPatterns: true})
  557. err := g.AddPatternsFromMap(map[string]string{
  558. "SOME": "%{NOT_EXIST}",
  559. })
  560. if err == nil {
  561. t.Errorf("AddPatternsFromMap should returns an error")
  562. }
  563. }
  564. func TestGrok_AddPatternsFromMap_simple(t *testing.T) {
  565. defer func() {
  566. if r := recover(); r != nil {
  567. t.Fatalf("AddPatternsFromMap panics: %v", r)
  568. }
  569. }()
  570. g, _ := NewWithConfig(&Config{SkipDefaultPatterns: true})
  571. err := g.AddPatternsFromMap(map[string]string{
  572. "NO3": `\d{3}`,
  573. })
  574. if err != nil {
  575. t.Errorf("AddPatternsFromMap returns an error: %v", err)
  576. }
  577. mss, err := g.Parse("%{NO3:match}", "333")
  578. if err != nil {
  579. t.Error("parsing error:", err)
  580. t.FailNow()
  581. }
  582. if mss["match"] != "333" {
  583. t.Errorf("bad match: expected 333, got %s", mss["match"])
  584. }
  585. }
  586. func TestGrok_AddPatternsFromMap_complex(t *testing.T) {
  587. defer func() {
  588. if r := recover(); r != nil {
  589. t.Fatalf("AddPatternsFromMap panics: %v", r)
  590. }
  591. }()
  592. g, _ := NewWithConfig(&Config{
  593. SkipDefaultPatterns: true,
  594. NamedCapturesOnly: true,
  595. })
  596. err := g.AddPatternsFromMap(map[string]string{
  597. "NO3": `\d{3}`,
  598. "NO6": "%{NO3}%{NO3}",
  599. })
  600. if err != nil {
  601. t.Errorf("AddPatternsFromMap returns an error: %v", err)
  602. }
  603. mss, err := g.Parse("%{NO6:number}", "333666")
  604. if err != nil {
  605. t.Error("parsing error:", err)
  606. t.FailNow()
  607. }
  608. if mss["number"] != "333666" {
  609. t.Errorf("bad match: expected 333666, got %s", mss["match"])
  610. }
  611. }
  612. func TestParseStream(t *testing.T) {
  613. g, _ := New()
  614. pTest := func(m map[string]string) error {
  615. ts, ok := m["timestamp"]
  616. if !ok {
  617. t.Error("timestamp not found")
  618. }
  619. if len(ts) == 0 {
  620. t.Error("empty timestamp")
  621. }
  622. return nil
  623. }
  624. const testLog = `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207
  625. 127.0.0.1 - - [23/Apr/2014:22:59:32 +0200] "GET /index.php HTTP/1.1" 404 207
  626. 127.0.0.1 - - [23/Apr/2014:23:00:32 +0200] "GET /index.php HTTP/1.1" 404 207
  627. `
  628. r := bufio.NewReader(strings.NewReader(testLog))
  629. if err := g.ParseStream(r, "%{COMMONAPACHELOG}", pTest); err != nil {
  630. t.Fatal(err)
  631. }
  632. }
  633. func TestParseStreamError(t *testing.T) {
  634. g, _ := New()
  635. pTest := func(m map[string]string) error {
  636. if _, ok := m["timestamp"]; !ok {
  637. return fmt.Errorf("timestamp not found")
  638. }
  639. return nil
  640. }
  641. const testLog = `127.0.0.1 - - [23/Apr/2014:22:58:32 +0200] "GET /index.php HTTP/1.1" 404 207
  642. 127.0.0.1 - - [xxxxxxxxxxxxxxxxxxxx +0200] "GET /index.php HTTP/1.1" 404 207
  643. 127.0.0.1 - - [23/Apr/2014:23:00:32 +0200] "GET /index.php HTTP/1.1" 404 207
  644. `
  645. r := bufio.NewReader(strings.NewReader(testLog))
  646. if err := g.ParseStream(r, "%{COMMONAPACHELOG}", pTest); err == nil {
  647. t.Fatal("Error expected")
  648. }
  649. }