parsing_test.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420
  1. package parser
  2. import (
  3. "bytes"
  4. "errors"
  5. "fmt"
  6. "html/template"
  7. "io"
  8. "os"
  9. "sort"
  10. "strings"
  11. "testing"
  12. "github.com/davecgh/go-spew/spew"
  13. log "github.com/sirupsen/logrus"
  14. "gopkg.in/yaml.v2"
  15. "github.com/crowdsecurity/crowdsec/pkg/exprhelpers"
  16. "github.com/crowdsecurity/crowdsec/pkg/types"
  17. )
// TestFile is one YAML document of a test.yaml file: the events to feed to the
// parser and the events expected to come out of it.
type TestFile struct {
	// Lines holds the input events that are run through Parse.
	Lines []types.Event `yaml:"lines,omitempty"`
	// Results holds the expected events; only the fields and map keys set
	// here are compared against the parser output.
	Results []types.Event `yaml:"results,omitempty"`
}
  22. var debug bool = false
  23. func TestParser(t *testing.T) {
  24. debug = true
  25. log.SetLevel(log.InfoLevel)
  26. var envSetting = os.Getenv("TEST_ONLY")
  27. pctx, ectx, err := prepTests()
  28. if err != nil {
  29. t.Fatalf("failed to load env : %s", err)
  30. }
  31. //Init the enricher
  32. if envSetting != "" {
  33. if err := testOneParser(pctx, ectx, envSetting, nil); err != nil {
  34. t.Fatalf("Test '%s' failed : %s", envSetting, err)
  35. }
  36. } else {
  37. fds, err := os.ReadDir("./tests/")
  38. if err != nil {
  39. t.Fatalf("Unable to read test directory : %s", err)
  40. }
  41. for _, fd := range fds {
  42. if !fd.IsDir() {
  43. continue
  44. }
  45. fname := "./tests/" + fd.Name()
  46. log.Infof("Running test on %s", fname)
  47. if err := testOneParser(pctx, ectx, fname, nil); err != nil {
  48. t.Fatalf("Test '%s' failed : %s", fname, err)
  49. }
  50. }
  51. }
  52. }
  53. func BenchmarkParser(t *testing.B) {
  54. log.Printf("start bench !!!!")
  55. debug = false
  56. log.SetLevel(log.ErrorLevel)
  57. pctx, ectx, err := prepTests()
  58. if err != nil {
  59. t.Fatalf("failed to load env : %s", err)
  60. }
  61. var envSetting = os.Getenv("TEST_ONLY")
  62. if envSetting != "" {
  63. if err := testOneParser(pctx, ectx, envSetting, t); err != nil {
  64. t.Fatalf("Test '%s' failed : %s", envSetting, err)
  65. }
  66. } else {
  67. fds, err := os.ReadDir("./tests/")
  68. if err != nil {
  69. t.Fatalf("Unable to read test directory : %s", err)
  70. }
  71. for _, fd := range fds {
  72. if !fd.IsDir() {
  73. continue
  74. }
  75. fname := "./tests/" + fd.Name()
  76. log.Infof("Running test on %s", fname)
  77. if err := testOneParser(pctx, ectx, fname, t); err != nil {
  78. t.Fatalf("Test '%s' failed : %s", fname, err)
  79. }
  80. }
  81. }
  82. }
  83. func testOneParser(pctx *UnixParserCtx, ectx EnricherCtx, dir string, b *testing.B) error {
  84. var (
  85. err error
  86. pnodes []Node
  87. parser_configs []Stagefile
  88. )
  89. log.Warningf("testing %s", dir)
  90. parser_cfg_file := fmt.Sprintf("%s/parsers.yaml", dir)
  91. cfg, err := os.ReadFile(parser_cfg_file)
  92. if err != nil {
  93. return fmt.Errorf("failed opening %s : %s", parser_cfg_file, err)
  94. }
  95. tmpl, err := template.New("test").Parse(string(cfg))
  96. if err != nil {
  97. return fmt.Errorf("failed to parse template %s : %s", cfg, err)
  98. }
  99. var out bytes.Buffer
  100. err = tmpl.Execute(&out, map[string]string{"TestDirectory": dir})
  101. if err != nil {
  102. panic(err)
  103. }
  104. if err = yaml.UnmarshalStrict(out.Bytes(), &parser_configs); err != nil {
  105. return fmt.Errorf("failed unmarshaling %s : %s", parser_cfg_file, err)
  106. }
  107. pnodes, err = LoadStages(parser_configs, pctx, ectx)
  108. if err != nil {
  109. return fmt.Errorf("unable to load parser config : %s", err)
  110. }
  111. //TBD: Load post overflows
  112. //func testFile(t *testing.T, file string, pctx UnixParserCtx, nodes []Node) bool {
  113. parser_test_file := fmt.Sprintf("%s/test.yaml", dir)
  114. tests := loadTestFile(parser_test_file)
  115. count := 1
  116. if b != nil {
  117. count = b.N
  118. b.ResetTimer()
  119. }
  120. for n := 0; n < count; n++ {
  121. if testFile(tests, *pctx, pnodes) != true {
  122. return fmt.Errorf("test failed !")
  123. }
  124. }
  125. return nil
  126. }
  127. // prepTests is going to do the initialisation of parser : it's going to load enrichment plugins and load the patterns. This is done here so that we don't redo it for each test
  128. func prepTests() (*UnixParserCtx, EnricherCtx, error) {
  129. var (
  130. err error
  131. pctx *UnixParserCtx
  132. ectx EnricherCtx
  133. )
  134. err = exprhelpers.Init(nil)
  135. if err != nil {
  136. log.Fatalf("exprhelpers init failed: %s", err)
  137. }
  138. //Load enrichment
  139. datadir := "./test_data/"
  140. err = exprhelpers.GeoIPInit(datadir)
  141. if err != nil {
  142. log.Fatalf("unable to initialize GeoIP: %s", err)
  143. }
  144. ectx, err = Loadplugin()
  145. if err != nil {
  146. log.Fatalf("failed to load plugin geoip : %v", err)
  147. }
  148. log.Printf("Loaded -> %+v", ectx)
  149. //Load the parser patterns
  150. cfgdir := "../../config/"
  151. /* this should be refactored to 2 lines :p */
  152. // Init the parser
  153. pctx, err = Init(map[string]interface{}{"patterns": cfgdir + string("/patterns/"), "data": "./tests/"})
  154. if err != nil {
  155. return nil, ectx, fmt.Errorf("failed to initialize parser : %v", err)
  156. }
  157. return pctx, ectx, nil
  158. }
  159. func loadTestFile(file string) []TestFile {
  160. yamlFile, err := os.Open(file)
  161. if err != nil {
  162. log.Fatalf("yamlFile.Get err #%v ", err)
  163. }
  164. dec := yaml.NewDecoder(yamlFile)
  165. dec.SetStrict(true)
  166. var testSet []TestFile
  167. for {
  168. tf := TestFile{}
  169. err := dec.Decode(&tf)
  170. if err != nil {
  171. if errors.Is(err, io.EOF) {
  172. break
  173. }
  174. log.Fatalf("Failed to load testfile '%s' yaml error : %v", file, err)
  175. return nil
  176. }
  177. testSet = append(testSet, tf)
  178. }
  179. return testSet
  180. }
  181. func matchEvent(expected types.Event, out types.Event, debug bool) ([]string, bool) {
  182. var retInfo []string
  183. var valid = false
  184. expectMaps := []map[string]string{expected.Parsed, expected.Meta, expected.Enriched}
  185. outMaps := []map[string]string{out.Parsed, out.Meta, out.Enriched}
  186. outLabels := []string{"Parsed", "Meta", "Enriched"}
  187. //allow to check as well for stage and processed flags
  188. if expected.Stage != "" {
  189. if expected.Stage != out.Stage {
  190. if debug {
  191. retInfo = append(retInfo, fmt.Sprintf("mismatch stage %s != %s", expected.Stage, out.Stage))
  192. }
  193. goto checkFinished
  194. } else {
  195. valid = true
  196. if debug {
  197. retInfo = append(retInfo, fmt.Sprintf("ok stage %s == %s", expected.Stage, out.Stage))
  198. }
  199. }
  200. }
  201. if expected.Process != out.Process {
  202. if debug {
  203. retInfo = append(retInfo, fmt.Sprintf("mismatch process %t != %t", expected.Process, out.Process))
  204. }
  205. goto checkFinished
  206. } else {
  207. valid = true
  208. if debug {
  209. retInfo = append(retInfo, fmt.Sprintf("ok process %t == %t", expected.Process, out.Process))
  210. }
  211. }
  212. if expected.Whitelisted != out.Whitelisted {
  213. if debug {
  214. retInfo = append(retInfo, fmt.Sprintf("mismatch whitelist %t != %t", expected.Whitelisted, out.Whitelisted))
  215. }
  216. goto checkFinished
  217. } else {
  218. if debug {
  219. retInfo = append(retInfo, fmt.Sprintf("ok whitelist %t == %t", expected.Whitelisted, out.Whitelisted))
  220. }
  221. valid = true
  222. }
  223. for mapIdx := 0; mapIdx < len(expectMaps); mapIdx++ {
  224. for expKey, expVal := range expectMaps[mapIdx] {
  225. if outVal, ok := outMaps[mapIdx][expKey]; ok {
  226. if outVal == expVal { //ok entry
  227. if debug {
  228. retInfo = append(retInfo, fmt.Sprintf("ok %s[%s] %s == %s", outLabels[mapIdx], expKey, expVal, outVal))
  229. }
  230. valid = true
  231. } else { //mismatch entry
  232. if debug {
  233. retInfo = append(retInfo, fmt.Sprintf("mismatch %s[%s] %s != %s", outLabels[mapIdx], expKey, expVal, outVal))
  234. }
  235. valid = false
  236. goto checkFinished
  237. }
  238. } else { //missing entry
  239. if debug {
  240. retInfo = append(retInfo, fmt.Sprintf("missing entry %s[%s]", outLabels[mapIdx], expKey))
  241. }
  242. valid = false
  243. goto checkFinished
  244. }
  245. }
  246. }
  247. checkFinished:
  248. if valid {
  249. if debug {
  250. retInfo = append(retInfo, fmt.Sprintf("OK ! \n\t%s", strings.Join(retInfo, "\n\t")))
  251. }
  252. } else {
  253. if debug {
  254. retInfo = append(retInfo, fmt.Sprintf("KO ! \n\t%s", strings.Join(retInfo, "\n\t")))
  255. }
  256. }
  257. return retInfo, valid
  258. }
  259. func testSubSet(testSet TestFile, pctx UnixParserCtx, nodes []Node) (bool, error) {
  260. var results []types.Event
  261. for _, in := range testSet.Lines {
  262. out, err := Parse(pctx, in, nodes)
  263. if err != nil {
  264. log.Errorf("Failed to process %s : %v", spew.Sdump(in), err)
  265. }
  266. //log.Infof("Parser output : %s", spew.Sdump(out))
  267. results = append(results, out)
  268. }
  269. log.Infof("parsed %d lines", len(testSet.Lines))
  270. log.Infof("got %d results", len(results))
  271. /*
  272. check the results we got against the expected ones
  273. only the keys of the expected part are checked against result
  274. */
  275. if len(testSet.Results) == 0 && len(results) == 0 {
  276. log.Fatal("No results, no tests, abort.")
  277. return false, fmt.Errorf("no tests, no results")
  278. }
  279. reCheck:
  280. failinfo := []string{}
  281. for ridx, result := range results {
  282. for eidx, expected := range testSet.Results {
  283. explain, match := matchEvent(expected, result, debug)
  284. if match == true {
  285. log.Infof("expected %d/%d matches result %d/%d", eidx, len(testSet.Results), ridx, len(results))
  286. if len(explain) > 0 {
  287. log.Printf("-> %s", explain[len(explain)-1])
  288. }
  289. //don't do this at home : delete current element from list and redo
  290. results[len(results)-1], results[ridx] = results[ridx], results[len(results)-1]
  291. results = results[:len(results)-1]
  292. testSet.Results[len(testSet.Results)-1], testSet.Results[eidx] = testSet.Results[eidx], testSet.Results[len(testSet.Results)-1]
  293. testSet.Results = testSet.Results[:len(testSet.Results)-1]
  294. goto reCheck
  295. } else {
  296. failinfo = append(failinfo, explain...)
  297. }
  298. }
  299. }
  300. if len(results) > 0 {
  301. log.Printf("Errors : %s", strings.Join(failinfo, " / "))
  302. return false, fmt.Errorf("leftover results : %+v", results)
  303. }
  304. if len(testSet.Results) > 0 {
  305. log.Printf("Errors : %s", strings.Join(failinfo, " / "))
  306. return false, fmt.Errorf("leftover expected results : %+v", testSet.Results)
  307. }
  308. return true, nil
  309. }
  310. func testFile(testSet []TestFile, pctx UnixParserCtx, nodes []Node) bool {
  311. log.Warning("Going to process one test set")
  312. for _, tf := range testSet {
  313. //func testSubSet(testSet TestFile, pctx UnixParserCtx, nodes []Node) (bool, error) {
  314. testOk, err := testSubSet(tf, pctx, nodes)
  315. if err != nil {
  316. log.Fatalf("test failed : %s", err)
  317. }
  318. if !testOk {
  319. log.Fatalf("failed test : %+v", tf)
  320. }
  321. }
  322. return true
  323. }
  324. /*THIS IS ONLY PRESENT TO BE ABLE TO GENERATE DOCUMENTATION OF EXISTING PATTERNS*/
  325. type Pair struct {
  326. Key string
  327. Value string
  328. }
  329. type PairList []Pair
  330. func (p PairList) Len() int { return len(p) }
  331. func (p PairList) Swap(i, j int) { p[i], p[j] = p[j], p[i] }
  332. func (p PairList) Less(i, j int) bool { return len(p[i].Value) < len(p[j].Value) }
  333. func TestGeneratePatternsDoc(t *testing.T) {
  334. if os.Getenv("GO_WANT_TEST_DOC") != "1" {
  335. return
  336. }
  337. pctx, err := Init(map[string]interface{}{"patterns": "../../config/patterns/", "data": "./tests/"})
  338. if err != nil {
  339. t.Fatalf("unable to load patterns : %s", err)
  340. }
  341. log.Infof("-> %s", spew.Sdump(pctx))
  342. /*don't judge me, we do it for the users*/
  343. p := make(PairList, len(pctx.Grok.Patterns))
  344. i := 0
  345. for key, val := range pctx.Grok.Patterns {
  346. p[i] = Pair{key, val}
  347. p[i].Value = strings.ReplaceAll(p[i].Value, "{%{", "\\{\\%\\{")
  348. i++
  349. }
  350. sort.Sort(p)
  351. f, err := os.OpenFile("./patterns-documentation.md", os.O_TRUNC|os.O_CREATE|os.O_WRONLY, 0644)
  352. if err != nil {
  353. t.Fatalf("failed to open : %s", err)
  354. }
  355. if _, err := f.WriteString("# Patterns documentation\n\n"); err != nil {
  356. t.Fatal("failed to write to file")
  357. }
  358. if _, err := f.WriteString("You will find here a generated documentation of all the patterns loaded by crowdsec.\n"); err != nil {
  359. t.Fatal("failed to write to file")
  360. }
  361. if _, err := f.WriteString("They are sorted by pattern length, and are meant to be used in parsers, in the form %{PATTERN_NAME}.\n"); err != nil {
  362. t.Fatal("failed to write to file")
  363. }
  364. if _, err := f.WriteString("\n\n"); err != nil {
  365. t.Fatal("failed to write to file")
  366. }
  367. for _, k := range p {
  368. if _, err := fmt.Fprintf(f, "## %s\n\nPattern :\n```\n%s\n```\n\n", k.Key, k.Value); err != nil {
  369. t.Fatal("failed to write to file")
  370. }
  371. fmt.Printf("%v\t%v\n", k.Key, k.Value)
  372. }
  373. if _, err := f.WriteString("\n"); err != nil {
  374. t.Fatal("failed to write to file")
  375. }
  376. if _, err := f.WriteString("# Documentation generation\n"); err != nil {
  377. t.Fatal("failed to write to file")
  378. }
  379. if _, err := f.WriteString("This documentation is generated by `pkg/parser` : `GO_WANT_TEST_DOC=1 go test -run TestGeneratePatternsDoc`\n"); err != nil {
  380. t.Fatal("failed to write to file")
  381. }
  382. f.Close()
  383. }