| 64 | } |
| 65 | |
| 66 | func (d *Drain) Train(content string) *LogCluster { |
| 67 | d.tokenBuffer = d.tokenizer.Tokenize(content, d.tokenBuffer) |
| 68 | if len(d.tokenBuffer) == 0 { |
| 69 | return nil |
| 70 | } |
| 71 | |
| 72 | if len(d.tokenBuffer) < d.config.MinTokens { |
| 73 | d.metrics.LinesSkippedTooFewTokens.Inc() |
| 74 | return nil |
| 75 | } |
| 76 | if len(d.tokenBuffer) > d.config.MaxTokens { |
| 77 | d.metrics.LinesSkippedTooManyTokens.Inc() |
| 78 | return nil |
| 79 | } |
| 80 | d.metrics.TokensPerLine.Observe(float64(len(d.tokenBuffer))) |
| 81 | |
| 82 | return d.train(d.tokenBuffer) |
| 83 | } |
| 84 | |
| 85 | func (d *Drain) newCluster(tokens []string) *LogCluster { |
| 86 | d.clustersCounter++ |