* @package LanguageDetection */ class WhitespaceTokenizer implements TokenizerInterface { /** * @param string $str * @return array */ public function tokenize(string $str): array { return \array_map(function ($word) { return "_{$word}_"; }, \preg_split('/[^\pL]+(?