pub fn TokenizeContent(content: &str) -> Vec<String>
Tokenizes content for indexing, with improved word-boundary handling.