/**
 * Split a string into word tokens.
 *
 * The text is cut at every run of one or more delimiter characters
 * (space, `?`, `!`, `,`, `.`). Delimiters are discarded, and only pieces
 * longer than one character are kept, so empty pieces and single-character
 * tokens such as "a" or "I" are dropped.
 *
 * @param {string} text - The text to tokenize.
 * @returns {string[]} The retained tokens, in their original order.
 */
function tokenize(text) {
  // Runs of delimiters count as one separator. No capturing group is used,
  // so split() never places the separators themselves into the result.
  var delimiterRE = /[ \?!,\.]+/;

  // Threshold carried over from the original `length > 1` condition.
  var minLength = 2;

  return text.split(delimiterRE).filter(function (piece) {
    // Also removes the empty strings split() yields when the text starts
    // or ends with a delimiter.
    return piece.length >= minLength;
  });
}