Effective tokenization is all about handling sentences that contain features beyond words and punctuation, such as e-mails, mentions, emojis, emoticons, hashtags, URLs and more! Here is an example:
// Pull in the wink-tokenizer module.
var winkTokenize = require( 'wink-tokenizer' );
// Create a tokenizer instance and keep a reference to its tokenize function.
var tokenize = winkTokenize().tokenize;
// Sample sentence mixing a mention, an emoji, hashtags, quoted text, an emoticon,
// an e-mail address and a URL. It is assembled from two literals so that no
// backslash line continuation is needed; the resulting string is unchanged.
var s = '@FeminismInIndia👧 conducted a workshop at #AmbedkarUniversity on "online safety" ' +
  'recently:-)! reach us at firstname.lastname@example.org. #DigitalSaftey http://bit.ly/2F2m9rL';
// Print the result: besides being split out, every token is tagged with its identified feature.
console.log( tokenize( s ) );