import TokenTransformingMixins from 'causal-net/packages/causality-preprocessing/src/NLP/tokenTransforming.mixins.js'

public class | source

TokenTransformingMixins

PreprocessingClass → TokenTransformingMixins

Method Summary

Public Methods
public	badWordsFilter(tokens: Array , badWordList: Array ): Array Remove bad words from tokens
public	tokenize(sentence: String ): Array tokenized sentence
public	wordDuplicateRemove(tokens: Array ): * Remove duplicated tokens
public	wordFreqCount(tokens: Array , freqCount: Object ): Object Count the number of appearances of each token in the token list

Remove bad words from tokens

Array

tokens without bad words

tokenized sentence

Name	Type	Attribute	Description
sentence	String		the sentence string to tokenize

Array

array of tokenized sentences

Remove duplicated tokens

Name	Type	Attribute	Description
tokens	Array		array of string token

Count the number of appearances of each token in the token list

Name	Type	Attribute	Description
tokens	Array		array of string tokens
freqCount	Object	optional default: {}	object returned by a previous wordFreqCount call; an empty object is used if not provided

Object

JSON object with each token as a key and its count as the corresponding value