This function is still under development. At this time, you can generate stopword lists in Portuguese and English.

There are many stopword lists available in R, like:

But none of them is categorized in a way that allows finer-grained control of the words by grammatical category.

Choose the language and which grammar tags to use to generate a stopword list. The lang parameter takes the two-letter language code (for example, "en" or "pt"), and the categories parameter designates the grammar categories, following the Penn Treebank tag set. See here

POS Tag Description Example Description
CC coordinating conjunction and
CD cardinal number one, third
DT determiner the
EX existential there there is
PP pronoun me, you, he, she, it, we, they
PPZ possessive pronoun
UH interjection oops!
V verb are be have variations of verbs to be, have,
gen_stopwords()
#>  [1] "e"                "ou"               "mas"              "que"             
#>  [5] "porque"           "por que"          "porquê"           "por quê"         
#>  [9] "se"               "como"             "primeiro"         "segundo"         
#> [13] "terceiro"         "quarto"           "quinto"           "sexto"           
#> [17] "sétimo"           "oitavo"           "nono"             "décimo"          
#> [21] "vigésimo"         "trigésimo"        "quadrigésimo"     "quinquagésimo"   
#> [25] "sexagésimo"       "septuagésimo"     "setuagésimo"      "octogésimo"      
#> [29] "nonagésimo"       "centésimo"        "ducentésimo"      "trecentésimo"    
#> [33] "quadringentésimo" "quingentésimo"    "seiscentésimo"    "sexcentésimo"    
#> [37] "septingentésimo"  "setingentésimo"   "octingentésimo"   "nongentésimo"    
#> [41] "milésimo"         "milionésimo"      "bilionésimo"      "o"               
#> [45] "a"                "os"               "as"
gen_stopwords(lang = "en", categories = "CC")
#> [1] "and" "but" "or"  "for" "yet" "so"
gen_stopwords(lang = "pt", categories = "CC DT")
#>  [1] "e"       "ou"      "mas"     "que"     "porque"  "por que" "porquê" 
#>  [8] "por quê" "se"      "como"    "o"       "a"       "os"      "as"
# several categories can be combined in a single call
gen_stopwords(lang = "en", categories = "CC DT V")
#>  [1] "and"   "but"   "or"    "for"   "yet"   "so"    "a"     "the"   "this" 
#> [10] "am"    "are"   "is"    "be"    "can"   "could" "did"   "do"    "have" 
#> [19] "he"    "it"    "may"   "might" "must"  "need"  "no"    "not"   "now"  
#> [28] "of"    "on"    "she"   "that"  "to"    "was"   "were"

gen_stopwords(lang = "pt")
#>  [1] "e"                "ou"               "mas"              "que"             
#>  [5] "porque"           "por que"          "porquê"           "por quê"         
#>  [9] "se"               "como"             "primeiro"         "segundo"         
#> [13] "terceiro"         "quarto"           "quinto"           "sexto"           
#> [17] "sétimo"           "oitavo"           "nono"             "décimo"          
#> [21] "vigésimo"         "trigésimo"        "quadrigésimo"     "quinquagésimo"   
#> [25] "sexagésimo"       "septuagésimo"     "setuagésimo"      "octogésimo"      
#> [29] "nonagésimo"       "centésimo"        "ducentésimo"      "trecentésimo"    
#> [33] "quadringentésimo" "quingentésimo"    "seiscentésimo"    "sexcentésimo"    
#> [37] "septingentésimo"  "setingentésimo"   "octingentésimo"   "nongentésimo"    
#> [41] "milésimo"         "milionésimo"      "bilionésimo"      "o"               
#> [45] "a"                "os"               "as"
gen_stopwords(lang = "pt", categories = "V")
#>   [1] "ser"        "sou"        "sois"       "é"          "és"        
#>   [6] "somos"      "são"        "era"        "eram"       "éramos"    
#>  [11] "serei"      "será"       "serão"      "serás"      "fui"       
#>  [16] "foste"      "foi"        "fomos"      "fostes"     "foram"     
#>  [21] "eras"       "éreis"      "seremos"    "sereis"     "seja"      
#>  [26] "sejam"      "estar"      "estou"      "estás"      "está"      
#>  [31] "estamos"    "estais"     "estão"      "estive"     "estiveste" 
#>  [36] "esteve"     "estivemos"  "estivestes" "estiveram"  "estava"    
#>  [41] "estavas"    "estávamos"  "estáveis"   "estavam"    "estarei"   
#>  [46] "estarás"    "estará"     "estaremos"  "estareis"   "estarão"   
#>  [51] "esteja"     "estejam"    "ter"        "tenham"     "têem"      
#>  [56] "tenho"      "tens"       "tem"        "temos"      "tendes"    
#>  [61] "têm"        "tive"       "tiveste"    "teve"       "tivemos"   
#>  [66] "tivestes"   "tiveram"    "tinha"      "tinhas"     "tínhamos"  
#>  [71] "tínheis"    "tinham"     "terei"      "terás"      "terá"      
#>  [76] "teremos"    "tereis"     "terão"      "teria"      "teriam"    
#>  [81] "haver"      "houve"      "haveria"    "haveriam"   "hei"       
#>  [86] "hás"        "há"         "havemos"    "haveis"     "hão"       
#>  [91] "houver"     "houveres"   "houvermos"  "houverdes"  "houverem"  
#>  [96] "havia"      "havias"     "havíamos"   "havíeis"    "haviam"    
#> [101] "haverei"    "haverás"    "haverá"     "haveremos"  "havereis"  
#> [106] "haverão"    "haja"       "hajam"      "houvera"    "houveram"  
#> [111] "houvesse"   "ir"         "vou"        "vai"        "vais"      
#> [116] "vamos"

With the vec parameter, it is possible to have three different output formats: list, vector (default) and named vector.

gen_stopwords(lang = "pt", categories = "V", vec = "list")
#> $V
#> $V$ser
#>  [1] "ser"     "sou"     "sois"    "é"       "és"      "somos"   "sois"   
#>  [8] "são"     "era"     "eram"    "éramos"  "serei"   "será"    "serão"  
#> [15] "serás"   "fui"     "foste"   "foi"     "fomos"   "fostes"  "foram"  
#> [22] "era"     "eras"    "era"     "éramos"  "éreis"   "eram"    "serei"  
#> [29] "serás"   "será"    "seremos" "sereis"  "serão"   "seja"    "sejam"  
#> 
#> $V$estar
#>  [1] "estar"      "estou"      "estás"      "está"       "estamos"   
#>  [6] "estais"     "estão"      "estive"     "estiveste"  "esteve"    
#> [11] "estivemos"  "estivestes" "estiveram"  "estava"     "estavas"   
#> [16] "estava"     "estávamos"  "estáveis"   "estavam"    "estarei"   
#> [21] "estarás"    "estará"     "estaremos"  "estareis"   "estarão"   
#> [26] "esteja"     "estejam"   
#> 
#> $V$ter
#>  [1] "ter"      "tenham"   "têem"     "tenho"    "tens"     "tem"     
#>  [7] "temos"    "tendes"   "têm"      "tive"     "tiveste"  "teve"    
#> [13] "tivemos"  "tivestes" "tiveram"  "tinha"    "tinhas"   "tinha"   
#> [19] "tínhamos" "tínheis"  "tinham"   "terei"    "terás"    "terá"    
#> [25] "teremos"  "tereis"   "terão"    "teria"    "teriam"  
#> 
#> $V$haver
#>  [1] "haver"     "houve"     "haveria"   "haveriam"  "hei"       "hás"      
#>  [7] "há"        "havemos"   "haveis"    "hão"       "houver"    "houveres" 
#> [13] "houver"    "houvermos" "houverdes" "houverem"  "havia"     "havias"   
#> [19] "havia"     "havíamos"  "havíeis"   "haviam"    "haverei"   "haverás"  
#> [25] "haverá"    "haveremos" "havereis"  "haverão"   "haja"      "hajam"    
#> [31] "houvera"   "houveram"  "houvesse" 
#> 
#> $V$ir
#> [1] "ir"    "vou"   "vai"   "vais"  "vamos" "fui"   "foi"   "fomos"
#> 
#> 
#> $<NA>
#> NULL
gen_stopwords(lang = "pt", categories = "V", vec = "vec")
#>   [1] "ser"        "sou"        "sois"       "é"          "és"        
#>   [6] "somos"      "são"        "era"        "eram"       "éramos"    
#>  [11] "serei"      "será"       "serão"      "serás"      "fui"       
#>  [16] "foste"      "foi"        "fomos"      "fostes"     "foram"     
#>  [21] "eras"       "éreis"      "seremos"    "sereis"     "seja"      
#>  [26] "sejam"      "estar"      "estou"      "estás"      "está"      
#>  [31] "estamos"    "estais"     "estão"      "estive"     "estiveste" 
#>  [36] "esteve"     "estivemos"  "estivestes" "estiveram"  "estava"    
#>  [41] "estavas"    "estávamos"  "estáveis"   "estavam"    "estarei"   
#>  [46] "estarás"    "estará"     "estaremos"  "estareis"   "estarão"   
#>  [51] "esteja"     "estejam"    "ter"        "tenham"     "têem"      
#>  [56] "tenho"      "tens"       "tem"        "temos"      "tendes"    
#>  [61] "têm"        "tive"       "tiveste"    "teve"       "tivemos"   
#>  [66] "tivestes"   "tiveram"    "tinha"      "tinhas"     "tínhamos"  
#>  [71] "tínheis"    "tinham"     "terei"      "terás"      "terá"      
#>  [76] "teremos"    "tereis"     "terão"      "teria"      "teriam"    
#>  [81] "haver"      "houve"      "haveria"    "haveriam"   "hei"       
#>  [86] "hás"        "há"         "havemos"    "haveis"     "hão"       
#>  [91] "houver"     "houveres"   "houvermos"  "houverdes"  "houverem"  
#>  [96] "havia"      "havias"     "havíamos"   "havíeis"    "haviam"    
#> [101] "haverei"    "haverás"    "haverá"     "haveremos"  "havereis"  
#> [106] "haverão"    "haja"       "hajam"      "houvera"    "houveram"  
#> [111] "houvesse"   "ir"         "vou"        "vai"        "vais"      
#> [116] "vamos"
gen_stopwords(lang = "pt", categories = "V", vec = "n_vec")
#>       V.ser1       V.ser2       V.ser3       V.ser4       V.ser5       V.ser6 
#>        "ser"        "sou"       "sois"          "é"         "és"      "somos" 
#>       V.ser7       V.ser8       V.ser9      V.ser10      V.ser11      V.ser12 
#>       "sois"        "são"        "era"       "eram"     "éramos"      "serei" 
#>      V.ser13      V.ser14      V.ser15      V.ser16      V.ser17      V.ser18 
#>       "será"      "serão"      "serás"        "fui"      "foste"        "foi" 
#>      V.ser19      V.ser20      V.ser21      V.ser22      V.ser23      V.ser24 
#>      "fomos"     "fostes"      "foram"        "era"       "eras"        "era" 
#>      V.ser25      V.ser26      V.ser27      V.ser28      V.ser29      V.ser30 
#>     "éramos"      "éreis"       "eram"      "serei"      "serás"       "será" 
#>      V.ser31      V.ser32      V.ser33      V.ser34      V.ser35     V.estar1 
#>    "seremos"     "sereis"      "serão"       "seja"      "sejam"      "estar" 
#>     V.estar2     V.estar3     V.estar4     V.estar5     V.estar6     V.estar7 
#>      "estou"      "estás"       "está"    "estamos"     "estais"      "estão" 
#>     V.estar8     V.estar9    V.estar10    V.estar11    V.estar12    V.estar13 
#>     "estive"  "estiveste"     "esteve"  "estivemos" "estivestes"  "estiveram" 
#>    V.estar14    V.estar15    V.estar16    V.estar17    V.estar18    V.estar19 
#>     "estava"    "estavas"     "estava"  "estávamos"   "estáveis"    "estavam" 
#>    V.estar20    V.estar21    V.estar22    V.estar23    V.estar24    V.estar25 
#>    "estarei"    "estarás"     "estará"  "estaremos"   "estareis"    "estarão" 
#>    V.estar26    V.estar27       V.ter1       V.ter2       V.ter3       V.ter4 
#>     "esteja"    "estejam"        "ter"     "tenham"       "têem"      "tenho" 
#>       V.ter5       V.ter6       V.ter7       V.ter8       V.ter9      V.ter10 
#>       "tens"        "tem"      "temos"     "tendes"        "têm"       "tive" 
#>      V.ter11      V.ter12      V.ter13      V.ter14      V.ter15      V.ter16 
#>    "tiveste"       "teve"    "tivemos"   "tivestes"    "tiveram"      "tinha" 
#>      V.ter17      V.ter18      V.ter19      V.ter20      V.ter21      V.ter22 
#>     "tinhas"      "tinha"   "tínhamos"    "tínheis"     "tinham"      "terei" 
#>      V.ter23      V.ter24      V.ter25      V.ter26      V.ter27      V.ter28 
#>      "terás"       "terá"    "teremos"     "tereis"      "terão"      "teria" 
#>      V.ter29     V.haver1     V.haver2     V.haver3     V.haver4     V.haver5 
#>     "teriam"      "haver"      "houve"    "haveria"   "haveriam"        "hei" 
#>     V.haver6     V.haver7     V.haver8     V.haver9    V.haver10    V.haver11 
#>        "hás"         "há"    "havemos"     "haveis"        "hão"     "houver" 
#>    V.haver12    V.haver13    V.haver14    V.haver15    V.haver16    V.haver17 
#>   "houveres"     "houver"  "houvermos"  "houverdes"   "houverem"      "havia" 
#>    V.haver18    V.haver19    V.haver20    V.haver21    V.haver22    V.haver23 
#>     "havias"      "havia"   "havíamos"    "havíeis"     "haviam"    "haverei" 
#>    V.haver24    V.haver25    V.haver26    V.haver27    V.haver28    V.haver29 
#>    "haverás"     "haverá"  "haveremos"   "havereis"    "haverão"       "haja" 
#>    V.haver30    V.haver31    V.haver32    V.haver33        V.ir1        V.ir2 
#>      "hajam"    "houvera"   "houveram"   "houvesse"         "ir"        "vou" 
#>        V.ir3        V.ir4        V.ir5        V.ir6        V.ir7        V.ir8 
#>        "vai"       "vais"      "vamos"        "fui"        "foi"      "fomos"

To use only certain kinds of verbs, like only the variations/conjugations of the Portuguese verb ser:

my_sw <- gen_stopwords("pt", "V", vec = "list")
my_sw$V$ser
#>  [1] "ser"     "sou"     "sois"    "é"       "és"      "somos"   "sois"   
#>  [8] "são"     "era"     "eram"    "éramos"  "serei"   "será"    "serão"  
#> [15] "serás"   "fui"     "foste"   "foi"     "fomos"   "fostes"  "foram"  
#> [22] "era"     "eras"    "era"     "éramos"  "éreis"   "eram"    "serei"  
#> [29] "serás"   "será"    "seremos" "sereis"  "serão"   "seja"    "sejam"
# or shorter
gen_stopwords("pt", "V", vec = "list")$V$ser
#>  [1] "ser"     "sou"     "sois"    "é"       "és"      "somos"   "sois"   
#>  [8] "são"     "era"     "eram"    "éramos"  "serei"   "será"    "serão"  
#> [15] "serás"   "fui"     "foste"   "foi"     "fomos"   "fostes"  "foram"  
#> [22] "era"     "eras"    "era"     "éramos"  "éreis"   "eram"    "serei"  
#> [29] "serás"   "será"    "seremos" "sereis"  "serão"   "seja"    "sejam"

It is possible to add new words to the stopwords in two ways:

gen_stopwords("en", "CC", add = c("word1", "word2"))
#> [1] "and"   "but"   "or"    "for"   "yet"   "so"    "word1" "word2"
gen_stopwords("en", "CC", add = s2v("word1 word2 word3"))
#> [1] "and"   "but"   "or"    "for"   "yet"   "so"    "word1" "word2" "word3"

To see all the categories and their respective terms, run the following code:

show_sw("en")
#> $IN
#> [1] "of"  "for" "in"  "by" 
#> 
#> $DT
#> [1] "a"    "the"  "this"
#> 
#> $CC
#> [1] "and" "but" "or"  "for" "yet" "so" 
#> 
#> $CD
#>  [1] "zero"    "one"     "two"     "three"   "four"    "five"    "first"  
#>  [8] "second"  "third"   "fourth"  "fifth"   "sixth"   "seventh" "eighth" 
#> [15] "ninth"   "tenth"  
#> 
#> $JJ
#> [1] "blue"  "happy" "sad"  
#> 
#> $JJR
#> [1] "bluer"   "happier"
#> 
#> $JJS
#> [1] "bluest"   "happiest"
#> 
#> $MD
#> [1] "could" "will" 
#> 
#> $PP
#> [1] "I"   "you" "he"  "she" "it"  "we" 
#> 
#> $PRP
#> [1] "I"    "you"  "he"   "she"  "we"   "us"   "they"
#> 
#> $PPZ
#> [1] "your" "my"   "mine" "ours" "his"  "her" 
#> 
#> $RB
#> [1] "however"   "usually"   "naturally" "here"      "good"     
#> 
#> $RBR
#> [1] "better"
#> 
#> $UH
#> [1] "aha" "uhu"
#> 
#> $RP
#> [1] "up"  "off"
#> 
#> $V
#>  [1] "am"    "are"   "is"    "be"    "can"   "could" "did"   "do"    "have" 
#> [10] "he"    "is"    "it"    "may"   "might" "must"  "need"  "no"    "not"  
#> [19] "now"   "of"    "on"    "or"    "she"   "that"  "the"   "to"    "was"  
#> [28] "were" 
#> 
#> $question
#> [1] "what"  "when"  "where" "who"   "whom"  "why"   "how"   "would" "could"
#> 
#> $conclusion
#> [1] "because"     "therefore"   "furthermore" "so"         
#> 
#> $time
#> $time$month
#>  [1] "January"   "February"  "March"     "April"     "May"       "June"     
#>  [7] "July"      "August"    "September" "October"   "November"  "December" 
#> 
#> $time$time
#>  [1] "today"     "tomorrow"  "yesterday" "now"       "later"     "sooner"   
#>  [7] "during"    "after"     "before"    "meanwhile"
#> 
#> 
#> $PT
#> [1] "Mr."   "Mrs."  "Miss"  "Ms."   "Sir"   "Madam" "Dr."   "Prof."
#> 
#> $`non-classified-yet`
#>  [1] "if"            "at"            "as"            "like"         
#>  [5] "there"         "these"         "all"           "some"         
#>  [9] "most"          "many"          "more"          "few"          
#> [13] "such"          "let"           "even"          "according"    
#> [17] "with"          "since"         "our"           "put"          
#> [21] "over"          "you've"        "we've"         "they'd"       
#> [25] "i'd"           "you'd"         "he'd"          "she'd"        
#> [29] "we'd"          "they'dfmyself" "ourselves"     "yours"        
#> [33] "yourself"      "yourselves"    "him"           "himself"      
#> 
#> $added
#> character(0)
show_sw("en", as_vector = TRUE)
#>   [1] "a"             "according"     "after"         "aha"          
#>   [5] "all"           "am"            "and"           "April"        
#>   [9] "are"           "as"            "at"            "August"       
#>  [13] "be"            "because"       "before"        "better"       
#>  [17] "blue"          "bluer"         "bluest"        "but"          
#>  [21] "by"            "can"           "could"         "December"     
#>  [25] "did"           "do"            "Dr."           "during"       
#>  [29] "eighth"        "even"          "February"      "few"          
#>  [33] "fifth"         "first"         "five"          "for"          
#>  [37] "four"          "fourth"        "furthermore"   "good"         
#>  [41] "happier"       "happiest"      "happy"         "have"         
#>  [45] "he"            "he'd"          "her"           "here"         
#>  [49] "him"           "himself"       "his"           "how"          
#>  [53] "however"       "I"             "i'd"           "if"           
#>  [57] "in"            "is"            "it"            "January"      
#>  [61] "July"          "June"          "later"         "let"          
#>  [65] "like"          "Madam"         "many"          "March"        
#>  [69] "may"           "May"           "meanwhile"     "might"        
#>  [73] "mine"          "Miss"          "more"          "most"         
#>  [77] "Mr."           "Mrs."          "Ms."           "must"         
#>  [81] "my"            "naturally"     "need"          "ninth"        
#>  [85] "no"            "not"           "November"      "now"          
#>  [89] "October"       "of"            "off"           "on"           
#>  [93] "one"           "or"            "our"           "ours"         
#>  [97] "ourselves"     "over"          "Prof."         "put"          
#> [101] "sad"           "second"        "September"     "seventh"      
#> [105] "she"           "she'd"         "since"         "Sir"          
#> [109] "sixth"         "so"            "some"          "sooner"       
#> [113] "such"          "tenth"         "that"          "the"          
#> [117] "there"         "therefore"     "these"         "they"         
#> [121] "they'd"        "they'dfmyself" "third"         "this"         
#> [125] "three"         "to"            "today"         "tomorrow"     
#> [129] "two"           "uhu"           "up"            "us"           
#> [133] "usually"       "was"           "we"            "we'd"         
#> [137] "we've"         "were"          "what"          "when"         
#> [141] "where"         "who"           "whom"          "why"          
#> [145] "will"          "with"          "would"         "yesterday"    
#> [149] "yet"           "you"           "you'd"         "you've"       
#> [153] "your"          "yours"         "yourself"      "yourselves"   
#> [157] "zero"
show_sw("pt", as_vector = TRUE)
#>   [1] "a"                "à"                "agora"           
#>   [4] "ah"               "ai"               "além"            
#>   [7] "algum"            "alguma"           "algumas"         
#>  [10] "alguns"           "ambos"            "ao"              
#>  [13] "após"             "aquela"           "aquelas"         
#>  [16] "aquele"           "aqueles"          "aqui"            
#>  [19] "as"               "assim"            "bilionésimo"     
#>  [22] "bosta"            "cabe"             "caralho"         
#>  [25] "caramba"          "cem"              "centésimo"       
#>  [28] "cinco"            "cinquenta"        "clique"          
#>  [31] "cocô"             "com"              "como"            
#>  [34] "concluindo"       "Conclusão"        "conosco"         
#>  [37] "consectário"      "consequentemente" "consigo"         
#>  [40] "convosco"         "credo"            "da"              
#>  [43] "das"              "de"               "décimo"          
#>  [46] "decorre"          "dela"             "delas"           
#>  [49] "dele"             "deles"            "depreende-se"    
#>  [52] "desde"            "desse modo"       "dez"             
#>  [55] "dezenove"         "dezesseis"        "dezessete"       
#>  [58] "dezoito"          "diante"           "do"              
#>  [61] "dois"             "dos"              "Doutor"          
#>  [64] "Doutora"          "Doutores"         "doze"            
#>  [67] "Dr."              "Dra."             "duas"            
#>  [70] "ducentésimo"      "duzentos"         "e"               
#>  [73] "é"                "eh"               "ei"              
#>  [76] "ela"              "elas"             "ele"             
#>  [79] "eles"             "em"               "em suma"         
#>  [82] "em vista disso"   "embora"           "enfim"           
#>  [85] "enquanto"         "então"            "entenda"         
#>  [88] "entre"            "era"              "eram"            
#>  [91] "éramos"           "eras"             "éreis"           
#>  [94] "és"               "essa"             "essas"           
#>  [97] "esse"             "esses"            "esta"            
#> [100] "está"             "estais"           "estamos"         
#> [103] "estão"            "estar"            "estará"          
#> [106] "estarão"          "estarás"          "estarei"         
#> [109] "estareis"         "estaremos"        "estas"           
#> [112] "estás"            "estava"           "estavam"         
#> [115] "estávamos"        "estavas"          "estáveis"        
#> [118] "este"             "esteja"           "estejam"         
#> [121] "estes"            "esteve"           "estive"          
#> [124] "estivemos"        "estiveram"        "estiveste"       
#> [127] "estivestes"       "estou"            "eu"              
#> [130] "Excelentíssima"   "Excelentíssimo"   "Excelentíssimos" 
#> [133] "Exmo."            "Exmos."           "finalmente"      
#> [136] "fiu"              "foi"              "fomos"           
#> [139] "foram"            "foste"            "fostes"          
#> [142] "fui"              "há"               "haja"            
#> [145] "hajam"            "hão"              "hás"             
#> [148] "haveis"           "havemos"          "haver"           
#> [151] "haverá"           "haverão"          "haverás"         
#> [154] "haverei"          "havereis"         "haveremos"       
#> [157] "haveria"          "haveriam"         "havia"           
#> [160] "haviam"           "havíamos"         "havias"          
#> [163] "havíeis"          "hei"              "hoje"            
#> [166] "houve"            "houver"           "houvera"         
#> [169] "houveram"         "houverdes"        "houverem"        
#> [172] "houveres"         "houvermos"        "houvesse"        
#> [175] "ir"               "isso"             "isto"            
#> [178] "lhe"              "logo"             "mais"            
#> [181] "mas"              "me"               "meo"             
#> [184] "merda"            "mesmo"            "meu"             
#> [187] "milésimo"         "milionésimo"      "mim"             
#> [190] "na"               "não"              "naquela"         
#> [193] "naquelas"         "naquele"          "naqueles"        
#> [196] "né"               "neh"              "nessa"           
#> [199] "nessas"           "nesse"            "nesses"          
#> [202] "nesta"            "nestas"           "neste"           
#> [205] "nestes"           "nisso"            "nisto"           
#> [208] "no"               "nonagésimo"       "nongentésimo"    
#> [211] "nono"             "nos"              "nós"             
#> [214] "nossa"            "nossas"           "nosso"           
#> [217] "nossos"           "nove"             "noventa"         
#> [220] "o"                "octingentésimo"   "octogésimo"      
#> [223] "oh"               "oitavo"           "oitenta"         
#> [226] "oito"             "onze"             "opa"             
#> [229] "os"               "ou"               "ou seja"         
#> [232] "para"             "passo"            "pois"            
#> [235] "por"              "por isso"         "por que"         
#> [238] "por quê"          "porque"           "porquê"          
#> [241] "porra"            "portanto"         "pqp"             
#> [244] "primeiro"         "psiu"             "quadrigésimo"    
#> [247] "quadringentésimo" "qual"             "quando"          
#> [250] "quarenta"         "quarto"           "quatorze"        
#> [253] "quatro"           "que"              "quem"            
#> [256] "quingentésimo"    "quinquagésimo"    "quinto"          
#> [259] "quinze"           "Rev.ma"           "são"             
#> [262] "se"               "segue-se"         "segundo"         
#> [265] "seis"             "seiscentésimo"    "seja"            
#> [268] "sejam"            "sem"              "Senhor"          
#> [271] "Senhoras"         "Senhores"         "septingentésimo" 
#> [274] "septuagésimo"     "ser"              "será"            
#> [277] "serão"            "serás"            "serei"           
#> [280] "sereis"           "seremos"          "sessenta"        
#> [283] "sete"             "setenta"          "sétimo"          
#> [286] "setingentésimo"   "setuagésimo"      "seu"             
#> [289] "sexagésimo"       "sexcentésimo"     "sexto"           
#> [292] "si"               "sobre"            "sois"            
#> [295] "somos"            "sou"              "Sr."             
#> [298] "Sra."             "sua"              "também"          
#> [301] "te"               "têem"             "tem"             
#> [304] "têm"              "temos"            "tendes"          
#> [307] "tenham"           "tenho"            "tens"            
#> [310] "ter"              "terá"             "terão"           
#> [313] "terás"            "terceiro"         "terei"           
#> [316] "tereis"           "teremos"          "teria"           
#> [319] "teriam"           "teu"              "teve"            
#> [322] "ti"               "tinha"            "tinham"          
#> [325] "tínhamos"         "tinhas"           "tínheis"         
#> [328] "tive"             "tivemos"          "tiveram"         
#> [331] "tiveste"          "tivestes"         "todos"           
#> [334] "trecentésimo"     "tres"             "três"            
#> [337] "treze"            "trezentos"        "trigésimo"       
#> [340] "trinta"           "tu"               "uhu"             
#> [343] "ui"               "um"               "uma"             
#> [346] "uou"              "use"              "V.A."            
#> [349] "V.Ex."            "V.Ex.a"           "V.Ex.as"         
#> [352] "V.Mag"            "V.S."             "V.S.a"           
#> [355] "vai"              "vais"             "vamos"           
#> [358] "veja"             "vigésimo"         "vinte"           
#> [361] "você"             "vocês"            "vos"             
#> [364] "vós"              "vou"              "vtnc"            
#> [367] "VV.AA."           "wow"