-
Notifications
You must be signed in to change notification settings - Fork 14
/
_pkgdown.yml
64 lines (62 loc) · 1.39 KB
/
_pkgdown.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
# Public address of the rendered documentation site.
url: https://textrecipes.tidymodels.org

# Site theming: shared tidymodels template package on Bootstrap 5.
template:
  package: tidytemplate
  bootstrap: 5
  bslib:
    # Quoted because a leading `#` would otherwise start a YAML comment.
    primary: "#CA225E"
  includes:
    # Extra HTML for the page header: loads the Plausible analytics script,
    # reporting to both the package domain and all.tidymodels.org.
    in_header: |
      <script defer data-domain="textrecipes.tidymodels.org,all.tidymodels.org" src="https://plausible.io/js/plausible.js"></script>
# Development-mode setting for the site; `auto` leaves the choice of
# release vs. development site to pkgdown.
development:
  mode: auto
# Layout of the function reference index. Each entry is one titled section;
# `contents` lists the help topics shown under that title, in order.
reference:
  - title: Step Functions - Tokenization
    contents:
      - step_tokenize
      - step_tokenize_bpe
      - step_tokenize_sentencepiece
      - step_tokenize_wordpiece

  - title: Step Functions - Un-Tokenization
    contents:
      - step_untokenize

  - title: Step Functions - Token Modification
    contents:
      - step_lemma
      - step_ngram
      - step_pos_filter
      - step_stem
      - step_stopwords
      - step_tokenfilter
      - step_tokenmerge

  - title: Step Functions - Numeric Variables From Tokens
    contents:
      - step_lda
      - step_texthash
      - step_tf
      - step_tfidf
      - step_word_embeddings

  - title: Step Functions - Numeric Variables From Characters
    contents:
      - step_dummy_hash
      - step_sequence_onehot
      - step_textfeature

  - title: Step Functions - Text Normalization
    contents:
      - step_text_normalization

  - title: Step Functions - Text Cleaning
    contents:
      - step_clean_levels
      - step_clean_names

  - title: Token Functions
    contents:
      - tokenlist
      - show_tokens

  - title: Selectors
    contents:
      - all_tokenized

  - title: Count Functions
    contents:
      - count_functions

  - title: Data Sets
    contents:
      - emoji_samples