# File viewer metadata: 33 lines, 631 B, YAML
# Pipeline definition: three stages, each chained to the previous one through
# its declared outputs (prepare -> featurize -> train).
# NOTE(review): the stages/cmd/deps/params/outs layout matches DVC's dvc.yaml
# schema — confirm the consuming tool and the file name.
stages:
  # Runs src/prepare.py on the raw data/data.xml input.
  prepare:
    cmd: python src/prepare.py data/data.xml
    deps:
      - data/data.xml
      - src/prepare.py
    # NOTE(review): dotted names presumably refer to keys in a separate
    # parameters file (e.g. params.yaml) — verify.
    params:
      - prepare.seed
      - prepare.split
    # The output path is not passed on the command line; presumably the
    # script writes to data/prepared itself — verify against src/prepare.py.
    outs:
      - data/prepared

  # Runs src/featurization.py with data/prepared and data/features as
  # arguments; depends on the output declared by the prepare stage.
  featurize:
    cmd: python src/featurization.py data/prepared data/features
    deps:
      - data/prepared
      - src/featurization.py
    params:
      - featurize.max_features
      - featurize.ngrams
    outs:
      - data/features

  # Runs src/train.py with data/features and model.pkl as arguments; depends
  # on the output declared by the featurize stage.
  train:
    cmd: python src/train.py data/features model.pkl
    deps:
      - data/features
      - src/train.py
    params:
      - train.min_split
      - train.n_est
      - train.seed
    outs:
      - model.pkl