pipeline defined

This commit is contained in:
2026-03-14 21:44:33 +08:00
parent b77c37cfa5
commit 620d1dfb2d
4 changed files with 58 additions and 0 deletions

32
dvc.yaml Normal file
View File

@@ -0,0 +1,32 @@
# DVC pipeline definition.
#
# Three stages chained through their declared outputs:
#   prepare -> featurize -> train
# Each stage lists the command to run (cmd), the files whose changes
# invalidate the stage (deps), the parameter keys it depends on (params),
# and the artifacts it produces (outs).
#
# The params entries name no file, so DVC resolves them from its default
# parameters file (params.yaml).
stages:
  # Runs src/prepare.py on data/data.xml.
  # NOTE(review): the output path data/prepared is not passed on the command
  # line; presumably src/prepare.py writes it itself - confirm.
  prepare:
    cmd: python src/prepare.py data/data.xml
    deps:
      - data/data.xml
      - src/prepare.py
    params:
      - prepare.seed
      - prepare.split
    outs:
      - data/prepared

  # Consumes the prepare stage's output (data/prepared) and produces
  # data/features; both paths are passed to the script as arguments.
  featurize:
    cmd: python src/featurization.py data/prepared data/features
    deps:
      - data/prepared
      - src/featurization.py
    params:
      - featurize.max_features
      - featurize.ngrams
    outs:
      - data/features

  # Consumes the featurize stage's output (data/features) and produces
  # model.pkl; both paths are passed to the script as arguments.
  train:
    cmd: python src/train.py data/features model.pkl
    deps:
      - data/features
      - src/train.py
    params:
      - train.min_split
      - train.n_est
      - train.seed
    outs:
      - model.pkl