Newer
Older
"python create_corpus_before_lang.py"
rule corpus_iramuteq:
    """Build the corpus under data/corpus_iramuteq/ from data/preprocessed/."""
    # Snakemake tracks the whole preprocessed directory as the dependency.
    input:
        "data/preprocessed/"
    # Declared with directory() so the output is tracked as a directory
    # rather than as a single file.
    output:
        directory("data/corpus_iramuteq/")
    # The command line never mentions the output directory; presumably
    # create_corpus.py derives it from the `-m iramuteq` mode -- TODO confirm.
    shell:
        "python create_corpus.py -t themes.json -d data/preprocessed/ -m iramuteq"
rule corpus_cortex:
    """Build the corpus under data/corpus_cortex/ from data/preprocessed/."""
    # Snakemake tracks the whole preprocessed directory as the dependency.
    input:
        "data/preprocessed/"
    # Declared with directory() so the output is tracked as a directory
    # rather than as a single file.
    output:
        directory("data/corpus_cortex/")
    # NOTE(review): the rule name and output directory are spelled "cortex"
    # while the mode flag passed to the script is "cortext" -- confirm which
    # spelling create_corpus.py uses for the directory it actually writes.
    shell:
        "python create_corpus.py -t themes.json -d data/preprocessed/ -m cortext"
# Rule "preprocess": the visible shell section names preprocess.py and
# parse_docs.py.
# NOTE(review): no entries are visible under `input:` in this view, and no
# `output:` section is shown -- confirm against the full file.
# NOTE(review): the two adjacent string literals below have no separator. If
# both really belong to this shell section they are joined into one command
# string with no space between them; they may instead be two versions of the
# same line, or parse_docs.py may belong to a rule whose header is not
# visible here -- confirm and keep only the intended command(s).
rule preprocess:
input:
shell:
"python preprocess.py"
"python parse_docs.py"
# Rule "download".
# NOTE(review): no output entries and no shell/run section are visible for
# this rule in this view -- confirm against the full file before relying on it.
rule download:
output:
rule clean:
    """Delete the docs, txts and preprocessed directories."""
    # No input/output sections are declared: the rule only runs when it is
    # requested explicitly as a target.
    # NOTE(review): these paths are relative to the working directory and carry
    # no "data/" prefix, whereas the corpus rules read "data/preprocessed/" --
    # confirm that the directories removed here are the ones the pipeline uses.
    shell:
        "rm -rf docs txts preprocessed"