diff --git a/fra_wikipedia_2021_10K-sentences.txt b/corpus/fra_wikipedia_2021_10K-sentences.txt similarity index 100% rename from fra_wikipedia_2021_10K-sentences.txt rename to corpus/fra_wikipedia_2021_10K-sentences.txt diff --git a/markov.py b/markov.py index c90608a..8af36bd 100755 --- a/markov.py +++ b/markov.py @@ -1,11 +1,11 @@ from collections import defaultdict -from random import choice, randrange +from pathlib import Path +from random import choice + suivants = defaultdict(list) -for path in ( - "fra_wikipedia_2021_10K-sentences.txt", -): - with open(path, "r", encoding="utf-8") as fichier: +for chemin in Path("corpus").iterdir(): + with open(chemin, "r", encoding="utf-8") as fichier: for phrase in fichier: antepenultieme, penultieme = "", "" for word in phrase.split():