From 8f9987fcd27d6f0bc8b2bc246e849748d8b982bd Mon Sep 17 00:00:00 2001
From: adrien
Date: Thu, 5 Feb 2026 20:15:56 +0100
Subject: [PATCH] importer tout le dossier corpus

---
 .../fra_wikipedia_2021_10K-sentences.txt | 0
 markov.py | 10 +++++-----
 2 files changed, 5 insertions(+), 5 deletions(-)
 rename fra_wikipedia_2021_10K-sentences.txt => corpus/fra_wikipedia_2021_10K-sentences.txt (100%)

diff --git a/fra_wikipedia_2021_10K-sentences.txt b/corpus/fra_wikipedia_2021_10K-sentences.txt
similarity index 100%
rename from fra_wikipedia_2021_10K-sentences.txt
rename to corpus/fra_wikipedia_2021_10K-sentences.txt
diff --git a/markov.py b/markov.py
index c90608a..8af36bd 100755
--- a/markov.py
+++ b/markov.py
@@ -1,11 +1,11 @@
 from collections import defaultdict
-from random import choice, randrange
+from pathlib import Path
+from random import choice
+
 
 suivants = defaultdict(list)
-for path in (
-    "fra_wikipedia_2021_10K-sentences.txt",
-):
-    with open(path, "r", encoding="utf-8") as fichier:
+for chemin in Path("corpus").iterdir():
+    with open(chemin, "r", encoding="utf-8") as fichier:
         for phrase in fichier:
             antepenultieme, penultieme = "", ""
             for word in phrase.split():