From ccba64ed353884e3d10ddf97c2a1f4b106344db6 Mon Sep 17 00:00:00 2001
From: adrien
Date: Thu, 5 Feb 2026 16:02:30 +0100
Subject: [PATCH] plusieurs sources, plusieurs phrases

---
Review notes (text between the "---" line and the diffstat is ignored by
git-am and is not part of the commit message):

- The corpus is now loaded by looping over a tuple of paths (one entry for
  now), so further source files can be added by extending the tuple.
- parle() gains a nb_phrases parameter defaulting to 1. It used to generate
  randrange(1, 4) sentences, so a bare parle() call now always produces a
  single sentence -- confirm that existing callers expect this.
- randrange is no longer used by any line visible in this hunk; check
  whether the import is still needed elsewhere in markov.py.
- NOTE(review): line breaks and indentation of this patch were reconstructed
  from a whitespace-collapsed copy (4-space indentation assumed, no hunk
  section heading assumed). Verify against the original commit before
  applying.

 markov.py | 20 +++++++++++---------
 1 file changed, 11 insertions(+), 9 deletions(-)

diff --git a/markov.py b/markov.py
index b2828da..a77ea31 100755
--- a/markov.py
+++ b/markov.py
@@ -2,17 +2,19 @@
 from collections import defaultdict
 from random import choice, randrange
 suivants = defaultdict(list)
+for path in (
+    "fra_wikipedia_2021_10K-sentences.txt",
+):
+    with open(path, "r", encoding="utf-8") as fichier:
+        for phrase in fichier:
+            antepenultieme, penultieme = "", ""
+            for word in phrase.split():
+                suivants[(antepenultieme, penultieme)].append(word)
+                antepenultieme, penultieme = penultieme, word
 
-with open("fra_wikipedia_2021_10K-sentences.txt", "r", encoding="utf-8") as fichier:
-    for phrase in fichier:
-        antepenultieme, penultieme = "", ""
-        for word in phrase.split():
-            suivants[(antepenultieme, penultieme)].append(word)
-            antepenultieme, penultieme = penultieme, word
-
-def parle():
+def parle(nb_phrases=1):
     phrases = []
-    for _ in range(randrange(1, 4)):
+    for _ in range(nb_phrases):
         antepenultieme, penultieme = "", ""
         phrase = []
         while mots_possibles := suivants[(antepenultieme, penultieme)]: