From 9879a7b47f1c33b48c047cd955497af247bc8ca3 Mon Sep 17 00:00:00 2001 From: Edoardo Rosa <6991986+notdodo@users.noreply.github.com> Date: Wed, 25 Sep 2024 16:29:10 +0200 Subject: [PATCH] enh: fuzz search fn --- app/erfiume/tgbot.py | 115 +++++++++++++++++++++---------------------- 1 file changed, 56 insertions(+), 59 deletions(-) diff --git a/app/erfiume/tgbot.py b/app/erfiume/tgbot.py index 11fc8b6..37fb612 100644 --- a/app/erfiume/tgbot.py +++ b/app/erfiume/tgbot.py @@ -22,6 +22,8 @@ if TYPE_CHECKING: from aws_lambda_powertools.utilities.typing import LambdaContext + from .apis import Stazione + from aws_lambda_powertools.utilities import parameters from .apis import KNOWN_STATIONS @@ -49,11 +51,6 @@ def is_from_group(update: Update) -> bool: ] -def is_from_user(update: Update) -> bool: - """Check if the update is from a real user.""" - return update.effective_user is not None - - def is_from_private_chat(update: Update) -> bool: """Check if the update is from a private chat with the bot.""" return update.effective_chat is not None and update.effective_chat.type == "private" @@ -70,6 +67,22 @@ def has_joined_group(update: Update) -> bool: return False +async def fuzz_search_station( + station_name: str, +) -> tuple[Stazione | None, str]: + """Search for a station even if the name is not exactly correct.""" + fuzzy_query = process.extractOne( + station_name, KNOWN_STATIONS, score_cutoff=FUZZ_SCORE_CUTOFF + ) + if fuzzy_query: + async with AsyncDynamoDB(table_name="Stazioni") as dynamo: + return ( + await dynamo.get_matching_station(fuzzy_query[0]), + fuzzy_query[0], + ) + return None, "" + + async def send_donation_link( update: Update, context: ContextTypes.DEFAULT_TYPE ) -> None: @@ -106,17 +119,12 @@ async def send_random_messages( # HANDLERS async def start(update: Update, _: ContextTypes.DEFAULT_TYPE | None) -> None: """Send a message when the command /start is issued.""" - if ( - is_from_user(update) - and is_from_private_chat(update) - and update.effective_user - and update.message - ): + if update.effective_user and is_from_private_chat(update) and update.message: user = update.effective_user message = rf"Ciao {user.mention_html()}! Scrivi il nome di una stazione da monitorare per iniziare (e.g. Cesena o /S. Carlo) o cercane una con /stazioni" # noqa: E501 await update.message.reply_html(message) elif ( - is_from_user(update) + update.effective_user and is_from_group(update) and update.effective_chat and update.message @@ -128,15 +136,13 @@ async def start(update: Update, _: ContextTypes.DEFAULT_TYPE | None) -> None: async def cesena(update: Update, _: ContextTypes.DEFAULT_TYPE) -> None: """Send a message when the command /cesena is issued.""" - async with AsyncDynamoDB(table_name="Stazioni") as dynamo: - stazione = await dynamo.get_matching_station("Cesena") - if stazione: - if update.message: - await update.message.reply_html(stazione.create_station_message()) - elif update.message: - await update.message.reply_html( - "Nessun stazione trovata!", - ) + station, _match = await fuzz_search_station("Cesena") + if update.message and station: + await update.message.reply_html(station.create_station_message()) + elif update.message: + await update.message.reply_html( + "Nessun stazione trovata!", + ) async def list_stations(update: Update, _: ContextTypes.DEFAULT_TYPE) -> None: @@ -165,7 +171,7 @@ async def handle_private_message( update: Update, context: ContextTypes.DEFAULT_TYPE ) -> None: """ - Handle messages written from private chat to match a specific station + Handle messages from private chat to match a specific station """ message = cleandoc( @@ -175,30 +181,27 @@ async def handle_private_message( Se non sai quale cercare prova con /stazioni""" ) if update.message and update.effective_chat and update.message.text: - async with AsyncDynamoDB(table_name="Stazioni") as dynamo: - query = update.message.text.replace("/", "").strip() - fuzzy_query = process.extractOne( - query, KNOWN_STATIONS, score_cutoff=FUZZ_SCORE_CUTOFF - ) - logger.info(query) - if fuzzy_query: - stazione = await dynamo.get_matching_station(fuzzy_query[0]) - if stazione and update.message: - message = stazione.create_station_message() - if query != fuzzy_query[0]: - message += "\nSe non è la stazione corretta prova ad affinare la ricerca." - await context.bot.send_message( - chat_id=update.effective_chat.id, - text=message, - ) - await send_random_messages(update, context) + query = update.message.text.replace("/", "").strip() + logger.info(query) + station, match = await fuzz_search_station(query) + if station: + message = station.create_station_message() + if query != match: + message += ( + "\nSe non è la stazione corretta prova ad affinare la ricerca." + ) + await context.bot.send_message( + chat_id=update.effective_chat.id, + text=message, + ) + await send_random_messages(update, context) async def handle_group_message( update: Update, context: ContextTypes.DEFAULT_TYPE ) -> None: """ - Handle messages writte from private chat to match a specific station + Handle messages from groups to match a specific station """ message = cleandoc( @@ -208,25 +211,19 @@ async def handle_group_message( Se non sai quale cercare prova con /stazioni""" ) if update.message and update.effective_chat and update.message.text: - async with AsyncDynamoDB(table_name="Stazioni") as dynamo: - query = ( - update.message.text.replace("/", "").replace("erfiume_bot", "").strip() - ) - fuzzy_query = process.extractOne( - query, KNOWN_STATIONS, score_cutoff=FUZZ_SCORE_CUTOFF - ) - logger.info(query) - if fuzzy_query: - stazione = await dynamo.get_matching_station(fuzzy_query[0]) - if stazione and update.message: - message = stazione.create_station_message() - if query != fuzzy_query[0]: - message += "\nSe non é la stazione corretta prova ad affinare la ricerca." - await context.bot.send_message( - chat_id=update.effective_chat.id, - text=message, - ) - await send_random_messages(update, context) + query = update.message.text.replace("/", "").replace("erfiume_bot", "").strip() + station, match = await fuzz_search_station(query) + if station: + message = station.create_station_message() + if query != match: + message += ( + "\nSe non é la stazione corretta prova ad affinare la ricerca." + ) + await context.bot.send_message( + chat_id=update.effective_chat.id, + text=message, + ) + await send_random_messages(update, context) # END HANDLERS