From 904a45eaa5bcafb083c417bb14fc9caa7914a909 Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Sun, 15 Oct 2023 06:53:48 -0300 Subject: [PATCH 01/11] Added a CatchAll Message Finder Signed-off-by: Guilherme Bacellar Moralez --- TEx/finder/all_messages_finder.py | 16 ++++++++ TEx/finder/finder_engine.py | 7 ++++ TEx/notifier/elastic_search_notifier.py | 50 +++++++++++++++++++++++++ 3 files changed, 73 insertions(+) create mode 100644 TEx/finder/all_messages_finder.py create mode 100644 TEx/notifier/elastic_search_notifier.py diff --git a/TEx/finder/all_messages_finder.py b/TEx/finder/all_messages_finder.py new file mode 100644 index 0000000..e96fd19 --- /dev/null +++ b/TEx/finder/all_messages_finder.py @@ -0,0 +1,16 @@ +"""All Messages Finder.""" +from configparser import SectionProxy + +from TEx.finder.base_finder import BaseFinder + + +class AllMessagesFinder(BaseFinder): + """All Messages Based Finder.""" + + def __init__(self, config: SectionProxy) -> None: + """Initialize All Messages Finder.""" + pass + + async def find(self, raw_text: str) -> bool: + """Find Message. Always Return True.""" + return True diff --git a/TEx/finder/finder_engine.py b/TEx/finder/finder_engine.py index d037115..199a49a 100644 --- a/TEx/finder/finder_engine.py +++ b/TEx/finder/finder_engine.py @@ -4,6 +4,7 @@ from telethon.events import NewMessage +from TEx.finder.all_messages_finder import AllMessagesFinder from TEx.finder.regex_finder import RegexFinder from TEx.notifier.notifier_engine import NotifierEngine @@ -34,6 +35,12 @@ def __load_rules(self, config: ConfigParser) -> None: 'instance': RegexFinder(config=config[sec]), 'notifier': config[sec]['notifier'] }) + elif config[sec]['type'] == 'all': + self.rules.append({ + 'id': sec, + 'instance': AllMessagesFinder(config=config[sec]), + 'notifier': config[sec]['notifier'] + }) def configure(self, config: ConfigParser) -> None: """Configure Finder.""" diff --git a/TEx/notifier/elastic_search_notifier.py b/TEx/notifier/elastic_search_notifier.py new file mode 100644 index 0000000..31699a7 --- /dev/null +++ b/TEx/notifier/elastic_search_notifier.py @@ -0,0 +1,50 @@ +"""Discord Notifier.""" +from configparser import SectionProxy + +from discord_webhook import DiscordEmbed, DiscordWebhook +from telethon.events import NewMessage + +from TEx.notifier.notifier_base import BaseNotifier + + +class DiscordNotifier(BaseNotifier): + """Basic Discord Notifier.""" + + def __init__(self) -> None: + """Initialize Discord Notifier.""" + super().__init__() + self.url: str = '' + + def configure(self, url: str, config: SectionProxy) -> None: + """Configure the Notifier.""" + self.url = url + self.configure_base(config=config) + + async def run(self, message: NewMessage.Event, rule_id: str) -> None: + """Run Discord Notifier.""" + # Check and Update Deduplication Control + is_duplicated, duplication_tag = self.check_is_duplicated(message=message.raw_text) + if is_duplicated: + return + + # Run the Notification Process. + webhook = DiscordWebhook( + url=self.url, + rate_limit_retry=True + ) + + embed = DiscordEmbed( + title=f'**{message.chat.title}** ({message.chat.id})', + description=message.raw_text + ) + + embed.add_embed_field(name="Rule", value=rule_id, inline=False) + embed.add_embed_field(name="Message ID", value=str(message.id), inline=False) + embed.add_embed_field(name="Group Name", value=message.chat.title, inline=True) + embed.add_embed_field(name="Group ID", value=message.chat.id, inline=True) + embed.add_embed_field(name="Message Date", value=str(message.date), inline=False) + embed.add_embed_field(name="Tag", value=duplication_tag, inline=False) + + # add embed object to webhook + webhook.add_embed(embed) + webhook.execute() From 9bbc0f7b40fca85558f998b8f4fefa5b29ded40f Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Sun, 15 Oct 2023 06:54:19 -0300 Subject: [PATCH 02/11] Added ElasticSearch Notifier Signed-off-by: Guilherme Bacellar Moralez --- TEx/notifier/elastic_search_notifier.py | 86 +++++++++++++++---------- TEx/notifier/notifier_engine.py | 9 +++ 2 files changed, 60 insertions(+), 35 deletions(-) diff --git a/TEx/notifier/elastic_search_notifier.py b/TEx/notifier/elastic_search_notifier.py index 31699a7..4229eea 100644 --- a/TEx/notifier/elastic_search_notifier.py +++ b/TEx/notifier/elastic_search_notifier.py @@ -1,50 +1,66 @@ -"""Discord Notifier.""" +"""Elastic Search Notifier.""" from configparser import SectionProxy +from typing import Dict, Optional -from discord_webhook import DiscordEmbed, DiscordWebhook +import pytz +from elasticsearch import AsyncElasticsearch from telethon.events import NewMessage +from telethon.tl.types import PeerUser from TEx.notifier.notifier_base import BaseNotifier -class DiscordNotifier(BaseNotifier): - """Basic Discord Notifier.""" +class ElasticSearchNotifier(BaseNotifier): + """Basic Elastic Search Notifier.""" def __init__(self) -> None: - """Initialize Discord Notifier.""" + """Initialize Elastic Search Notifier.""" super().__init__() self.url: str = '' + self.client: AsyncElasticsearch = None + self.index: str = '' + self.pipeline: str = '' - def configure(self, url: str, config: SectionProxy) -> None: + def configure(self, config: SectionProxy) -> None: """Configure the Notifier.""" - self.url = url - self.configure_base(config=config) + hosts_list: Optional[str] = config.get('address', fallback=None) + + self.client = AsyncElasticsearch( + hosts=hosts_list.split(',') if hosts_list else None, + api_key=config.get('api_key', fallback=None), + verify_certs=config.get('verify_ssl_cert', fallback='True') == 'True', + cloud_id=config.get('cloud_id', fallback=None) + ) + self.index = config['index_name'] + self.pipeline = config['pipeline_name'] async def run(self, message: NewMessage.Event, rule_id: str) -> None: - """Run Discord Notifier.""" - # Check and Update Deduplication Control - is_duplicated, duplication_tag = self.check_is_duplicated(message=message.raw_text) - if is_duplicated: - return - - # Run the Notification Process. - webhook = DiscordWebhook( - url=self.url, - rate_limit_retry=True - ) - - embed = DiscordEmbed( - title=f'**{message.chat.title}** ({message.chat.id})', - description=message.raw_text - ) - - embed.add_embed_field(name="Rule", value=rule_id, inline=False) - embed.add_embed_field(name="Message ID", value=str(message.id), inline=False) - embed.add_embed_field(name="Group Name", value=message.chat.title, inline=True) - embed.add_embed_field(name="Group ID", value=message.chat.id, inline=True) - embed.add_embed_field(name="Message Date", value=str(message.date), inline=False) - embed.add_embed_field(name="Tag", value=duplication_tag, inline=False) - - # add embed object to webhook - webhook.add_embed(embed) - webhook.execute() + """Run Elastic Search Notifier.""" + content: Dict = { + 'time': message.date.astimezone(tz=pytz.utc), + 'rule': rule_id, + 'raw': message.raw_text, + 'group_name': message.chat.title, + 'group_id': message.chat.id, + 'from_id': message.from_id.user_id if isinstance(message.from_id, PeerUser) else '', + 'to_id': message.to_id.channel_id if message.to_id is not None else None, + 'reply_to_msg_id': message.reply_to.reply_to_msg_id if message.is_reply else None, + 'message_id': message.id, + 'is_reply': message.is_reply, + } + + if hasattr(message, 'file') and message.file: + content['has_media'] = True + content['media_mime_type'] = message.file.mime_type if hasattr(message.file, 'mime_type') else None + content['media_size'] = message.file.size if hasattr(message.file, 'size') else None + else: + content['has_media'] = False + content['media_mime_type'] = None + content['media_size'] = None + + await self.client.index( + index=self.index, + pipeline=self.pipeline, + id=f'{message.chat.id}_{message.id}', + document=content + ) \ No newline at end of file diff --git a/TEx/notifier/notifier_engine.py b/TEx/notifier/notifier_engine.py index 8abf79d..c63fe77 100644 --- a/TEx/notifier/notifier_engine.py +++ b/TEx/notifier/notifier_engine.py @@ -5,6 +5,7 @@ from telethon.events import NewMessage from TEx.notifier.discord_notifier import DiscordNotifier +from TEx.notifier.elastic_search_notifier import ElasticSearchNotifier from TEx.notifier.notifier_base import BaseNotifier @@ -29,6 +30,14 @@ def __load_notifiers(self, config: ConfigParser) -> None: register: {'instance': notifier} }) + if 'ELASTIC_SEARCH' in register: + notifier_es: ElasticSearchNotifier = ElasticSearchNotifier() + notifier_es.configure(config=config[register]) + + self.notifiers.update({ + register: {'instance': notifier_es} + }) + def configure(self, config: ConfigParser) -> None: """Configure Finder.""" self.__load_notifiers(config) From ab09e1b1347a1f9a15ecb6cd8986545fbf515e08 Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Sun, 15 Oct 2023 06:54:41 -0300 Subject: [PATCH 03/11] Added ElasticSearch Dependency Signed-off-by: Guilherme Bacellar Moralez --- pyproject.toml | 1 + 1 file changed, 1 insertion(+) diff --git a/pyproject.toml b/pyproject.toml index 6bda8ee..42e2164 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -67,6 +67,7 @@ cachetools = ">=5.3.1,<6" toml = ">=0.10.2" tox = "^4.10.0" discord-webhook = ">=1.3.0,<2" +elasticsearch = {extras = ["async"], version = "8.10.0"} [tool.poetry.dev-dependencies] pytest = ">=7.4.0" From ffb32874171cd666d14a47615cea7e5aefa642b0 Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Sun, 15 Oct 2023 06:55:29 -0300 Subject: [PATCH 04/11] Disabling InsecureWarning Signed-off-by: Guilherme Bacellar Moralez --- TEx/runner.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/TEx/runner.py b/TEx/runner.py index 338b7f7..d77a3dc 100644 --- a/TEx/runner.py +++ b/TEx/runner.py @@ -11,6 +11,8 @@ import types from configparser import ConfigParser from typing import Dict, List, Optional +from urllib3.exceptions import InsecureRequestWarning +from urllib3 import disable_warnings import toml @@ -144,6 +146,7 @@ def __setup_logging(self) -> None: """Setups Log Config.""" logging.config.fileConfig(os.path.join(os.path.dirname(__file__), 'logging.conf')) logging.getLogger('telethon').setLevel(level=logging.WARNING) + disable_warnings(InsecureRequestWarning) def __list_modules(self) -> None: """ From befd01a5df90774eafc340263b2669c7b1fd447d Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Sun, 15 Oct 2023 06:55:50 -0300 Subject: [PATCH 05/11] Change Log Level Signed-off-by: Guilherme Bacellar Moralez --- TEx/logging.conf | 14 ++++++++++++-- 1 file changed, 12 insertions(+), 2 deletions(-) diff --git a/TEx/logging.conf b/TEx/logging.conf index bc85321..5e138b0 100644 --- a/TEx/logging.conf +++ b/TEx/logging.conf @@ -1,5 +1,5 @@ [loggers] -keys=root,sqlalchemy,TelegramExplorer +keys=root,sqlalchemy,TelegramExplorer,elasticsearch,elastic_transport.transport ####################### @@ -17,6 +17,16 @@ keys=simpleFormatter level=INFO handlers=consoleHandler +[logger_elasticsearch] +level=ERROR +handlers=consoleHandler +qualname=elasticsearch + +[logger_elastic_transport.transport] +level=ERROR +handlers=consoleHandler +qualname=elastic_transport.transport + [logger_TelegramExplorer] level=INFO handlers=consoleHandler @@ -40,4 +50,4 @@ args=(sys.stdout,) ####################### [formatter_simpleFormatter] -format=%(asctime)s - %(levelname)s - %(message)s +format= %(asctime)s - %(levelname)s - %(message)s From 76d32a94a087aee8a8193de6512f44e417f78bcc Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Sun, 15 Oct 2023 07:25:11 -0300 Subject: [PATCH 06/11] Added a Source Information on Finder and Notification Engine + Update Discord Message Template to Add a Source Information + Added Source Information on ElasticSearch Data + Updated Documentation Signed-off-by: Guilherme Bacellar Moralez --- TEx/finder/finder_engine.py | 10 ++++++++-- TEx/modules/telegram_messages_listener.py | 5 ++++- TEx/notifier/discord_notifier.py | 5 +++-- TEx/notifier/elastic_search_notifier.py | 3 ++- TEx/notifier/notifier_base.py | 2 +- TEx/notifier/notifier_engine.py | 13 ++++++++++--- docs/changelog/v030.md | 1 + tests/finder/test_finder_engine.py | 6 ++++-- tests/notifier/test_discord_notifier.py | 23 +++++++++++++---------- tests/notifier/test_notifier_engine.py | 7 ++++--- 10 files changed, 50 insertions(+), 25 deletions(-) diff --git a/TEx/finder/finder_engine.py b/TEx/finder/finder_engine.py index 8cd9e3a..c1451dc 100644 --- a/TEx/finder/finder_engine.py +++ b/TEx/finder/finder_engine.py @@ -50,8 +50,13 @@ def configure(self, config: ConfigParser) -> None: self.__load_rules(config=config) self.notification_engine.configure(config=config) - async def run(self, message: NewMessage.Event) -> None: - """Execute the Finder with Raw Text.""" + async def run(self, message: NewMessage.Event, source: str) -> None: + """Execute the Finder with Raw Text. + + :param message: Message Object + :param source: Source Account/Phone Number + :return: + """ if not self.is_finder_enabled: return @@ -65,4 +70,5 @@ async def run(self, message: NewMessage.Event) -> None: notifiers=rule['notifier'].split(','), message=message, rule_id=rule['id'], + source=source, ) diff --git a/TEx/modules/telegram_messages_listener.py b/TEx/modules/telegram_messages_listener.py index 8e76a81..93e094b 100644 --- a/TEx/modules/telegram_messages_listener.py +++ b/TEx/modules/telegram_messages_listener.py @@ -84,7 +84,10 @@ async def __handler(self, event: NewMessage.Event) -> None: values['from_type'] = None # Execute Finder - await self.finder.run(message=message) + await self.finder.run( + message=message, + source=self.target_phone_number, + ) # Add to DB TelegramMessageDatabaseManager.insert(values) diff --git a/TEx/notifier/discord_notifier.py b/TEx/notifier/discord_notifier.py index 7b9151c..bb88b31 100644 --- a/TEx/notifier/discord_notifier.py +++ b/TEx/notifier/discord_notifier.py @@ -20,7 +20,7 @@ def configure(self, url: str, config: SectionProxy) -> None: self.url = url self.configure_base(config=config) - async def run(self, message: NewMessage.Event, rule_id: str) -> None: + async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> None: """Run Discord Notifier.""" # Check and Update Deduplication Control is_duplicated, duplication_tag = self.check_is_duplicated(message=message.raw_text) @@ -38,7 +38,8 @@ async def run(self, message: NewMessage.Event, rule_id: str) -> None: description=message.raw_text, ) - embed.add_embed_field(name='Rule', value=rule_id, inline=False) + embed.add_embed_field(name='Source', value=source, inline=True) + embed.add_embed_field(name='Rule', value=rule_id, inline=True) embed.add_embed_field(name='Message ID', value=str(message.id), inline=False) embed.add_embed_field(name='Group Name', value=message.chat.title, inline=True) embed.add_embed_field(name='Group ID', value=message.chat.id, inline=True) diff --git a/TEx/notifier/elastic_search_notifier.py b/TEx/notifier/elastic_search_notifier.py index 2d40e9b..add5906 100644 --- a/TEx/notifier/elastic_search_notifier.py +++ b/TEx/notifier/elastic_search_notifier.py @@ -36,10 +36,11 @@ def configure(self, config: SectionProxy) -> None: self.index = config['index_name'] self.pipeline = config['pipeline_name'] - async def run(self, message: NewMessage.Event, rule_id: str) -> None: + async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> None: """Run Elastic Search Notifier.""" content: Dict = { 'time': message.date.astimezone(tz=pytz.utc), + 'source': source, 'rule': rule_id, 'raw': message.raw_text, 'group_name': message.chat.title, diff --git a/TEx/notifier/notifier_base.py b/TEx/notifier/notifier_base.py index 5c78786..f01bc07 100644 --- a/TEx/notifier/notifier_base.py +++ b/TEx/notifier/notifier_base.py @@ -38,5 +38,5 @@ def check_is_duplicated(self, message: str) -> Tuple[bool, str]: return False, tag @abc.abstractmethod - async def run(self, message: NewMessage.Event, rule_id: str) -> None: + async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> None: """Run the Notification Process.""" diff --git a/TEx/notifier/notifier_engine.py b/TEx/notifier/notifier_engine.py index ca3a240..5d557be 100644 --- a/TEx/notifier/notifier_engine.py +++ b/TEx/notifier/notifier_engine.py @@ -44,12 +44,19 @@ def configure(self, config: ConfigParser) -> None: """Configure Finder.""" self.__load_notifiers(config) - async def run(self, notifiers: List[str], message: NewMessage.Event, rule_id: str) -> None: - """Dispatch all Notifications.""" + async def run(self, notifiers: List[str], message: NewMessage.Event, rule_id: str, source: str) -> None: + """Dispatch all Notifications. + + :param notifiers: + :param message: Message Object + :param rule_id: Triggered Rule ID + :param source: Source Account/Phone Number + :return: + """ if len(notifiers) == 0: return for dispatcher_name in notifiers: target_notifier: BaseNotifier = self.notifiers[dispatcher_name]['instance'] - await target_notifier.run(message=message, rule_id=rule_id) + await target_notifier.run(message=message, rule_id=rule_id, source=source) diff --git a/docs/changelog/v030.md b/docs/changelog/v030.md index 8e2b8b8..43cb47f 100644 --- a/docs/changelog/v030.md +++ b/docs/changelog/v030.md @@ -3,6 +3,7 @@ **🚀 Features** - Proxy (HTTP, SOCKS4, SOCKS5) support ([#26](https://github.com/guibacellar/TEx/issues/26)) +- Discord Notifications now have a source information with account/phone number **🐛 Bug Fixes** diff --git a/tests/finder/test_finder_engine.py b/tests/finder/test_finder_engine.py index a007ce4..39f9e3f 100644 --- a/tests/finder/test_finder_engine.py +++ b/tests/finder/test_finder_engine.py @@ -46,7 +46,8 @@ def test_run_with_regex_finder(self): # Invoke Test Target target.run( - message=target_message + message=target_message, + source='+15558987453' ) ) @@ -54,5 +55,6 @@ def test_run_with_regex_finder(self): target.notification_engine.run.assert_awaited_once_with( notifiers=['NOTIFIER.DISCORD.NOT_002'], message=target_message, - rule_id='FINDER.RULE.UT_Finder_Demo' + rule_id='FINDER.RULE.UT_Finder_Demo', + source='+15558987453' ) diff --git a/tests/notifier/test_discord_notifier.py b/tests/notifier/test_discord_notifier.py index cb6717e..806bc9c 100644 --- a/tests/notifier/test_discord_notifier.py +++ b/tests/notifier/test_discord_notifier.py @@ -49,7 +49,8 @@ def test_run_no_duplication(self): # Invoke Test Target target.run( message=target_message, - rule_id='RULE_UT_01' + rule_id='RULE_UT_01', + source='+15558987453' ) ) @@ -60,13 +61,13 @@ def test_run_no_duplication(self): self.assertEqual(call_arg.title, '**Channel 1972142108** (1972142108)') self.assertEqual(call_arg.description, 'Mocked Raw Text') - self.assertEqual(len(call_arg.fields), 6) - self.assertEqual(call_arg.fields[0], {'inline': False, 'name': 'Rule', 'value': 'RULE_UT_01'}) - self.assertEqual(call_arg.fields[1], {'inline': False, 'name': 'Message ID', 'value': '5975883'}) - self.assertEqual(call_arg.fields[2], {'inline': True, 'name': 'Group Name', 'value': 'Channel 1972142108'}) - self.assertEqual(call_arg.fields[3], {'inline': True, 'name': 'Group ID', 'value': 1972142108}) - self.assertEqual(call_arg.fields[5], - {'inline': False, 'name': 'Tag', 'value': 'de33f5dda9c686c64d23b8aec2eebfc7'}) + self.assertEqual(len(call_arg.fields), 7) + self.assertEqual(call_arg.fields[0], {'inline': True, 'name': 'Source', 'value': '+15558987453'}) + self.assertEqual(call_arg.fields[1], {'inline': True, 'name': 'Rule', 'value': 'RULE_UT_01'}) + self.assertEqual(call_arg.fields[2], {'inline': False, 'name': 'Message ID', 'value': '5975883'}) + self.assertEqual(call_arg.fields[3], {'inline': True, 'name': 'Group Name', 'value': 'Channel 1972142108'}) + self.assertEqual(call_arg.fields[4], {'inline': True, 'name': 'Group ID', 'value': 1972142108}) + self.assertEqual(call_arg.fields[6], {'inline': False, 'name': 'Tag', 'value': 'de33f5dda9c686c64d23b8aec2eebfc7'}) # Check if Webhook was Executed discord_webhook_mock.execute.assert_called_once() @@ -104,7 +105,8 @@ def test_run_duplication_control(self): # Invoke Test Target target.run( message=target_message, - rule_id='RULE_UT_01' + rule_id='RULE_UT_01', + source='+15558987453' ) ) @@ -113,7 +115,8 @@ def test_run_duplication_control(self): # Invoke Test Target Again target.run( message=target_message, - rule_id='RULE_UT_01' + rule_id='RULE_UT_01', + source='+15558987453' ) ) diff --git a/tests/notifier/test_notifier_engine.py b/tests/notifier/test_notifier_engine.py index 562c391..4da79cf 100644 --- a/tests/notifier/test_notifier_engine.py +++ b/tests/notifier/test_notifier_engine.py @@ -44,11 +44,12 @@ def test_run(self): target.run( notifiers=['NOTIFIER.DISCORD.NOT_001', 'NOTIFIER.DISCORD.NOT_002'], message=base_messages_mockup_data[0], - rule_id='RULE_UT_01' + rule_id='RULE_UT_01', + source='+15558987453' ) ) discord_notifier_mockup.run.assert_has_awaits([ - call(message=base_messages_mockup_data[0], rule_id='RULE_UT_01'), - call(message=base_messages_mockup_data[0], rule_id='RULE_UT_01'), + call(message=base_messages_mockup_data[0], rule_id='RULE_UT_01', source='+15558987453'), + call(message=base_messages_mockup_data[0], rule_id='RULE_UT_01', source='+15558987453'), ]) From 783084a420050ebf5b9ab3a8e96028455f9857f5 Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Tue, 17 Oct 2023 17:43:45 -0300 Subject: [PATCH 07/11] Added unittests for All Messages Finder module Signed-off-by: Guilherme Bacellar Moralez --- TEx/notifier/elastic_search_notifier.py | 2 +- tests/finder/test_all_messages_finder.py | 28 ++++++++ .../notifier/test_elastic_search_notifier.py | 69 +++++++++++++++++++ tests/unittest_configfile.config | 7 ++ 4 files changed, 105 insertions(+), 1 deletion(-) create mode 100644 tests/finder/test_all_messages_finder.py create mode 100644 tests/notifier/test_elastic_search_notifier.py diff --git a/TEx/notifier/elastic_search_notifier.py b/TEx/notifier/elastic_search_notifier.py index add5906..8d6e64e 100644 --- a/TEx/notifier/elastic_search_notifier.py +++ b/TEx/notifier/elastic_search_notifier.py @@ -47,7 +47,7 @@ async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> Non 'group_id': message.chat.id, 'from_id': message.from_id.user_id if isinstance(message.from_id, PeerUser) else '', 'to_id': message.to_id.channel_id if message.to_id is not None else None, - 'reply_to_msg_id': message.reply_to.reply_to_msg_id if message.is_reply else None, + 'reply_to_msg_id': message.reply_to.reply_to_msg_id if message.is_reply and message.reply_to else None, 'message_id': message.id, 'is_reply': message.is_reply, } diff --git a/tests/finder/test_all_messages_finder.py b/tests/finder/test_all_messages_finder.py new file mode 100644 index 0000000..a4b6b8a --- /dev/null +++ b/tests/finder/test_all_messages_finder.py @@ -0,0 +1,28 @@ +import asyncio +import unittest +from configparser import ConfigParser + +from TEx.finder.all_messages_finder import AllMessagesFinder + + +class AllMessagesFinderTest(unittest.TestCase): + + def setUp(self) -> None: + self.config = ConfigParser() + self.config.read('../../config.ini') + + def test_find_true(self): + """Test the always true return.""" + + target: AllMessagesFinder = AllMessagesFinder(config=self.config) + + loop = asyncio.get_event_loop() + tasks = target.find(raw_text='foo'), target.find(raw_text=None) + + h_result_content, h_result_none = loop.run_until_complete( + asyncio.gather(*tasks) + ) + + self.assertTrue(h_result_content) + self.assertTrue(h_result_none) + diff --git a/tests/notifier/test_elastic_search_notifier.py b/tests/notifier/test_elastic_search_notifier.py new file mode 100644 index 0000000..915e3c5 --- /dev/null +++ b/tests/notifier/test_elastic_search_notifier.py @@ -0,0 +1,69 @@ +import asyncio +import datetime +import unittest +from configparser import ConfigParser +from typing import Dict +from unittest import mock + +from telethon.tl.types import Message, MessageFwdHeader, PeerChannel, PeerUser + +from TEx.notifier.discord_notifier import DiscordNotifier +from TEx.notifier.elastic_search_notifier import ElasticSearchNotifier +from tests.modules.common import TestsCommon +from tests.modules.mockups_groups_mockup_data import base_groups_mockup_data, base_messages_mockup_data, \ + channel_1_mocked + + +class ElasticSearchNotifierTest(unittest.TestCase): + + def setUp(self) -> None: + self.config = ConfigParser() + self.config.read('../../config.ini') + + def test_run_without_file(self): + """Test Run Method Without Message File Attachment.""" + + # Setup Mock + elastic_search_api_mock = mock.AsyncMock() + elastic_search_api_mock.index = mock.AsyncMock() + + target: ElasticSearchNotifier = ElasticSearchNotifier() + args: Dict = { + 'config': 'unittest_configfile.config' + } + data: Dict = {} + TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) + + # Set Mock Message + origin_mock_message = base_messages_mockup_data[1] + mocked_message = mock.MagicMock(spec=origin_mock_message) + for attr_name in origin_mock_message.__dict__: + setattr(mocked_message, attr_name, getattr(origin_mock_message, attr_name)) + mocked_message.chat = channel_1_mocked + + with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', return_value=elastic_search_api_mock): + # Execute Discord Notifier Configure Method + target.configure( + config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] + ) + + loop = asyncio.get_event_loop() + loop.run_until_complete( + + # Invoke Test Target + target.run( + message=mocked_message, + rule_id='RULE_UT_01', + source='+15558987453' + ) + ) + + # Check .index call + elastic_search_api_mock.index.assert_called_once() + call_arg = elastic_search_api_mock.index.call_args[1] + + self.assertEqual(call_arg['index'], 'test_index_name') + self.assertEqual(call_arg['pipeline'], 'test_pipeline_name') + self.assertEqual(call_arg['id'], '1972142108_183017') + + submited_document = call_arg['document'] diff --git a/tests/unittest_configfile.config b/tests/unittest_configfile.config index 818edb5..10b63bd 100644 --- a/tests/unittest_configfile.config +++ b/tests/unittest_configfile.config @@ -28,3 +28,10 @@ prevent_duplication_for_minutes=240 [NOTIFIER.DISCORD.NOT_002] webhook=https://uri.domain.com/webhook/002 prevent_duplication_for_minutes=240 + +[NOTIFIER.ELASTIC_SEARCH.UT_01] +address=https://localhost:666 +api_key=test_api_key +verify_ssl_cert=False +index_name=test_index_name +pipeline_name=test_pipeline_name From a5e1539559c01f7f4a475c78de62f3dfe48ed4a6 Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Wed, 18 Oct 2023 14:25:50 -0300 Subject: [PATCH 08/11] Internal Refactory to Introduce Facade Objects for Notification and Finder Modules (Reduce Overall Code and Tests Complexity, Allow Future Modules as Easy Way, and, Reduce Mental Overload for Core Review) + Included Pydantic deps + Fix some invalid Telethon Message Object Type Hint + Fix Unittest Signed-off-by: Guilherme Bacellar Moralez --- TEx/core/mapper/telethon_message_mapper.py | 64 ++++++++ .../do_nothing_media_downloader.py | 2 +- .../photo_media_downloader.py | 2 +- .../std_media_downloader.py | 2 +- TEx/core/media_handler.py | 12 +- .../do_nothing_media_handler.py | 2 +- .../generic_binary_handler.py | 5 +- .../media_metadata_handling/geo_handler.py | 5 +- .../media_metadata_handling/mp4_handler.py | 5 +- .../media_metadata_handling/pdf_handler.py | 8 +- .../media_metadata_handling/photo_handler.py | 5 +- .../sticker_handler.py | 9 +- .../media_metadata_handling/text_handler.py | 5 +- .../webimage_handler.py | 16 +- TEx/core/state_file.py | 2 +- TEx/core/temp_file.py | 6 +- TEx/database/telegram_group_database.py | 8 +- TEx/finder/finder_engine.py | 15 +- TEx/models/database/telegram_db_model.py | 2 +- TEx/models/database/temp_db_models.py | 2 +- .../finder_notification_facade_entity.py | 26 ++++ .../facade/media_handler_facade_entity.py | 12 ++ .../telegram_group_report_facade_entity.py | 11 +- .../telegram_message_report_facade_entity.py | 6 +- TEx/modules/telegram_messages_listener.py | 16 +- TEx/modules/telegram_messages_scrapper.py | 6 +- .../telegram_html_report_generator.py | 6 +- TEx/notifier/discord_notifier.py | 18 +-- TEx/notifier/elastic_search_notifier.py | 38 ++--- TEx/notifier/notifier_base.py | 5 +- TEx/notifier/notifier_engine.py | 7 +- mypy.ini | 8 +- pyproject.toml | 1 + tests/finder/test_finder_engine.py | 20 ++- tests/modules/mockups_groups_mockup_data.py | 2 +- .../test_telegram_messages_listener.py | 1 + tests/notifier/test_discord_notifier.py | 43 ++++-- .../notifier/test_elastic_search_notifier.py | 146 +++++++++--------- tests/notifier/test_notifier_engine.py | 50 ++++-- 39 files changed, 400 insertions(+), 199 deletions(-) create mode 100644 TEx/core/mapper/telethon_message_mapper.py create mode 100644 TEx/models/facade/finder_notification_facade_entity.py create mode 100644 TEx/models/facade/media_handler_facade_entity.py diff --git a/TEx/core/mapper/telethon_message_mapper.py b/TEx/core/mapper/telethon_message_mapper.py new file mode 100644 index 0000000..9c37e79 --- /dev/null +++ b/TEx/core/mapper/telethon_message_mapper.py @@ -0,0 +1,64 @@ +"""Telethon Event Entity Mapper.""" +from __future__ import annotations + +from typing import Optional, Union + +from pydantic import BaseModel +from telethon.tl.patched import Message +from telethon.tl.types import Channel, Chat, PeerUser, User + +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity +from TEx.models.facade.media_handler_facade_entity import MediaHandlingEntity + + +class TelethonMessageEntityMapper: + """Telethon Event Entity Mapper.""" + + class ChatPropsModel(BaseModel): + """Model for __map_chat_props method.""" + + chat_id: int + chat_title: str + + @staticmethod + async def to_finder_notification_facade_entity(message: Message, downloaded_media_info: Optional[MediaHandlingEntity]) -> \ + Optional[FinderNotificationMessageEntity]: + """Map Telethon Event to FinderNotificationMessageEntity.""" + if not message: + return None + + mapped_chat_props: TelethonMessageEntityMapper.ChatPropsModel = TelethonMessageEntityMapper.__map_chat_props( + entity=await message.get_chat(), + ) + + h_result: FinderNotificationMessageEntity = FinderNotificationMessageEntity( + date_time=message.date, + raw_text=message.raw_text, + group_name=mapped_chat_props.chat_title, + group_id=mapped_chat_props.chat_id, + from_id=message.from_id.user_id if isinstance(message.from_id, PeerUser) else None, + to_id=message.to_id.channel_id if message.to_id is not None else None, + reply_to_msg_id=message.reply_to.reply_to_msg_id if message.is_reply and message.reply_to else None, + message_id=message.id, + is_reply=message.is_reply, + downloaded_media_info=downloaded_media_info, + ) + + return h_result + + @staticmethod + def __map_chat_props(entity: Union[Channel, User, Chat]) -> TelethonMessageEntityMapper.ChatPropsModel: + """Map Chat Specific Props.""" + if isinstance(entity, (Channel, Chat)): + return TelethonMessageEntityMapper.ChatPropsModel( + chat_id=entity.id, + chat_title=entity.title if entity.title else '', + ) + + if isinstance(entity, User): + return TelethonMessageEntityMapper.ChatPropsModel( + chat_id=entity.id, + chat_title=entity.username if entity.username else (entity.phone if entity.phone else ''), + ) + + raise AttributeError(entity, 'Invalid entity type') diff --git a/TEx/core/media_download_handling/do_nothing_media_downloader.py b/TEx/core/media_download_handling/do_nothing_media_downloader.py index 6e2e86e..ac847ab 100644 --- a/TEx/core/media_download_handling/do_nothing_media_downloader.py +++ b/TEx/core/media_download_handling/do_nothing_media_downloader.py @@ -3,7 +3,7 @@ from typing import Dict -from telethon.tl.types import Message +from telethon.tl.patched import Message class DoNothingMediaDownloader: diff --git a/TEx/core/media_download_handling/photo_media_downloader.py b/TEx/core/media_download_handling/photo_media_downloader.py index 6a2761b..705c175 100644 --- a/TEx/core/media_download_handling/photo_media_downloader.py +++ b/TEx/core/media_download_handling/photo_media_downloader.py @@ -4,7 +4,7 @@ import os from typing import Dict -from telethon.tl.types import Message +from telethon.tl.patched import Message class PhotoMediaDownloader: diff --git a/TEx/core/media_download_handling/std_media_downloader.py b/TEx/core/media_download_handling/std_media_downloader.py index f34fbda..ad170b9 100644 --- a/TEx/core/media_download_handling/std_media_downloader.py +++ b/TEx/core/media_download_handling/std_media_downloader.py @@ -4,7 +4,7 @@ import os from typing import Dict, List -from telethon.tl.types import Message +from telethon.tl.patched import Message class StandardMediaDownloader: diff --git a/TEx/core/media_handler.py b/TEx/core/media_handler.py index 882898a..8fd0cb7 100644 --- a/TEx/core/media_handler.py +++ b/TEx/core/media_handler.py @@ -21,6 +21,7 @@ from TEx.core.media_metadata_handling.text_handler import TextPlainHandler from TEx.core.media_metadata_handling.webimage_handler import WebImageStickerHandler from TEx.database.telegram_group_database import TelegramMediaDatabaseManager +from TEx.models.facade.media_handler_facade_entity import MediaHandlingEntity logger = logging.getLogger('TelegramExplorer') @@ -77,7 +78,7 @@ class UniversalTelegramMediaHandler: }, } - async def handle_medias(self, message: Message, group_id: int, data_path: str) -> Optional[int]: + async def handle_medias(self, message: Message, group_id: int, data_path: str) -> Optional[MediaHandlingEntity]: """Handle Message Media, Photo, File, etc.""" executor_id: Optional[str] = self.__resolve_executor_id(message=message) @@ -124,7 +125,14 @@ async def handle_medias(self, message: Message, group_id: int, data_path: str) - # Update Reference into DB if media_metadata is not None: media_metadata['group_id'] = group_id - return TelegramMediaDatabaseManager.insert(entity_values=media_metadata) + media_id: int = TelegramMediaDatabaseManager.insert(entity_values=media_metadata) + + return MediaHandlingEntity( + media_id=media_id, + file_name=media_metadata['file_name'], + content_type=media_metadata['mime_type'], + size_bytes=media_metadata['size_bytes'], + ) return None diff --git a/TEx/core/media_metadata_handling/do_nothing_media_handler.py b/TEx/core/media_metadata_handling/do_nothing_media_handler.py index c10353b..5eab805 100644 --- a/TEx/core/media_metadata_handling/do_nothing_media_handler.py +++ b/TEx/core/media_metadata_handling/do_nothing_media_handler.py @@ -3,7 +3,7 @@ from typing import Dict, Optional -from telethon.tl.types import Message +from telethon.tl.patched import Message class DoNothingHandler: diff --git a/TEx/core/media_metadata_handling/generic_binary_handler.py b/TEx/core/media_metadata_handling/generic_binary_handler.py index 649fb9f..154ac14 100644 --- a/TEx/core/media_metadata_handling/generic_binary_handler.py +++ b/TEx/core/media_metadata_handling/generic_binary_handler.py @@ -3,7 +3,8 @@ from typing import Dict, List, Optional -from telethon.tl.types import DocumentAttributeFilename, Message, MessageMediaDocument +from telethon.tl.patched import Message +from telethon.tl.types import DocumentAttributeFilename, MessageMediaDocument class GenericBinaryMediaHandler: @@ -26,4 +27,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/geo_handler.py b/TEx/core/media_metadata_handling/geo_handler.py index 9d4164c..538e9db 100644 --- a/TEx/core/media_metadata_handling/geo_handler.py +++ b/TEx/core/media_metadata_handling/geo_handler.py @@ -3,7 +3,8 @@ from typing import Dict, Optional -from telethon.tl.types import Message, MessageMediaGeo +from telethon.tl.patched import Message +from telethon.tl.types import MessageMediaGeo class GeoMediaHandler: @@ -28,4 +29,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': None, 'title': f'{geo.lat}|{geo.long}', 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/mp4_handler.py b/TEx/core/media_metadata_handling/mp4_handler.py index c0eade6..1a30236 100644 --- a/TEx/core/media_metadata_handling/mp4_handler.py +++ b/TEx/core/media_metadata_handling/mp4_handler.py @@ -3,7 +3,8 @@ from typing import Dict, List, Optional -from telethon.tl.types import DocumentAttributeFilename, DocumentAttributeVideo, Message, MessageMediaDocument +from telethon.tl.patched import Message +from telethon.tl.types import DocumentAttributeFilename, DocumentAttributeVideo, MessageMediaDocument class MediaMp4Handler: @@ -27,4 +28,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/pdf_handler.py b/TEx/core/media_metadata_handling/pdf_handler.py index 7767c02..f9d970f 100644 --- a/TEx/core/media_metadata_handling/pdf_handler.py +++ b/TEx/core/media_metadata_handling/pdf_handler.py @@ -3,7 +3,8 @@ from typing import Dict, Optional -from telethon.tl.types import DocumentAttributeFilename, Message, MessageMediaPhoto +from telethon.tl.patched import Message +from telethon.tl.types import DocumentAttributeFilename, MessageMediaPhoto class PdfMediaHandler: @@ -15,7 +16,8 @@ def handle_metadata(message: Message) -> Optional[Dict]: media: MessageMediaPhoto = message.media return { - 'file_name': [item for item in media.document.attributes if isinstance(item, DocumentAttributeFilename)][0].file_name, + 'file_name': [item for item in media.document.attributes if isinstance(item, DocumentAttributeFilename)][ + 0].file_name, 'telegram_id': media.document.id, 'extension': None, 'height': None, @@ -25,4 +27,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/photo_handler.py b/TEx/core/media_metadata_handling/photo_handler.py index a34f422..50f0482 100644 --- a/TEx/core/media_metadata_handling/photo_handler.py +++ b/TEx/core/media_metadata_handling/photo_handler.py @@ -3,7 +3,8 @@ from typing import Dict, Optional -from telethon.tl.types import Message, MessageMediaPhoto +from telethon.tl.patched import Message +from telethon.tl.types import MessageMediaPhoto class PhotoMediaHandler: @@ -25,4 +26,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': message.file.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/sticker_handler.py b/TEx/core/media_metadata_handling/sticker_handler.py index 2b20be0..8cc39ee 100644 --- a/TEx/core/media_metadata_handling/sticker_handler.py +++ b/TEx/core/media_metadata_handling/sticker_handler.py @@ -3,7 +3,8 @@ from typing import Dict, List, Optional -from telethon.tl.types import DocumentAttributeFilename, DocumentAttributeImageSize, Message, MessageMediaDocument +from telethon.tl.patched import Message +from telethon.tl.types import DocumentAttributeFilename, DocumentAttributeImageSize, MessageMediaDocument class MediaStickerHandler: @@ -16,7 +17,9 @@ def handle_metadata(message: Message) -> Optional[Dict]: fn_attr_img: List = [item for item in media.document.attributes if isinstance(item, DocumentAttributeImageSize)] return { - 'file_name': [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeFilename)][0].file_name, + 'file_name': + [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeFilename)][ + 0].file_name, 'telegram_id': media.document.id, 'extension': None, 'height': fn_attr_img[0].h if len(fn_attr_img) > 0 else None, @@ -26,4 +29,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/text_handler.py b/TEx/core/media_metadata_handling/text_handler.py index 103c193..3297097 100644 --- a/TEx/core/media_metadata_handling/text_handler.py +++ b/TEx/core/media_metadata_handling/text_handler.py @@ -3,7 +3,8 @@ from typing import Dict, Optional -from telethon.tl.types import DocumentAttributeFilename, Message, MessageMediaDocument +from telethon.tl.patched import Message +from telethon.tl.types import DocumentAttributeFilename, MessageMediaDocument class TextPlainHandler: @@ -26,4 +27,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/webimage_handler.py b/TEx/core/media_metadata_handling/webimage_handler.py index 3166063..48e38b6 100644 --- a/TEx/core/media_metadata_handling/webimage_handler.py +++ b/TEx/core/media_metadata_handling/webimage_handler.py @@ -3,7 +3,8 @@ from typing import Dict, List, Optional -from telethon.tl.types import DocumentAttributeFilename, DocumentAttributeImageSize, Message, MessageMediaDocument +from telethon.tl.patched import Message +from telethon.tl.types import DocumentAttributeFilename, DocumentAttributeImageSize, MessageMediaDocument class WebImageStickerHandler: @@ -14,7 +15,8 @@ def handle_metadata(message: Message) -> Optional[Dict]: """Handle Media Metadata.""" media: MessageMediaDocument = message.media - fn_attr: List = [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeFilename)] + fn_attr: List = [item for item in message.media.document.attributes if + isinstance(item, DocumentAttributeFilename)] if not fn_attr or len(fn_attr) == 0: return None @@ -23,11 +25,15 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'file_name': fn_attr[0].file_name, 'telegram_id': media.document.id, 'extension': None, - 'height': [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][0].h, - 'width': [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][0].w, + 'height': + [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][ + 0].h, + 'width': + [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][ + 0].w, 'date_time': media.document.date, 'mime_type': media.document.mime_type, 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/state_file.py b/TEx/core/state_file.py index 3a8300c..55c018f 100644 --- a/TEx/core/state_file.py +++ b/TEx/core/state_file.py @@ -42,7 +42,7 @@ def write_file_text(path: str, content: str) -> None: """ # Delete if Exists DbManager.SESSIONS['temp'].execute( - StateFileOrmEntity.__table__.delete().where(StateFileOrmEntity.path == path), + StateFileOrmEntity.__table__.delete().where(StateFileOrmEntity.path == path), # type: ignore ) entity: StateFileOrmEntity = StateFileOrmEntity( diff --git a/TEx/core/temp_file.py b/TEx/core/temp_file.py index a11dd44..afd511b 100644 --- a/TEx/core/temp_file.py +++ b/TEx/core/temp_file.py @@ -35,7 +35,7 @@ def read_file_text(path: str) -> str: def remove_expired_entries() -> int: """Remove all Expired Entries.""" total: int = DbManager.SESSIONS['temp'].execute( - TempDataOrmEntity.__table__.delete().where( + TempDataOrmEntity.__table__.delete().where( # type: ignore TempDataOrmEntity.valid_at <= int(datetime.now(tz=pytz.UTC).timestamp()), ), ).rowcount @@ -47,7 +47,7 @@ def remove_expired_entries() -> int: @staticmethod def purge() -> int: """Remove all Entries.""" - total: int = DbManager.SESSIONS['temp'].execute(TempDataOrmEntity.__table__.delete()).rowcount + total: int = DbManager.SESSIONS['temp'].execute(TempDataOrmEntity.__table__.delete()).rowcount # type: ignore DbManager.SESSIONS['temp'].flush() DbManager.SESSIONS['temp'].commit() return total @@ -64,7 +64,7 @@ def write_file_text(path: str, content: str, validate_seconds: int = 3600) -> No """ # Delete if Exists DbManager.SESSIONS['temp'].execute( - TempDataOrmEntity.__table__.delete().where(TempDataOrmEntity.path == path), + TempDataOrmEntity.__table__.delete().where(TempDataOrmEntity.path == path), # type: ignore ) entity: TempDataOrmEntity = TempDataOrmEntity( diff --git a/TEx/database/telegram_group_database.py b/TEx/database/telegram_group_database.py index a2b037d..893ef96 100644 --- a/TEx/database/telegram_group_database.py +++ b/TEx/database/telegram_group_database.py @@ -104,7 +104,7 @@ def insert(entity_values: Dict) -> None: DbManager.SESSIONS['data'].commit() except sqlalchemy.exc.IntegrityError as exc: - if 'UNIQUE' in exc.orig.args[0]: + if 'UNIQUE' in exc.orig.args[0]: # type: ignore return raise @@ -294,11 +294,11 @@ def get_all_medias_from_group_and_mimetype(group_id: int, mime_type: str, file_d parts_or_filter: List[BinaryExpression] = [] for name_part in file_name_part: - parts_or_filter.append(TelegramMediaOrmEntity.file_name.contains(name_part)) + parts_or_filter.append(TelegramMediaOrmEntity.file_name.contains(name_part)) # type: ignore select_statement = select_statement.where(or_(*parts_or_filter)) - return DbManager.SESSIONS['data'].execute(select_statement) + return DbManager.SESSIONS['data'].execute(select_statement) # type: ignore @staticmethod def stats_all_medias_from_group_by_mimetype(group_id: int, file_datetime_limit_seconds: Optional[int] = None) -> Dict: @@ -346,7 +346,7 @@ def get_all_medias_by_age(group_id: int, media_limit_days: int) -> List[Telegram :param media_limit_days: Age of Media in Days :return: Number of Medias Removed """ - statement: Delete = select(TelegramMediaOrmEntity).where( + statement: Delete = select(TelegramMediaOrmEntity).where( # type: ignore TelegramMediaOrmEntity.date_time <= (datetime.datetime.now(tz=pytz.UTC) - datetime.timedelta(days=media_limit_days)), ) diff --git a/TEx/finder/finder_engine.py b/TEx/finder/finder_engine.py index c1451dc..48321d3 100644 --- a/TEx/finder/finder_engine.py +++ b/TEx/finder/finder_engine.py @@ -2,12 +2,11 @@ from __future__ import annotations from configparser import ConfigParser -from typing import Dict, List - -from telethon.events import NewMessage +from typing import Dict, List, Optional from TEx.finder.all_messages_finder import AllMessagesFinder from TEx.finder.regex_finder import RegexFinder +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity from TEx.notifier.notifier_engine import NotifierEngine @@ -50,25 +49,25 @@ def configure(self, config: ConfigParser) -> None: self.__load_rules(config=config) self.notification_engine.configure(config=config) - async def run(self, message: NewMessage.Event, source: str) -> None: + async def run(self, entity: Optional[FinderNotificationMessageEntity], source: str) -> None: """Execute the Finder with Raw Text. - :param message: Message Object + :param entity: Facade Object :param source: Source Account/Phone Number :return: """ - if not self.is_finder_enabled: + if not self.is_finder_enabled or not entity: return for rule in self.rules: - is_found: bool = await rule['instance'].find(raw_text=message.raw_text) + is_found: bool = await rule['instance'].find(raw_text=entity.raw_text) if is_found: # Runt the Notification Engine await self.notification_engine.run( notifiers=rule['notifier'].split(','), - message=message, + entity=entity, rule_id=rule['id'], source=source, ) diff --git a/TEx/models/database/telegram_db_model.py b/TEx/models/database/telegram_db_model.py index 7ace47c..82756d8 100644 --- a/TEx/models/database/telegram_db_model.py +++ b/TEx/models/database/telegram_db_model.py @@ -8,7 +8,7 @@ from sqlalchemy.orm import DeclarativeBase, Mapped, mapped_column -class TelegramDataBaseDeclarativeBase(DeclarativeBase): # type: ignore +class TelegramDataBaseDeclarativeBase(DeclarativeBase): """Global Telegram DB Declarative Base.""" diff --git a/TEx/models/database/temp_db_models.py b/TEx/models/database/temp_db_models.py index 27a49ad..46bf4e0 100644 --- a/TEx/models/database/temp_db_models.py +++ b/TEx/models/database/temp_db_models.py @@ -7,7 +7,7 @@ from sqlalchemy.orm import DeclarativeBase, Mapped, mapped_column -class TempDataBaseDeclarativeBase(DeclarativeBase): # type: ignore +class TempDataBaseDeclarativeBase(DeclarativeBase): """Global Temporary Declarative Base.""" diff --git a/TEx/models/facade/finder_notification_facade_entity.py b/TEx/models/facade/finder_notification_facade_entity.py new file mode 100644 index 0000000..82c43d1 --- /dev/null +++ b/TEx/models/facade/finder_notification_facade_entity.py @@ -0,0 +1,26 @@ +"""Facade Entities for Finder e Notification Engine Modules.""" +from __future__ import annotations + +from datetime import datetime +from typing import Optional + +from pydantic import BaseModel, ConfigDict + +from TEx.models.facade.media_handler_facade_entity import MediaHandlingEntity + + +class FinderNotificationMessageEntity(BaseModel): + """Facade Entity for Finder and Notification.""" + + model_config = ConfigDict(extra='forbid') + + date_time: datetime + raw_text: str + group_name: Optional[str] + group_id: int + from_id: Optional[int] + to_id: Optional[int] + reply_to_msg_id: Optional[int] + message_id: int + is_reply: bool + downloaded_media_info: Optional[MediaHandlingEntity] diff --git a/TEx/models/facade/media_handler_facade_entity.py b/TEx/models/facade/media_handler_facade_entity.py new file mode 100644 index 0000000..231b133 --- /dev/null +++ b/TEx/models/facade/media_handler_facade_entity.py @@ -0,0 +1,12 @@ +"""Facade Entities for Media Handling.""" + +from pydantic import BaseModel + + +class MediaHandlingEntity(BaseModel): + """Facade Entities for Media Handling.""" + + media_id: int + file_name: str + content_type: str + size_bytes: int diff --git a/TEx/models/facade/telegram_group_report_facade_entity.py b/TEx/models/facade/telegram_group_report_facade_entity.py index 5fa8741..f81890d 100644 --- a/TEx/models/facade/telegram_group_report_facade_entity.py +++ b/TEx/models/facade/telegram_group_report_facade_entity.py @@ -1,4 +1,7 @@ """Facade Entity for Report Generation.""" +from __future__ import annotations + +from typing import Optional from TEx.models.database.telegram_db_model import TelegramGroupOrmEntity @@ -19,11 +22,11 @@ class TelegramGroupReportFacadeEntity: scam: bool verified: bool - participants_count: int + participants_count: Optional[int] - photo_id: int - photo_base64: str - photo_name: str + photo_id: Optional[int] + photo_base64: Optional[str] + photo_name: Optional[str] source: str diff --git a/TEx/models/facade/telegram_message_report_facade_entity.py b/TEx/models/facade/telegram_message_report_facade_entity.py index 3eafa40..a6090b3 100644 --- a/TEx/models/facade/telegram_message_report_facade_entity.py +++ b/TEx/models/facade/telegram_message_report_facade_entity.py @@ -18,9 +18,9 @@ class TelegramMessageReportFacadeEntity: message: str raw: str - from_id: int - from_type: str - to_id: int + from_id: Optional[int] + from_type: Optional[str] + to_id: Optional[int] meta_next: bool meta_previous: bool diff --git a/TEx/modules/telegram_messages_listener.py b/TEx/modules/telegram_messages_listener.py index 93e094b..1512bec 100644 --- a/TEx/modules/telegram_messages_listener.py +++ b/TEx/modules/telegram_messages_listener.py @@ -3,19 +3,22 @@ import logging from configparser import ConfigParser -from typing import Dict, List, cast +from typing import Dict, List, Optional, cast import pytz from telethon import TelegramClient, events from telethon.events import NewMessage -from telethon.tl.types import Channel, Message, PeerUser, User +from telethon.tl.patched import Message +from telethon.tl.types import Channel, PeerUser, User from TEx.core.base_module import BaseModule from TEx.core.mapper.telethon_channel_mapper import TelethonChannelEntityMapper +from TEx.core.mapper.telethon_message_mapper import TelethonMessageEntityMapper from TEx.core.mapper.telethon_user_mapper import TelethonUserEntiyMapper from TEx.core.media_handler import UniversalTelegramMediaHandler from TEx.database.telegram_group_database import TelegramGroupDatabaseManager, TelegramMessageDatabaseManager, TelegramUserDatabaseManager from TEx.finder.finder_engine import FinderEngine +from TEx.models.facade.media_handler_facade_entity import MediaHandlingEntity logger = logging.getLogger('TelegramExplorer') @@ -57,6 +60,7 @@ async def __handler(self, event: NewMessage.Event) -> None: await self.__ensure_group_exists(event=event) # Create Dict with All Value + downloaded_media: Optional[MediaHandlingEntity] = await self.media_handler.handle_medias(message, event.chat.id, self.data_path) if self.download_media else None values: Dict = { 'id': message.id, 'group_id': event.chat.id, @@ -64,10 +68,10 @@ async def __handler(self, event: NewMessage.Event) -> None: 'message': message.message, 'raw': message.raw_text, 'to_id': message.to_id.channel_id if message.to_id is not None else None, - 'media_id': await self.media_handler.handle_medias(message, event.chat.id, self.data_path) if self.download_media else None, + 'media_id': downloaded_media.media_id if downloaded_media else None, 'is_reply': message.is_reply, 'reply_to_msg_id': message.reply_to.reply_to_msg_id if message.is_reply else None, - } + } # Process Sender ID if message.from_id is not None: @@ -85,7 +89,7 @@ async def __handler(self, event: NewMessage.Event) -> None: # Execute Finder await self.finder.run( - message=message, + await TelethonMessageEntityMapper.to_finder_notification_facade_entity(message=message, downloaded_media_info=downloaded_media), source=self.target_phone_number, ) @@ -134,7 +138,7 @@ async def __ensure_group_exists(self, event: NewMessage.Event) -> None: group_dict_data: Dict = TelethonChannelEntityMapper.to_database_dict( entity=result, target_phone_numer=self.target_phone_number, - ) + ) TelegramGroupDatabaseManager.insert_or_update(group_dict_data) diff --git a/TEx/modules/telegram_messages_scrapper.py b/TEx/modules/telegram_messages_scrapper.py index 912862e..cd5decc 100644 --- a/TEx/modules/telegram_messages_scrapper.py +++ b/TEx/modules/telegram_messages_scrapper.py @@ -15,6 +15,7 @@ from TEx.core.media_handler import UniversalTelegramMediaHandler from TEx.database.telegram_group_database import TelegramGroupDatabaseManager, TelegramMessageDatabaseManager from TEx.models.database.telegram_db_model import TelegramGroupOrmEntity +from TEx.models.facade.media_handler_facade_entity import MediaHandlingEntity logger = logging.getLogger('TelegramExplorer') @@ -115,6 +116,7 @@ async def __download_messages(self, group_id: int, group_name: str, client: Tele if message.reply_to_msg_id: pass + downloaded_media: Optional[MediaHandlingEntity] = await self.media_handler.handle_medias(message, group_id, data_path) if download_media else None values: Dict = { 'id': message.id, 'group_id': group_id, @@ -122,8 +124,8 @@ async def __download_messages(self, group_id: int, group_name: str, client: Tele 'message': message.message, 'raw': message.raw_text, 'to_id': message.to_id.channel_id if message.to_id is not None else None, - 'media_id': await self.media_handler.handle_medias(message, group_id, data_path) if download_media else None, - } + 'media_id': downloaded_media.media_id if downloaded_media else None, + } if message.from_id is not None: if isinstance(message.from_id, PeerUser): diff --git a/TEx/modules/telegram_report_generator/telegram_html_report_generator.py b/TEx/modules/telegram_report_generator/telegram_html_report_generator.py index 2b79af0..0a21305 100644 --- a/TEx/modules/telegram_report_generator/telegram_html_report_generator.py +++ b/TEx/modules/telegram_report_generator/telegram_html_report_generator.py @@ -220,7 +220,7 @@ async def process_messages(self, reppeating_messages_signatures.append(message_hash) # Get the From Message User - from_user: Optional[TelegramUserOrmEntity] = self.get_user(message.from_id) + from_user: Optional[TelegramUserOrmEntity] = self.get_user(message.from_id) if message.from_id else None # Check if Append the Message on Previous Message OR Creates a New One is_user_bot: bool = from_user is not None and not from_user.is_bot @@ -269,7 +269,7 @@ async def get_media(self, message: TelegramMessageReportFacadeEntity, assets_roo ) if media: - if media.mime_type == 'application/vnd.geo': + if media.mime_type == 'application/vnd.geo' and media.title: media_geo = media.title.replace('|', ',') else: @@ -305,7 +305,7 @@ async def get_media(self, message: TelegramMessageReportFacadeEntity, assets_roo def render_to_from_message_info(self, message: TelegramMessageReportFacadeEntity, from_user: Optional[TelegramUserOrmEntity]) -> str: """Build and Return the TO/FROM Information for Message.""" # Get Users - to_user: Optional[TelegramUserOrmEntity] = self.get_user(message.to_id) + to_user: Optional[TelegramUserOrmEntity] = self.get_user(message.to_id) if message.to_id else None to_from_information: str = '' if from_user: diff --git a/TEx/notifier/discord_notifier.py b/TEx/notifier/discord_notifier.py index bb88b31..6a0b179 100644 --- a/TEx/notifier/discord_notifier.py +++ b/TEx/notifier/discord_notifier.py @@ -2,8 +2,8 @@ from configparser import SectionProxy from discord_webhook import DiscordEmbed, DiscordWebhook -from telethon.events import NewMessage +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity from TEx.notifier.notifier_base import BaseNotifier @@ -20,10 +20,10 @@ def configure(self, url: str, config: SectionProxy) -> None: self.url = url self.configure_base(config=config) - async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> None: + async def run(self, entity: FinderNotificationMessageEntity, rule_id: str, source: str) -> None: """Run Discord Notifier.""" # Check and Update Deduplication Control - is_duplicated, duplication_tag = self.check_is_duplicated(message=message.raw_text) + is_duplicated, duplication_tag = self.check_is_duplicated(message=entity.raw_text) if is_duplicated: return @@ -34,16 +34,16 @@ async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> Non ) embed = DiscordEmbed( - title=f'**{message.chat.title}** ({message.chat.id})', - description=message.raw_text, + title=f'**{entity.group_name}** ({entity.group_id})', + description=entity.raw_text, ) embed.add_embed_field(name='Source', value=source, inline=True) embed.add_embed_field(name='Rule', value=rule_id, inline=True) - embed.add_embed_field(name='Message ID', value=str(message.id), inline=False) - embed.add_embed_field(name='Group Name', value=message.chat.title, inline=True) - embed.add_embed_field(name='Group ID', value=message.chat.id, inline=True) - embed.add_embed_field(name='Message Date', value=str(message.date), inline=False) + embed.add_embed_field(name='Message ID', value=str(entity.message_id), inline=False) + embed.add_embed_field(name='Group Name', value=entity.group_name if entity.group_name else '', inline=True) + embed.add_embed_field(name='Group ID', value=str(entity.group_id), inline=True) + embed.add_embed_field(name='Message Date', value=str(entity.date_time), inline=False) embed.add_embed_field(name='Tag', value=duplication_tag, inline=False) # add embed object to webhook diff --git a/TEx/notifier/elastic_search_notifier.py b/TEx/notifier/elastic_search_notifier.py index 8d6e64e..c53d7fb 100644 --- a/TEx/notifier/elastic_search_notifier.py +++ b/TEx/notifier/elastic_search_notifier.py @@ -6,9 +6,8 @@ import pytz from elasticsearch import AsyncElasticsearch -from telethon.events import NewMessage -from telethon.tl.types import PeerUser +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity from TEx.notifier.notifier_base import BaseNotifier @@ -19,7 +18,7 @@ def __init__(self) -> None: """Initialize Elastic Search Notifier.""" super().__init__() self.url: str = '' - self.client: AsyncElasticsearch = None + self.client: Optional[AsyncElasticsearch] = None self.index: str = '' self.pipeline: str = '' @@ -28,7 +27,7 @@ def configure(self, config: SectionProxy) -> None: hosts_list: Optional[str] = config.get('address', fallback=None) self.client = AsyncElasticsearch( - hosts=hosts_list.split(',') if hosts_list else None, + hosts=hosts_list.split(',') if hosts_list else None, # type: ignore api_key=config.get('api_key', fallback=None), verify_certs=config.get('verify_ssl_cert', fallback='True') == 'True', cloud_id=config.get('cloud_id', fallback=None), @@ -36,26 +35,29 @@ def configure(self, config: SectionProxy) -> None: self.index = config['index_name'] self.pipeline = config['pipeline_name'] - async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> None: + async def run(self, entity: FinderNotificationMessageEntity, rule_id: str, source: str) -> None: """Run Elastic Search Notifier.""" + if not self.client: + return + content: Dict = { - 'time': message.date.astimezone(tz=pytz.utc), + 'time': entity.date_time.astimezone(tz=pytz.utc), 'source': source, 'rule': rule_id, - 'raw': message.raw_text, - 'group_name': message.chat.title, - 'group_id': message.chat.id, - 'from_id': message.from_id.user_id if isinstance(message.from_id, PeerUser) else '', - 'to_id': message.to_id.channel_id if message.to_id is not None else None, - 'reply_to_msg_id': message.reply_to.reply_to_msg_id if message.is_reply and message.reply_to else None, - 'message_id': message.id, - 'is_reply': message.is_reply, + 'raw': entity.raw_text, + 'group_name': entity.group_name, + 'group_id': entity.group_id, + 'from_id': entity.from_id, + 'to_id': entity.to_id, + 'reply_to_msg_id': entity.reply_to_msg_id, + 'message_id': entity.message_id, + 'is_reply': entity.is_reply, } - if hasattr(message, 'file') and message.file: + if entity.downloaded_media_info: content['has_media'] = True - content['media_mime_type'] = message.file.mime_type if hasattr(message.file, 'mime_type') else None - content['media_size'] = message.file.size if hasattr(message.file, 'size') else None + content['media_mime_type'] = entity.downloaded_media_info.content_type + content['media_size'] = entity.downloaded_media_info.size_bytes else: content['has_media'] = False content['media_mime_type'] = None @@ -64,6 +66,6 @@ async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> Non await self.client.index( index=self.index, pipeline=self.pipeline, - id=f'{message.chat.id}_{message.id}', + id=f'{str(entity.group_id)}_{str(entity.message_id)}', document=content, ) diff --git a/TEx/notifier/notifier_base.py b/TEx/notifier/notifier_base.py index f01bc07..f557e11 100644 --- a/TEx/notifier/notifier_base.py +++ b/TEx/notifier/notifier_base.py @@ -7,7 +7,8 @@ from typing import Optional, Tuple from cachetools import TTLCache -from telethon.events import NewMessage + +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity class BaseNotifier: @@ -38,5 +39,5 @@ def check_is_duplicated(self, message: str) -> Tuple[bool, str]: return False, tag @abc.abstractmethod - async def run(self, message: NewMessage.Event, rule_id: str, source: str) -> None: + async def run(self, entity: FinderNotificationMessageEntity, rule_id: str, source: str) -> None: """Run the Notification Process.""" diff --git a/TEx/notifier/notifier_engine.py b/TEx/notifier/notifier_engine.py index 5d557be..f4308bd 100644 --- a/TEx/notifier/notifier_engine.py +++ b/TEx/notifier/notifier_engine.py @@ -4,8 +4,7 @@ from configparser import ConfigParser from typing import Dict, List -from telethon.events import NewMessage - +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity from TEx.notifier.discord_notifier import DiscordNotifier from TEx.notifier.elastic_search_notifier import ElasticSearchNotifier from TEx.notifier.notifier_base import BaseNotifier @@ -44,7 +43,7 @@ def configure(self, config: ConfigParser) -> None: """Configure Finder.""" self.__load_notifiers(config) - async def run(self, notifiers: List[str], message: NewMessage.Event, rule_id: str, source: str) -> None: + async def run(self, notifiers: List[str], entity: FinderNotificationMessageEntity, rule_id: str, source: str) -> None: """Dispatch all Notifications. :param notifiers: @@ -59,4 +58,4 @@ async def run(self, notifiers: List[str], message: NewMessage.Event, rule_id: st for dispatcher_name in notifiers: target_notifier: BaseNotifier = self.notifiers[dispatcher_name]['instance'] - await target_notifier.run(message=message, rule_id=rule_id, source=source) + await target_notifier.run(entity=entity, rule_id=rule_id, source=source) diff --git a/mypy.ini b/mypy.ini index 366e6ef..e40e72d 100644 --- a/mypy.ini +++ b/mypy.ini @@ -1,5 +1,5 @@ [mypy] -plugins = sqlalchemy.ext.mypy.plugin +plugins = sqlalchemy.ext.mypy.plugin, pydantic.mypy ignore_missing_imports = True @@ -24,7 +24,11 @@ warn_unreachable = True namespace_packages = True -follow_imports = skip +follow_imports = normal files = TEx/**/*.py +[pydantic-mypy] +init_forbid_extra = True +init_typed = True +warn_required_dynamic_aliases = True diff --git a/pyproject.toml b/pyproject.toml index 66c090c..a68c134 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -72,6 +72,7 @@ types-aiofiles = "23.2.0.0" python-socks = "2.4.3" async-timeout = "4.0.3" elasticsearch = {extras = ["async"], version = "8.10.0"} +pydantic = "2.4.2" [tool.poetry.dev-dependencies] pytest = ">=7.4.0" diff --git a/tests/finder/test_finder_engine.py b/tests/finder/test_finder_engine.py index 39f9e3f..273f5ee 100644 --- a/tests/finder/test_finder_engine.py +++ b/tests/finder/test_finder_engine.py @@ -6,7 +6,9 @@ from unittest import mock from unittest.mock import ANY, call +from TEx.core.mapper.telethon_message_mapper import TelethonMessageEntityMapper from TEx.finder.finder_engine import FinderEngine +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity from tests.modules.common import TestsCommon from tests.modules.mockups_groups_mockup_data import channel_1_mocked @@ -23,8 +25,18 @@ def test_run_with_regex_finder(self): # Setup Mock notifier_engine_mock = mock.AsyncMock() - target_message = mock.MagicMock() - target_message.raw_text = "Mocked term3 Raw Text" + message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( + date_time=datetime.datetime.utcnow(), + raw_text="Mocked term3 Raw Text", + group_name="Group 001", + group_id=123456, + from_id="1234", + to_id=9876, + reply_to_msg_id=5544, + message_id=969696, + is_reply=False, + downloaded_media_info=None, + ) args: Dict = { 'config': 'unittest_configfile.config' @@ -46,7 +58,7 @@ def test_run_with_regex_finder(self): # Invoke Test Target target.run( - message=target_message, + entity=message_entity, source='+15558987453' ) ) @@ -54,7 +66,7 @@ def test_run_with_regex_finder(self): # Check if Webhook was Executed target.notification_engine.run.assert_awaited_once_with( notifiers=['NOTIFIER.DISCORD.NOT_002'], - message=target_message, + entity=message_entity, rule_id='FINDER.RULE.UT_Finder_Demo', source='+15558987453' ) diff --git a/tests/modules/mockups_groups_mockup_data.py b/tests/modules/mockups_groups_mockup_data.py index d69b408..36066a9 100644 --- a/tests/modules/mockups_groups_mockup_data.py +++ b/tests/modules/mockups_groups_mockup_data.py @@ -4,7 +4,6 @@ from telethon.tl.types import Chat, Channel, ChatBannedRights, ChatForbidden, ChatPhoto, Document, DocumentAttributeFilename, \ DocumentAttributeImageSize, DocumentAttributeSticker, DocumentAttributeVideo, InputStickerSetID, \ KeyboardButtonCallback, KeyboardButtonRow, \ - Message, \ MessageEntityBold, MessageEntityBotCommand, MessageEntityCode, MessageEntityMention, MessageEntityMentionName, \ MessageEntityUrl, \ MessageFwdHeader, \ @@ -12,6 +11,7 @@ MessageMediaPhoto, MessageMediaWebPage, MessageReplies, MessageReplyHeader, PeerChannel, \ PeerUser, Photo, PhotoPathSize, PhotoSize, PhotoStrippedSize, ReplyInlineMarkup, RestrictionReason, User, \ UserProfilePhoto, UserStatusOffline, UserStatusRecently, WebPage +from telethon.tl.patched import Message from telethon.tl.types.messages import Dialogs b64_group_pic_image = '' diff --git a/tests/modules/test_telegram_messages_listener.py b/tests/modules/test_telegram_messages_listener.py index 2e02863..6249de7 100644 --- a/tests/modules/test_telegram_messages_listener.py +++ b/tests/modules/test_telegram_messages_listener.py @@ -113,6 +113,7 @@ async def async_generator_side_effect(items): mocked_event = mock.AsyncMock() mocked_event.chat = mocked_channel mocked_event.get_chat = mock.AsyncMock(return_value=mocked_channel) + message.get_chat = mock.AsyncMock(return_value=mocked_channel) if message.from_id: mocked_event.from_id = mock.MagicMock() diff --git a/tests/notifier/test_discord_notifier.py b/tests/notifier/test_discord_notifier.py index 806bc9c..f9f95a3 100644 --- a/tests/notifier/test_discord_notifier.py +++ b/tests/notifier/test_discord_notifier.py @@ -5,6 +5,7 @@ from typing import Dict from unittest import mock +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity from TEx.notifier.discord_notifier import DiscordNotifier from tests.modules.common import TestsCommon from tests.modules.mockups_groups_mockup_data import channel_1_mocked @@ -23,11 +24,18 @@ def test_run_no_duplication(self): discord_webhook_mock = mock.AsyncMock() discord_webhook_mock.add_embed = mock.MagicMock() - target_message = mock.MagicMock() - target_message.raw_text = "Mocked Raw Text" - target_message.id = 5975883 - target_message.data = datetime.datetime(2023, 10, 1, 9, 58, 22) - target_message.chat = channel_1_mocked + message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( + date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), + raw_text="Mocked Raw Text", + group_name="Channel 1972142108", + group_id=1972142108, + from_id="1234", + to_id=9876, + reply_to_msg_id=5544, + message_id=5975883, + is_reply=False, + downloaded_media_info=None, + ) target: DiscordNotifier = DiscordNotifier() args: Dict = { @@ -48,7 +56,7 @@ def test_run_no_duplication(self): # Invoke Test Target target.run( - message=target_message, + entity=message_entity, rule_id='RULE_UT_01', source='+15558987453' ) @@ -66,7 +74,7 @@ def test_run_no_duplication(self): self.assertEqual(call_arg.fields[1], {'inline': True, 'name': 'Rule', 'value': 'RULE_UT_01'}) self.assertEqual(call_arg.fields[2], {'inline': False, 'name': 'Message ID', 'value': '5975883'}) self.assertEqual(call_arg.fields[3], {'inline': True, 'name': 'Group Name', 'value': 'Channel 1972142108'}) - self.assertEqual(call_arg.fields[4], {'inline': True, 'name': 'Group ID', 'value': 1972142108}) + self.assertEqual(call_arg.fields[4], {'inline': True, 'name': 'Group ID', 'value': '1972142108'}) self.assertEqual(call_arg.fields[6], {'inline': False, 'name': 'Tag', 'value': 'de33f5dda9c686c64d23b8aec2eebfc7'}) # Check if Webhook was Executed @@ -79,11 +87,18 @@ def test_run_duplication_control(self): discord_webhook_mock = mock.AsyncMock() discord_webhook_mock.add_embed = mock.MagicMock() - target_message = mock.MagicMock() - target_message.raw_text = "Mocked Raw Text 2" - target_message.id = 5975883 - target_message.data = datetime.datetime(2023, 10, 1, 9, 58, 22) - target_message.chat = channel_1_mocked + message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( + date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), + raw_text="Mocked Raw Text 2", + group_name="Channel 1972142108", + group_id=1972142108, + from_id="1234", + to_id=9876, + reply_to_msg_id=5544, + message_id=5975883, + is_reply=False, + downloaded_media_info=None, + ) target: DiscordNotifier = DiscordNotifier() args: Dict = { @@ -104,7 +119,7 @@ def test_run_duplication_control(self): # Invoke Test Target target.run( - message=target_message, + entity=message_entity, rule_id='RULE_UT_01', source='+15558987453' ) @@ -114,7 +129,7 @@ def test_run_duplication_control(self): # Invoke Test Target Again target.run( - message=target_message, + entity=message_entity, rule_id='RULE_UT_01', source='+15558987453' ) diff --git a/tests/notifier/test_elastic_search_notifier.py b/tests/notifier/test_elastic_search_notifier.py index 915e3c5..50bcf24 100644 --- a/tests/notifier/test_elastic_search_notifier.py +++ b/tests/notifier/test_elastic_search_notifier.py @@ -1,69 +1,77 @@ -import asyncio -import datetime -import unittest -from configparser import ConfigParser -from typing import Dict -from unittest import mock - -from telethon.tl.types import Message, MessageFwdHeader, PeerChannel, PeerUser - -from TEx.notifier.discord_notifier import DiscordNotifier -from TEx.notifier.elastic_search_notifier import ElasticSearchNotifier -from tests.modules.common import TestsCommon -from tests.modules.mockups_groups_mockup_data import base_groups_mockup_data, base_messages_mockup_data, \ - channel_1_mocked - - -class ElasticSearchNotifierTest(unittest.TestCase): - - def setUp(self) -> None: - self.config = ConfigParser() - self.config.read('../../config.ini') - - def test_run_without_file(self): - """Test Run Method Without Message File Attachment.""" - - # Setup Mock - elastic_search_api_mock = mock.AsyncMock() - elastic_search_api_mock.index = mock.AsyncMock() - - target: ElasticSearchNotifier = ElasticSearchNotifier() - args: Dict = { - 'config': 'unittest_configfile.config' - } - data: Dict = {} - TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) - - # Set Mock Message - origin_mock_message = base_messages_mockup_data[1] - mocked_message = mock.MagicMock(spec=origin_mock_message) - for attr_name in origin_mock_message.__dict__: - setattr(mocked_message, attr_name, getattr(origin_mock_message, attr_name)) - mocked_message.chat = channel_1_mocked - - with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', return_value=elastic_search_api_mock): - # Execute Discord Notifier Configure Method - target.configure( - config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] - ) - - loop = asyncio.get_event_loop() - loop.run_until_complete( - - # Invoke Test Target - target.run( - message=mocked_message, - rule_id='RULE_UT_01', - source='+15558987453' - ) - ) - - # Check .index call - elastic_search_api_mock.index.assert_called_once() - call_arg = elastic_search_api_mock.index.call_args[1] - - self.assertEqual(call_arg['index'], 'test_index_name') - self.assertEqual(call_arg['pipeline'], 'test_pipeline_name') - self.assertEqual(call_arg['id'], '1972142108_183017') - - submited_document = call_arg['document'] +# import asyncio +# import datetime +# import unittest +# from configparser import ConfigParser +# from typing import Dict +# from unittest import mock +# +# from telethon.tl.types import Message, MessageFwdHeader, PeerChannel, PeerUser +# +# from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity +# from TEx.notifier.discord_notifier import DiscordNotifier +# from TEx.notifier.elastic_search_notifier import ElasticSearchNotifier +# from tests.modules.common import TestsCommon +# from tests.modules.mockups_groups_mockup_data import base_groups_mockup_data, base_messages_mockup_data, \ +# channel_1_mocked +# +# +# class ElasticSearchNotifierTest(unittest.TestCase): +# +# def setUp(self) -> None: +# self.config = ConfigParser() +# self.config.read('../../config.ini') +# +# def test_run_without_file(self): +# """Test Run Method Without Message File Attachment.""" +# +# # Setup Mock +# elastic_search_api_mock = mock.AsyncMock() +# elastic_search_api_mock.index = mock.AsyncMock() +# +# target: ElasticSearchNotifier = ElasticSearchNotifier() +# args: Dict = { +# 'config': 'unittest_configfile.config' +# } +# data: Dict = {} +# TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) +# +# # Set Message +# message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( +# date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), +# raw_text="Mocked Raw Text", +# group_name="Channel 1972142108", +# group_id=1972142108, +# from_id="1234", +# to_id=9876, +# reply_to_msg_id=5544, +# message_id=5975883, +# is_reply=False, +# downloaded_media_info=None, +# ) +# +# with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', return_value=elastic_search_api_mock): +# # Execute Discord Notifier Configure Method +# target.configure( +# config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] +# ) +# +# loop = asyncio.get_event_loop() +# loop.run_until_complete( +# +# # Invoke Test Target +# target.run( +# message=mocked_message, +# rule_id='RULE_UT_01', +# source='+15558987453' +# ) +# ) +# +# # Check .index call +# elastic_search_api_mock.index.assert_called_once() +# call_arg = elastic_search_api_mock.index.call_args[1] +# +# self.assertEqual(call_arg['index'], 'test_index_name') +# self.assertEqual(call_arg['pipeline'], 'test_pipeline_name') +# self.assertEqual(call_arg['id'], '1972142108_183017') +# +# submited_document = call_arg['document'] diff --git a/tests/notifier/test_notifier_engine.py b/tests/notifier/test_notifier_engine.py index 4da79cf..81549fc 100644 --- a/tests/notifier/test_notifier_engine.py +++ b/tests/notifier/test_notifier_engine.py @@ -1,10 +1,12 @@ import asyncio import unittest from configparser import ConfigParser +from datetime import datetime from typing import Dict from unittest import mock from unittest.mock import call +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity from TEx.notifier.notifier_engine import NotifierEngine from tests.modules.common import TestsCommon from tests.modules.mockups_groups_mockup_data import base_messages_mockup_data @@ -23,6 +25,9 @@ def test_run(self): discord_notifier_mockup = mock.AsyncMock() discord_notifier_mockup.run = mock.AsyncMock() + elastic_notifier_mockup = mock.AsyncMock() + elastic_notifier_mockup.run = mock.AsyncMock() + target: NotifierEngine = NotifierEngine() args: Dict = { 'export_text': True, @@ -37,19 +42,38 @@ def test_run(self): data: Dict = {} TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) + # Set Message + message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( + date_time=datetime(2023, 10, 1, 9, 58, 22), + raw_text="Mocked Raw Text", + group_name="Channel 1972142108", + group_id=1972142108, + from_id="1234", + to_id=9876, + reply_to_msg_id=5544, + message_id=55, + is_reply=False, + downloaded_media_info=None, + ) + with mock.patch('TEx.notifier.notifier_engine.DiscordNotifier', return_value=discord_notifier_mockup): - target.configure(config=self.config) - loop = asyncio.get_event_loop() - loop.run_until_complete( - target.run( - notifiers=['NOTIFIER.DISCORD.NOT_001', 'NOTIFIER.DISCORD.NOT_002'], - message=base_messages_mockup_data[0], - rule_id='RULE_UT_01', - source='+15558987453' + with mock.patch('TEx.notifier.notifier_engine.ElasticSearchNotifier', return_value=elastic_notifier_mockup): + target.configure(config=self.config) + loop = asyncio.get_event_loop() + loop.run_until_complete( + target.run( + notifiers=['NOTIFIER.DISCORD.NOT_001', 'NOTIFIER.DISCORD.NOT_002', 'NOTIFIER.ELASTIC_SEARCH.UT_01'], + entity=message_entity, + rule_id='RULE_UT_01', + source='+15558987453' + ) ) - ) - discord_notifier_mockup.run.assert_has_awaits([ - call(message=base_messages_mockup_data[0], rule_id='RULE_UT_01', source='+15558987453'), - call(message=base_messages_mockup_data[0], rule_id='RULE_UT_01', source='+15558987453'), - ]) + discord_notifier_mockup.run.assert_has_awaits([ + call(entity=message_entity, rule_id='RULE_UT_01', source='+15558987453'), + call(entity=message_entity, rule_id='RULE_UT_01', source='+15558987453') + ]) + + elastic_notifier_mockup.run.assert_has_awaits([ + call(entity=message_entity, rule_id='RULE_UT_01', source='+15558987453') + ]) From 2ee8ee86fc843d5e074178fae999f71b01346e95 Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Fri, 20 Oct 2023 08:26:23 -0300 Subject: [PATCH 09/11] Added Unittests for Elastic Search Connector Signed-off-by: Guilherme Bacellar Moralez --- .../media_metadata_handling/geo_handler.py | 2 +- .../media_metadata_handling/mp4_handler.py | 2 +- .../media_metadata_handling/pdf_handler.py | 5 +- .../media_metadata_handling/photo_handler.py | 2 +- .../sticker_handler.py | 6 +- .../media_metadata_handling/text_handler.py | 2 +- .../webimage_handler.py | 13 +- .../notifier/test_elastic_search_notifier.py | 311 +++++++++++++----- 8 files changed, 246 insertions(+), 97 deletions(-) diff --git a/TEx/core/media_metadata_handling/geo_handler.py b/TEx/core/media_metadata_handling/geo_handler.py index 538e9db..1b3e59a 100644 --- a/TEx/core/media_metadata_handling/geo_handler.py +++ b/TEx/core/media_metadata_handling/geo_handler.py @@ -29,4 +29,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': None, 'title': f'{geo.lat}|{geo.long}', 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/mp4_handler.py b/TEx/core/media_metadata_handling/mp4_handler.py index 1a30236..ea23371 100644 --- a/TEx/core/media_metadata_handling/mp4_handler.py +++ b/TEx/core/media_metadata_handling/mp4_handler.py @@ -28,4 +28,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/pdf_handler.py b/TEx/core/media_metadata_handling/pdf_handler.py index f9d970f..efd1afb 100644 --- a/TEx/core/media_metadata_handling/pdf_handler.py +++ b/TEx/core/media_metadata_handling/pdf_handler.py @@ -16,8 +16,7 @@ def handle_metadata(message: Message) -> Optional[Dict]: media: MessageMediaPhoto = message.media return { - 'file_name': [item for item in media.document.attributes if isinstance(item, DocumentAttributeFilename)][ - 0].file_name, + 'file_name': [item for item in media.document.attributes if isinstance(item, DocumentAttributeFilename)][0].file_name, 'telegram_id': media.document.id, 'extension': None, 'height': None, @@ -27,4 +26,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/photo_handler.py b/TEx/core/media_metadata_handling/photo_handler.py index 50f0482..4dfe0cc 100644 --- a/TEx/core/media_metadata_handling/photo_handler.py +++ b/TEx/core/media_metadata_handling/photo_handler.py @@ -26,4 +26,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': message.file.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/sticker_handler.py b/TEx/core/media_metadata_handling/sticker_handler.py index 8cc39ee..cdf98ca 100644 --- a/TEx/core/media_metadata_handling/sticker_handler.py +++ b/TEx/core/media_metadata_handling/sticker_handler.py @@ -17,9 +17,7 @@ def handle_metadata(message: Message) -> Optional[Dict]: fn_attr_img: List = [item for item in media.document.attributes if isinstance(item, DocumentAttributeImageSize)] return { - 'file_name': - [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeFilename)][ - 0].file_name, + 'file_name': [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeFilename)][0].file_name, 'telegram_id': media.document.id, 'extension': None, 'height': fn_attr_img[0].h if len(fn_attr_img) > 0 else None, @@ -29,4 +27,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/text_handler.py b/TEx/core/media_metadata_handling/text_handler.py index 3297097..0f0a2ed 100644 --- a/TEx/core/media_metadata_handling/text_handler.py +++ b/TEx/core/media_metadata_handling/text_handler.py @@ -27,4 +27,4 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/TEx/core/media_metadata_handling/webimage_handler.py b/TEx/core/media_metadata_handling/webimage_handler.py index 48e38b6..07c9e05 100644 --- a/TEx/core/media_metadata_handling/webimage_handler.py +++ b/TEx/core/media_metadata_handling/webimage_handler.py @@ -15,8 +15,7 @@ def handle_metadata(message: Message) -> Optional[Dict]: """Handle Media Metadata.""" media: MessageMediaDocument = message.media - fn_attr: List = [item for item in message.media.document.attributes if - isinstance(item, DocumentAttributeFilename)] + fn_attr: List = [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeFilename)] if not fn_attr or len(fn_attr) == 0: return None @@ -25,15 +24,11 @@ def handle_metadata(message: Message) -> Optional[Dict]: 'file_name': fn_attr[0].file_name, 'telegram_id': media.document.id, 'extension': None, - 'height': - [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][ - 0].h, - 'width': - [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][ - 0].w, + 'height': [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][0].h, + 'width': [item for item in message.media.document.attributes if isinstance(item, DocumentAttributeImageSize)][0].w, 'date_time': media.document.date, 'mime_type': media.document.mime_type, 'size_bytes': media.document.size, 'title': None, 'name': None, - } + } diff --git a/tests/notifier/test_elastic_search_notifier.py b/tests/notifier/test_elastic_search_notifier.py index 50bcf24..6c9e8a0 100644 --- a/tests/notifier/test_elastic_search_notifier.py +++ b/tests/notifier/test_elastic_search_notifier.py @@ -1,77 +1,234 @@ -# import asyncio -# import datetime -# import unittest -# from configparser import ConfigParser -# from typing import Dict -# from unittest import mock -# -# from telethon.tl.types import Message, MessageFwdHeader, PeerChannel, PeerUser -# -# from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity -# from TEx.notifier.discord_notifier import DiscordNotifier -# from TEx.notifier.elastic_search_notifier import ElasticSearchNotifier -# from tests.modules.common import TestsCommon -# from tests.modules.mockups_groups_mockup_data import base_groups_mockup_data, base_messages_mockup_data, \ -# channel_1_mocked -# -# -# class ElasticSearchNotifierTest(unittest.TestCase): -# -# def setUp(self) -> None: -# self.config = ConfigParser() -# self.config.read('../../config.ini') -# -# def test_run_without_file(self): -# """Test Run Method Without Message File Attachment.""" -# -# # Setup Mock -# elastic_search_api_mock = mock.AsyncMock() -# elastic_search_api_mock.index = mock.AsyncMock() -# -# target: ElasticSearchNotifier = ElasticSearchNotifier() -# args: Dict = { -# 'config': 'unittest_configfile.config' -# } -# data: Dict = {} -# TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) -# -# # Set Message -# message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( -# date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), -# raw_text="Mocked Raw Text", -# group_name="Channel 1972142108", -# group_id=1972142108, -# from_id="1234", -# to_id=9876, -# reply_to_msg_id=5544, -# message_id=5975883, -# is_reply=False, -# downloaded_media_info=None, -# ) -# -# with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', return_value=elastic_search_api_mock): -# # Execute Discord Notifier Configure Method -# target.configure( -# config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] -# ) -# -# loop = asyncio.get_event_loop() -# loop.run_until_complete( -# -# # Invoke Test Target -# target.run( -# message=mocked_message, -# rule_id='RULE_UT_01', -# source='+15558987453' -# ) -# ) -# -# # Check .index call -# elastic_search_api_mock.index.assert_called_once() -# call_arg = elastic_search_api_mock.index.call_args[1] -# -# self.assertEqual(call_arg['index'], 'test_index_name') -# self.assertEqual(call_arg['pipeline'], 'test_pipeline_name') -# self.assertEqual(call_arg['id'], '1972142108_183017') -# -# submited_document = call_arg['document'] +import asyncio +import datetime +import unittest +from configparser import ConfigParser +from typing import Dict +from unittest import mock + +import pytz + +from TEx.models.facade.finder_notification_facade_entity import FinderNotificationMessageEntity +from TEx.models.facade.media_handler_facade_entity import MediaHandlingEntity +from TEx.notifier.elastic_search_notifier import ElasticSearchNotifier +from tests.modules.common import TestsCommon + + +class ElasticSearchNotifierTest(unittest.TestCase): + + def setUp(self) -> None: + self.config = ConfigParser() + self.config.read('../../config.ini') + + def test_configure_with_hosts(self): + """Test configure method with hosts.""" + # Setup Mock + elastic_search_api_mock = mock.MagicMock() + + target: ElasticSearchNotifier = ElasticSearchNotifier() + args: Dict = { + 'config': 'unittest_configfile.config' + } + data: Dict = {} + TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) + + # Change Config Map + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'].clear() + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['address'] = 'http://localhost:1,http://localhost:2' + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['api_key'] = 'MyApiKey003' + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['verify_ssl_cert'] = 'False' + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['index_name'] = 'UT_IndexName_004' + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['pipeline_name'] = 'UT_PipelineName_005' + + # Set Message + with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', return_value=elastic_search_api_mock) as patched_ctor: + # Execute Discord Notifier Configure Method + target.configure( + config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] + ) + + # Check Call Args + call_arg = patched_ctor.call_args[1] + self.assertEqual('http://localhost:1', call_arg['hosts'][0]) + self.assertEqual('http://localhost:2', call_arg['hosts'][1]) + self.assertEqual('MyApiKey003', call_arg['api_key']) + self.assertEqual(False, call_arg['verify_certs']) + self.assertIsNone(call_arg['cloud_id']) + + def test_configure_with_cloud_id(self): + """Test configure method with Cloud ID Info.""" + # Setup Mock + elastic_search_api_mock = mock.MagicMock() + + target: ElasticSearchNotifier = ElasticSearchNotifier() + args: Dict = { + 'config': 'unittest_configfile.config' + } + data: Dict = {} + TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) + + # Change Config Map + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'].clear() + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['cloud_id'] = 'deployment-name:dXMtZWFzdDQuZ2Nw' + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['index_name'] = 'UT_IndexName_007' + self.config['NOTIFIER.ELASTIC_SEARCH.UT_01']['pipeline_name'] = 'UT_PipelineName_008' + + # Set Message + with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', + return_value=elastic_search_api_mock) as patched_ctor: + # Execute Discord Notifier Configure Method + target.configure( + config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] + ) + + # Check Call Args + call_arg = patched_ctor.call_args[1] + self.assertEqual('deployment-name:dXMtZWFzdDQuZ2Nw', call_arg['cloud_id']) + self.assertEqual(True, call_arg['verify_certs']) + self.assertIsNone(call_arg['hosts']) + self.assertIsNone(call_arg['api_key']) + + def test_run_without_downloaded_file(self): + """Test Run Method Without Message File Attachment.""" + + # Setup Mock + elastic_search_api_mock = mock.AsyncMock() + elastic_search_api_mock.index = mock.AsyncMock() + + target: ElasticSearchNotifier = ElasticSearchNotifier() + args: Dict = { + 'config': 'unittest_configfile.config' + } + data: Dict = {} + TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) + + # Set Message + message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( + date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), + raw_text="Mocked Raw Text", + group_name="Channel 1972142108", + group_id=1972142108, + from_id="1234", + to_id=9876, + reply_to_msg_id=5544, + message_id=5975883, + is_reply=False, + downloaded_media_info=None, + ) + + with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', return_value=elastic_search_api_mock): + # Execute Discord Notifier Configure Method + target.configure( + config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] + ) + + loop = asyncio.get_event_loop() + loop.run_until_complete( + + # Invoke Test Target + target.run( + entity=message_entity, + rule_id='RULE_UT_01', + source='+15558987453' + ) + ) + + # Check .index call + elastic_search_api_mock.index.assert_called_once() + call_arg = elastic_search_api_mock.index.call_args[1] + + self.assertEqual(call_arg['index'], 'test_index_name') + self.assertEqual(call_arg['pipeline'], 'test_pipeline_name') + self.assertEqual(call_arg['id'], '1972142108_5975883') + + submited_document = call_arg['document'] + expected_document = { + 'time': datetime.datetime(2023, 10, 1, 12, 58, 22, tzinfo=pytz.UTC), + 'source': '+15558987453', + 'rule': 'RULE_UT_01', + 'raw': 'Mocked Raw Text', + 'group_name': 'Channel 1972142108', + 'group_id': 1972142108, + 'from_id': 1234, + 'to_id': 9876, + 'reply_to_msg_id': 5544, + 'message_id': 5975883, + 'is_reply': False, + 'has_media': False, + 'media_mime_type': None, + 'media_size': None + } + + self.assertEqual(submited_document, expected_document) + + def test_run_with_downloaded_file(self): + """Test Run Method With Message File Attachment.""" + + # Setup Mock + elastic_search_api_mock = mock.AsyncMock() + elastic_search_api_mock.index = mock.AsyncMock() + + target: ElasticSearchNotifier = ElasticSearchNotifier() + args: Dict = { + 'config': 'unittest_configfile.config' + } + data: Dict = {} + TestsCommon.execute_basic_pipeline_steps_for_initialization(config=self.config, args=args, data=data) + + # Set Message + message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( + date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), + raw_text="Mocked Raw Text 2", + group_name="Channel 1972142101", + group_id=1972142108, + from_id="1234", + to_id=9876, + reply_to_msg_id=5544, + message_id=5975883, + is_reply=False, + downloaded_media_info=MediaHandlingEntity(media_id=99, file_name='utfile.pdf', content_type='application/pdf', size_bytes=5858), + ) + + with mock.patch('TEx.notifier.elastic_search_notifier.AsyncElasticsearch', return_value=elastic_search_api_mock): + # Execute Discord Notifier Configure Method + target.configure( + config=self.config['NOTIFIER.ELASTIC_SEARCH.UT_01'] + ) + + loop = asyncio.get_event_loop() + loop.run_until_complete( + + # Invoke Test Target + target.run( + entity=message_entity, + rule_id='RULE_UT_01', + source='+15558987453' + ) + ) + + # Check .index call + elastic_search_api_mock.index.assert_called_once() + call_arg = elastic_search_api_mock.index.call_args[1] + + self.assertEqual(call_arg['index'], 'test_index_name') + self.assertEqual(call_arg['pipeline'], 'test_pipeline_name') + self.assertEqual(call_arg['id'], '1972142108_5975883') + + submited_document = call_arg['document'] + expected_document = { + 'time': datetime.datetime(2023, 10, 1, 12, 58, 22, tzinfo=pytz.UTC), + 'source': '+15558987453', + 'rule': 'RULE_UT_01', + 'raw': 'Mocked Raw Text 2', + 'group_name': 'Channel 1972142101', + 'group_id': 1972142108, + 'from_id': 1234, + 'to_id': 9876, + 'reply_to_msg_id': 5544, + 'message_id': 5975883, + 'is_reply': False, + 'has_media': True, + 'media_mime_type': 'application/pdf', + 'media_size': 5858 + } + + self.assertEqual(submited_document, expected_document) From da1e56e9fc36434f5e8d196afcc7f1f5c832b417 Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Fri, 20 Oct 2023 08:54:13 -0300 Subject: [PATCH 10/11] Change Documentation Signed-off-by: Guilherme Bacellar Moralez --- docs/changelog/v030.md | 6 +- .../complete_configuration_file_example.md | 15 ++- docs/finder/finder_catchall.md | 24 ++++ docs/{ => finder}/finder_regex.md | 0 .../notification_discord.md | 0 .../notification_elasticsearch.md | 45 ++++++++ ...tification_elasticsearch_index_template.md | 107 ++++++++++++++++++ mkdocs.yml | 8 +- 8 files changed, 200 insertions(+), 5 deletions(-) create mode 100644 docs/finder/finder_catchall.md rename docs/{ => finder}/finder_regex.md (100%) rename docs/{ => notification}/notification_discord.md (100%) create mode 100644 docs/notification/notification_elasticsearch.md create mode 100644 docs/notification/notification_elasticsearch_index_template.md diff --git a/docs/changelog/v030.md b/docs/changelog/v030.md index 43cb47f..759e67a 100644 --- a/docs/changelog/v030.md +++ b/docs/changelog/v030.md @@ -4,6 +4,8 @@ - Proxy (HTTP, SOCKS4, SOCKS5) support ([#26](https://github.com/guibacellar/TEx/issues/26)) - Discord Notifications now have a source information with account/phone number +- New Message Finder Rule to Catch All Messages +- New Notification connector for Elastic Search ([#12](https://github.com/guibacellar/TEx/issues/12)) **🐛 Bug Fixes** @@ -11,4 +13,6 @@ **⚙️ Internal Improvements** -- Replace Pylint, PyDocStyle and Flake8 code quality tools for Ruff ([#22](https://github.com/guibacellar/TEx/issues/22)) \ No newline at end of file +- Replace Pylint, PyDocStyle and Flake8 code quality tools for Ruff ([#22](https://github.com/guibacellar/TEx/issues/22)) +- Fix Invalid TypeHint for Message Object from Telethon +- Changes in message finder and notification system to use a facade objects with Pydantic to reduce cognitive complexity and allow the construction of new connectors more easily diff --git a/docs/configuration/complete_configuration_file_example.md b/docs/configuration/complete_configuration_file_example.md index 7ea68ad..62c095f 100644 --- a/docs/configuration/complete_configuration_file_example.md +++ b/docs/configuration/complete_configuration_file_example.md @@ -1,6 +1,6 @@ # Complete Configuration File Example -This is an example of a complete configuration file with three finder rules using two discord hooks. +This is an example of a complete configuration file with four finder rules using two discord hooks and one elastic search connector. ```ini [CONFIGURATION] @@ -29,13 +29,17 @@ notifier=NOTIFIER.DISCORD.MY_HOOK_1 [FINDER.RULE.FindMessagesWithCreditCard] type=regex regex=(^4[0-9]{12}(?:[0-9]{3})?$)|(^(?:5[1-5][0-9]{2}|222[1-9]|22[3-9][0-9]|2[3-6][0-9]{2}|27[01][0-9]|2720)[0-9]{12}$)|(3[47][0-9]{13})|(^3(?:0[0-5]|[68][0-9])[0-9]{11}$)|(^6(?:011|5[0-9]{2})[0-9]{12}$)|(^(?:2131|1800|35\d{3})\d{11}$) -notifier=NOTIFIER.DISCORD.MY_HOOK_2 +notifier=NOTIFIER.DISCORD.MY_HOOK_2,NOTIFIER.ELASTIC_SEARCH.GENERAL [FINDER.RULE.FindMessagesWithEmail] type=regex regex=^[\w-\.]+@([\w-]+\.)+[\w-]{2,4}$ notifier=NOTIFIER.DISCORD.MY_HOOK_1,NOTIFIER.DISCORD.MY_HOOK_2 +[FINDER.RULE.CatchAll] +type=all +notifier=NOTIFIER.ELASTIC_SEARCH.GENERAL + [NOTIFIER.DISCORD.MY_HOOK_1] webhook=https://discord.com/api/webhooks/1157896186751897357/o7foobar4txvAvKSdeadHiI-9XYeXaGlQtd-5PtrrX_eCE0XElWktpPqjrZ0KbeefPtQC prevent_duplication_for_minutes=240 @@ -43,4 +47,11 @@ prevent_duplication_for_minutes=240 [NOTIFIER.DISCORD.MY_HOOK_2] webhook=https://discord.com/api/webhooks/1128765187657681875/foobarqOMFp_4tM2ic2mbeefNPOZqJnBZZdfaubQv2vJgbYzfdeadZd5aqGX6FmCmbNjX prevent_duplication_for_minutes=240 + +[NOTIFIER.ELASTIC_SEARCH.GENERAL] +address=https://localhost:9200 +api_key=bHJtVEg0c0JnNkwwTnYtFFDEADlo6NS1rXzd6NVFSUmEtQ21mQldiUjEwUQ== +verify_ssl_cert=False +index_name=index-name +pipeline_name=ent-search-generic-ingestion ``` diff --git a/docs/finder/finder_catchall.md b/docs/finder/finder_catchall.md new file mode 100644 index 0000000..3302ab0 --- /dev/null +++ b/docs/finder/finder_catchall.md @@ -0,0 +1,24 @@ +# Message Finder System - Catch All Messages + +**Compatibility:** Message Listener Command + +Telegram Explorer allows to catch all messages and redirect to one or more notifications connectior. + +**Configuration Spec:** + +For each rule to be used, you must set a configuration using the default name schema *FINDER.RULE.* + +**Parameters:** + + * **type** > Required - Fixed Value 'all' + * **notifier** > Required - Name of notifiers to be used to notify the triggered message (comma separated). + +**Changes on Configuration File** +```ini +[FINDER] +enabled=true + +[FINDER.RULE.CatchAll] +type=all +notifier=NOTIFIER.ELASTIC_SEARCH.GENERAL +``` \ No newline at end of file diff --git a/docs/finder_regex.md b/docs/finder/finder_regex.md similarity index 100% rename from docs/finder_regex.md rename to docs/finder/finder_regex.md diff --git a/docs/notification_discord.md b/docs/notification/notification_discord.md similarity index 100% rename from docs/notification_discord.md rename to docs/notification/notification_discord.md diff --git a/docs/notification/notification_elasticsearch.md b/docs/notification/notification_elasticsearch.md new file mode 100644 index 0000000..733a21c --- /dev/null +++ b/docs/notification/notification_elasticsearch.md @@ -0,0 +1,45 @@ +# Notification System - Elastic Search Connector + +Telegram Explorer allows to send notifications to Elastic Search through ingestion API. + +Every Notification is defined in the configuration files. + +!!! info "Elastic Search Compatibility" + + Tested on Elastic Search 8+ + +!!! warning "Index Template" + + If you want, and we recommend, create a new Index Template before create your indexes. Please, check on "Notification System" > "Elastic Search Connector" > "Index Template" for more information. + +**Configuration Spec:** + +For each connector you must set a configuration using the default name schema *NOTIFIER.ELASTIC_SEARCH.* + +**Parameters:** + + * **address** > Optional - Elastic Search Address. Multiple values comma separated. + * **api_key** > Required - Elastic Search API Key. + * **cloud_id** > Optional - Elastic Search Cloud ID. + * **verify_ssl_cert** > Optional - Configure if the connector checks the SSL cert. Default=True + * **index_name** > Required - Elastic Search Index Name. + * **pipeline_name** > Required - Elastic Search Ingestion Pipeline Name. + + +**Changes on Configuration File (with Address)** +```ini +address=https://elastic_search_url_1:9200,https://elastic_search_url_2:9200 +api_key=bHJtVEg0c0JnNkwwTnYtYTFdeadbeefrXzd6NVFSUmEtQ21mQldiUjEwUQ== +verify_ssl_cert=False +index_name=search-telegram_explorer +pipeline_name=ent-search-generic-ingestion +``` + +**Changes on Configuration File (with Cloud ID)** +```ini +cloud_id=deployment-name:dXMtZWFzdDQuZ2Nw +api_key=bHJtVEg0c0JnNkwwTnYtYTFdeadbeefrXzd6NVFSUmEtQ21mQldiUjEwUQ== +verify_ssl_cert=True +index_name=search-telegram_explorer +pipeline_name=ent-search-generic-ingestion +``` diff --git a/docs/notification/notification_elasticsearch_index_template.md b/docs/notification/notification_elasticsearch_index_template.md new file mode 100644 index 0000000..702b8fe --- /dev/null +++ b/docs/notification/notification_elasticsearch_index_template.md @@ -0,0 +1,107 @@ +# Notification System - Elastic Search Connector - Index Template + +If you want, create a new Index Template before create all Telegram Explorer indexes. + +This will help you to get the best of all data provided and allow's to extract many more value and informations from the data. + +**Index Template JSON** +```json +{ + "settings": { + "index": { + "routing": { + "allocation": { + "include": { + "_tier_preference": "data_content" + } + } + } + } + }, + "mappings": { + "dynamic": "true", + "dynamic_date_formats": [ + "strict_date_optional_time", + "yyyy/MM/dd HH:mm:ss Z||yyyy/MM/dd Z" + ], + "dynamic_templates": [], + "date_detection": true, + "numeric_detection": false, + "properties": { + "from_id": { + "type": "long" + }, + "group_id": { + "type": "long" + }, + "group_name": { + "type": "text", + "fielddata": true, + "fielddata_frequency_filter": { + "min": 0.01, + "max": 1, + "min_segment_size": 50 + } + }, + "has_media": { + "type": "boolean" + }, + "is_reply": { + "type": "boolean" + }, + "media_mime_type": { + "type": "text", + "fielddata": true, + "fielddata_frequency_filter": { + "min": 0.01, + "max": 1, + "min_segment_size": 50 + } + }, + "media_size": { + "type": "long" + }, + "message_id": { + "type": "text" + }, + "raw": { + "type": "text", + "fielddata": true, + "fielddata_frequency_filter": { + "min": 0.01, + "max": 1, + "min_segment_size": 50 + } + }, + "reply_to_msg_id": { + "type": "long" + }, + "rule": { + "type": "text", + "fielddata": true, + "fielddata_frequency_filter": { + "min": 0.01, + "max": 1, + "min_segment_size": 50 + } + }, + "source": { + "type": "text", + "fielddata": true, + "fielddata_frequency_filter": { + "min": 0.01, + "max": 1, + "min_segment_size": 50 + } + }, + "time": { + "type": "date" + }, + "to_id": { + "type": "long" + } + } + }, + "aliases": {} +} +``` diff --git a/mkdocs.yml b/mkdocs.yml index 0f3fc15..89bba85 100644 --- a/mkdocs.yml +++ b/mkdocs.yml @@ -31,9 +31,13 @@ nav: - 'Listen Messages': 'how_use/usage_message_listener.md' - 'Download Messages': 'how_use/usage_download_messages.md' - 'Notification System': - - 'Discord Notification Hook': 'notification_discord.md' + - 'Discord Notification Hook': 'notification/notification_discord.md' + - 'Elastic Search Connector': + - 'Configuration': 'notification/notification_elasticsearch.md' + - 'Index Template': 'notification/notification_elasticsearch_index_template.md' - 'Message Finder System': - - 'RegEx Finder': 'finder_regex.md' + - 'Catch All': 'finder/finder_catchall.md' + - 'RegEx Finder': 'finder/finder_regex.md' - 'Reports': - 'Export Files': 'report/report_export_files.md' - 'HTML Report': 'report/report_html.md' From 6b7094a7a99378bee29f0a65cbd48d7fcb146e6a Mon Sep 17 00:00:00 2001 From: Guilherme Bacellar Moralez Date: Fri, 20 Oct 2023 09:02:27 -0300 Subject: [PATCH 11/11] Added UTC Timezone on Tests that fails on UTC Machines but works on GTM-3 machines. Signed-off-by: Guilherme Bacellar Moralez --- tests/notifier/test_elastic_search_notifier.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/tests/notifier/test_elastic_search_notifier.py b/tests/notifier/test_elastic_search_notifier.py index 6c9e8a0..7dc3077 100644 --- a/tests/notifier/test_elastic_search_notifier.py +++ b/tests/notifier/test_elastic_search_notifier.py @@ -103,7 +103,7 @@ def test_run_without_downloaded_file(self): # Set Message message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( - date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), + date_time=datetime.datetime(2023, 10, 1, 9, 58, 22, tzinfo=pytz.UTC), raw_text="Mocked Raw Text", group_name="Channel 1972142108", group_id=1972142108, @@ -142,7 +142,7 @@ def test_run_without_downloaded_file(self): submited_document = call_arg['document'] expected_document = { - 'time': datetime.datetime(2023, 10, 1, 12, 58, 22, tzinfo=pytz.UTC), + 'time': datetime.datetime(2023, 10, 1, 9, 58, 22, tzinfo=pytz.UTC), 'source': '+15558987453', 'rule': 'RULE_UT_01', 'raw': 'Mocked Raw Text', @@ -176,7 +176,7 @@ def test_run_with_downloaded_file(self): # Set Message message_entity: FinderNotificationMessageEntity = FinderNotificationMessageEntity( - date_time=datetime.datetime(2023, 10, 1, 9, 58, 22), + date_time=datetime.datetime(2023, 10, 1, 9, 58, 22, tzinfo=pytz.UTC), raw_text="Mocked Raw Text 2", group_name="Channel 1972142101", group_id=1972142108, @@ -215,7 +215,7 @@ def test_run_with_downloaded_file(self): submited_document = call_arg['document'] expected_document = { - 'time': datetime.datetime(2023, 10, 1, 12, 58, 22, tzinfo=pytz.UTC), + 'time': datetime.datetime(2023, 10, 1, 9, 58, 22, tzinfo=pytz.UTC), 'source': '+15558987453', 'rule': 'RULE_UT_01', 'raw': 'Mocked Raw Text 2',