feat: init tg nodes, init web view
This commit is contained in:
parent
09c0cb6a44
commit
b50b9b8980
6
Dockerfile
Normal file
6
Dockerfile
Normal file
@ -0,0 +1,6 @@
|
||||
FROM python:3.12-slim
|
||||
WORKDIR /app
|
||||
COPY . /app
|
||||
RUN pip install --no-cache-dir -r requirements.txt
|
||||
EXPOSE 5000
|
||||
CMD ["python", "web/app.py"]
|
27
docker-compose.yaml
Normal file
27
docker-compose.yaml
Normal file
@ -0,0 +1,27 @@
|
||||
version: '3.8'
|
||||
|
||||
services:
|
||||
web:
|
||||
build: .
|
||||
container_name: tg-monitor
|
||||
ports:
|
||||
- "5000:5000"
|
||||
volumes:
|
||||
- .:/app
|
||||
command: python web/app.py
|
||||
depends_on:
|
||||
- tg_node_0
|
||||
- tg_node_1
|
||||
|
||||
tg_node_0:
|
||||
build: .
|
||||
container_name: tg-node-0
|
||||
command: python tg/node_tg_0.py
|
||||
|
||||
tg_node_1:
|
||||
build: .
|
||||
container_name: tg-node-1
|
||||
command: python tg/node_tg_1.py
|
||||
|
||||
volumes:
|
||||
pg_data:
|
402
patcher.py
402
patcher.py
@ -1,402 +0,0 @@
|
||||
#!/usr/bin/env python3
|
||||
# this module is part of undetected_chromedriver
|
||||
|
||||
from distutils.version import LooseVersion
|
||||
import io
|
||||
import json
|
||||
import logging
|
||||
import os
|
||||
import pathlib
|
||||
import platform
|
||||
import random
|
||||
import re
|
||||
import shutil
|
||||
import string
|
||||
import sys
|
||||
import time
|
||||
from urllib.request import urlopen
|
||||
from urllib.request import urlretrieve
|
||||
import zipfile
|
||||
from multiprocessing import Lock
|
||||
import secrets
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
IS_POSIX = sys.platform.startswith(("darwin", "cygwin", "linux", "linux2"))
|
||||
|
||||
|
||||
class Patcher(object):
|
||||
lock = Lock()
|
||||
exe_name = "chromedriver%s"
|
||||
|
||||
platform = sys.platform
|
||||
if platform.endswith("win32"):
|
||||
d = "~/appdata/roaming/undetected_chromedriver"
|
||||
elif "LAMBDA_TASK_ROOT" in os.environ:
|
||||
d = "/tmp/undetected_chromedriver"
|
||||
elif platform.startswith(("linux", "linux2")):
|
||||
d = "~/.local/share/undetected_chromedriver"
|
||||
elif platform.endswith("darwin"):
|
||||
d = "~/Library/Application Support/undetected_chromedriver"
|
||||
else:
|
||||
d = "~/.undetected_chromedriver"
|
||||
data_path = os.path.abspath(os.path.expanduser(d))
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
executable_path=None,
|
||||
force=False,
|
||||
version_main: int = 0,
|
||||
user_multi_procs=False,
|
||||
):
|
||||
"""
|
||||
Args:
|
||||
executable_path: None = automatic
|
||||
a full file path to the chromedriver executable
|
||||
force: False
|
||||
terminate processes which are holding lock
|
||||
version_main: 0 = auto
|
||||
specify main chrome version (rounded, ex: 82)
|
||||
"""
|
||||
self.force = force
|
||||
self._custom_exe_path = False
|
||||
prefix = secrets.token_hex(8)
|
||||
self.user_multi_procs = user_multi_procs
|
||||
|
||||
self.is_old_chromedriver = version_main and version_main <= 114
|
||||
# Needs to be called before self.exe_name is accessed
|
||||
self._set_platform_name()
|
||||
|
||||
if not os.path.exists(self.data_path):
|
||||
os.makedirs(self.data_path, exist_ok=True)
|
||||
|
||||
if not executable_path:
|
||||
self.executable_path = os.path.join(
|
||||
self.data_path, "_".join([prefix, self.exe_name])
|
||||
)
|
||||
|
||||
if not IS_POSIX:
|
||||
if executable_path:
|
||||
if not executable_path[-4:] == ".exe":
|
||||
executable_path += ".exe"
|
||||
|
||||
self.zip_path = os.path.join(self.data_path, prefix)
|
||||
|
||||
if not executable_path:
|
||||
if not self.user_multi_procs:
|
||||
self.executable_path = os.path.abspath(
|
||||
os.path.join(".", self.executable_path)
|
||||
)
|
||||
|
||||
if executable_path:
|
||||
self._custom_exe_path = True
|
||||
self.executable_path = executable_path
|
||||
|
||||
# Set the correct repository to download the Chromedriver from
|
||||
if self.is_old_chromedriver:
|
||||
self.url_repo = "https://chromedriver.storage.googleapis.com"
|
||||
else:
|
||||
self.url_repo = "https://googlechromelabs.github.io/chrome-for-testing"
|
||||
|
||||
self.version_main = version_main
|
||||
self.version_full = None
|
||||
|
||||
def _set_platform_name(self):
|
||||
"""
|
||||
Set the platform and exe name based on the platform undetected_chromedriver is running on
|
||||
in order to download the correct chromedriver.
|
||||
"""
|
||||
if self.platform.endswith("win32"):
|
||||
self.platform_name = "win32"
|
||||
self.exe_name %= ".exe"
|
||||
if self.platform.endswith(("linux", "linux2")):
|
||||
self.platform_name = "linux64"
|
||||
self.exe_name %= ""
|
||||
if self.platform.endswith("darwin"):
|
||||
if self.is_old_chromedriver:
|
||||
self.platform_name = "mac64"
|
||||
else:
|
||||
self.platform_name = "mac-x64"
|
||||
self.exe_name %= ""
|
||||
|
||||
def auto(self, executable_path=None, force=False, version_main=None, _=None):
|
||||
"""
|
||||
|
||||
Args:
|
||||
executable_path:
|
||||
force:
|
||||
version_main:
|
||||
|
||||
Returns:
|
||||
|
||||
"""
|
||||
p = pathlib.Path(self.data_path)
|
||||
if self.user_multi_procs:
|
||||
with Lock():
|
||||
files = list(p.rglob("*chromedriver*"))
|
||||
most_recent = max(files, key=lambda f: f.stat().st_mtime)
|
||||
files.remove(most_recent)
|
||||
list(map(lambda f: f.unlink(), files))
|
||||
if self.is_binary_patched(most_recent):
|
||||
self.executable_path = str(most_recent)
|
||||
return True
|
||||
|
||||
if executable_path:
|
||||
self.executable_path = executable_path
|
||||
self._custom_exe_path = True
|
||||
|
||||
if self._custom_exe_path:
|
||||
ispatched = self.is_binary_patched(self.executable_path)
|
||||
if not ispatched:
|
||||
return self.patch_exe()
|
||||
else:
|
||||
return
|
||||
|
||||
if version_main:
|
||||
self.version_main = version_main
|
||||
if force is True:
|
||||
self.force = force
|
||||
|
||||
try:
|
||||
os.unlink(self.executable_path)
|
||||
except PermissionError:
|
||||
if self.force:
|
||||
self.force_kill_instances(self.executable_path)
|
||||
return self.auto(force=not self.force)
|
||||
try:
|
||||
if self.is_binary_patched():
|
||||
# assumes already running AND patched
|
||||
return True
|
||||
except PermissionError:
|
||||
pass
|
||||
# return False
|
||||
except FileNotFoundError:
|
||||
pass
|
||||
|
||||
release = self.fetch_release_number()
|
||||
self.version_main = release.version[0]
|
||||
self.version_full = release
|
||||
self.unzip_package(self.fetch_package())
|
||||
return self.patch()
|
||||
|
||||
def driver_binary_in_use(self, path: str = None) -> bool:
|
||||
"""
|
||||
naive test to check if a found chromedriver binary is
|
||||
currently in use
|
||||
|
||||
Args:
|
||||
path: a string or PathLike object to the binary to check.
|
||||
if not specified, we check use this object's executable_path
|
||||
"""
|
||||
if not path:
|
||||
path = self.executable_path
|
||||
p = pathlib.Path(path)
|
||||
|
||||
if not p.exists():
|
||||
raise OSError("file does not exist: %s" % p)
|
||||
try:
|
||||
with open(p, mode="a+b") as fs:
|
||||
exc = []
|
||||
try:
|
||||
|
||||
fs.seek(0, 0)
|
||||
except PermissionError as e:
|
||||
exc.append(e) # since some systems apprently allow seeking
|
||||
# we conduct another test
|
||||
try:
|
||||
fs.readline()
|
||||
except PermissionError as e:
|
||||
exc.append(e)
|
||||
|
||||
if exc:
|
||||
|
||||
return True
|
||||
return False
|
||||
# ok safe to assume this is in use
|
||||
except Exception as e:
|
||||
# logger.exception("whoops ", e)
|
||||
pass
|
||||
|
||||
def cleanup_unused_files(self):
|
||||
p = pathlib.Path(self.data_path)
|
||||
items = list(p.glob("*undetected*"))
|
||||
for item in items:
|
||||
try:
|
||||
item.unlink()
|
||||
except:
|
||||
pass
|
||||
|
||||
def patch(self):
|
||||
self.patch_exe()
|
||||
return self.is_binary_patched()
|
||||
|
||||
def fetch_release_number(self):
|
||||
"""
|
||||
Gets the latest major version available, or the latest major version of self.target_version if set explicitly.
|
||||
:return: version string
|
||||
:rtype: LooseVersion
|
||||
"""
|
||||
# Endpoint for old versions of Chromedriver (114 and below)
|
||||
if self.is_old_chromedriver:
|
||||
path = f"/latest_release_{self.version_main}"
|
||||
path = path.upper()
|
||||
logger.debug("getting release number from %s" % path)
|
||||
return LooseVersion(urlopen(self.url_repo + path).read().decode())
|
||||
|
||||
# Endpoint for new versions of Chromedriver (115+)
|
||||
if not self.version_main:
|
||||
# Fetch the latest version
|
||||
path = "/last-known-good-versions-with-downloads.json"
|
||||
logger.debug("getting release number from %s" % path)
|
||||
with urlopen(self.url_repo + path) as conn:
|
||||
response = conn.read().decode()
|
||||
|
||||
last_versions = json.loads(response)
|
||||
return LooseVersion(last_versions["channels"]["Stable"]["version"])
|
||||
|
||||
# Fetch the latest minor version of the major version provided
|
||||
path = "/latest-versions-per-milestone-with-downloads.json"
|
||||
logger.debug("getting release number from %s" % path)
|
||||
with urlopen(self.url_repo + path) as conn:
|
||||
response = conn.read().decode()
|
||||
|
||||
major_versions = json.loads(response)
|
||||
return LooseVersion(major_versions["milestones"][str(self.version_main)]["version"])
|
||||
|
||||
def parse_exe_version(self):
|
||||
with io.open(self.executable_path, "rb") as f:
|
||||
for line in iter(lambda: f.readline(), b""):
|
||||
match = re.search(rb"platform_handle\x00content\x00([0-9.]*)", line)
|
||||
if match:
|
||||
return LooseVersion(match[1].decode())
|
||||
|
||||
def fetch_package(self):
|
||||
"""
|
||||
Downloads ChromeDriver from source
|
||||
|
||||
:return: path to downloaded file
|
||||
"""
|
||||
zip_name = f"chromedriver_{self.platform_name}.zip"
|
||||
if self.is_old_chromedriver:
|
||||
download_url = "%s/%s/%s" % (self.url_repo, self.version_full.vstring, zip_name)
|
||||
else:
|
||||
zip_name = zip_name.replace("_", "-", 1)
|
||||
download_url = "https://storage.googleapis.com/chrome-for-testing-public/%s/%s/%s"
|
||||
download_url %= (self.version_full.vstring, self.platform_name, zip_name)
|
||||
|
||||
logger.debug("downloading from %s" % download_url)
|
||||
return urlretrieve(download_url)[0]
|
||||
|
||||
def unzip_package(self, fp):
|
||||
"""
|
||||
Does what it says
|
||||
|
||||
:return: path to unpacked executable
|
||||
"""
|
||||
exe_path = self.exe_name
|
||||
if not self.is_old_chromedriver:
|
||||
# The new chromedriver unzips into its own folder
|
||||
zip_name = f"chromedriver-{self.platform_name}"
|
||||
exe_path = os.path.join(zip_name, self.exe_name)
|
||||
|
||||
logger.debug("unzipping %s" % fp)
|
||||
try:
|
||||
os.unlink(self.zip_path)
|
||||
except (FileNotFoundError, OSError):
|
||||
pass
|
||||
|
||||
os.makedirs(self.zip_path, mode=0o755, exist_ok=True)
|
||||
with zipfile.ZipFile(fp, mode="r") as zf:
|
||||
zf.extractall(self.zip_path)
|
||||
os.rename(os.path.join(self.zip_path, exe_path), self.executable_path)
|
||||
os.remove(fp)
|
||||
shutil.rmtree(self.zip_path)
|
||||
os.chmod(self.executable_path, 0o755)
|
||||
return self.executable_path
|
||||
|
||||
@staticmethod
|
||||
def force_kill_instances(exe_name):
|
||||
"""
|
||||
kills running instances.
|
||||
:param: executable name to kill, may be a path as well
|
||||
|
||||
:return: True on success else False
|
||||
"""
|
||||
exe_name = os.path.basename(exe_name)
|
||||
if IS_POSIX:
|
||||
r = os.system("kill -f -9 $(pidof %s)" % exe_name)
|
||||
else:
|
||||
r = os.system("taskkill /f /im %s" % exe_name)
|
||||
return not r
|
||||
|
||||
@staticmethod
|
||||
def gen_random_cdc():
|
||||
cdc = random.choices(string.ascii_letters, k=27)
|
||||
return "".join(cdc).encode()
|
||||
|
||||
def is_binary_patched(self, executable_path=None):
|
||||
executable_path = executable_path or self.executable_path
|
||||
try:
|
||||
with io.open(executable_path, "rb") as fh:
|
||||
return fh.read().find(b"undetected chromedriver") != -1
|
||||
except FileNotFoundError:
|
||||
return False
|
||||
|
||||
def patch_exe(self):
|
||||
start = time.perf_counter()
|
||||
logger.info("patching driver executable %s" % self.executable_path)
|
||||
with io.open(self.executable_path, "r+b") as fh:
|
||||
content = fh.read()
|
||||
# match_injected_codeblock = re.search(rb"{window.*;}", content)
|
||||
match_injected_codeblock = re.search(rb"\{window\.cdc.*?;\}", content)
|
||||
if match_injected_codeblock:
|
||||
target_bytes = match_injected_codeblock[0]
|
||||
new_target_bytes = (
|
||||
b'{console.log("undetected chromedriver 1337!")}'.ljust(
|
||||
len(target_bytes), b" "
|
||||
)
|
||||
)
|
||||
new_content = content.replace(target_bytes, new_target_bytes)
|
||||
if new_content == content:
|
||||
logger.warning(
|
||||
"something went wrong patching the driver binary. could not find injection code block"
|
||||
)
|
||||
else:
|
||||
logger.debug(
|
||||
"found block:\n%s\nreplacing with:\n%s"
|
||||
% (target_bytes, new_target_bytes)
|
||||
)
|
||||
fh.seek(0)
|
||||
fh.write(new_content)
|
||||
logger.debug(
|
||||
"patching took us {:.2f} seconds".format(time.perf_counter() - start)
|
||||
)
|
||||
|
||||
def __repr__(self):
|
||||
return "{0:s}({1:s})".format(
|
||||
self.__class__.__name__,
|
||||
self.executable_path,
|
||||
)
|
||||
|
||||
def __del__(self):
|
||||
if self._custom_exe_path:
|
||||
# if the driver binary is specified by user
|
||||
# we assume it is important enough to not delete it
|
||||
return
|
||||
else:
|
||||
timeout = 3 # stop trying after this many seconds
|
||||
t = time.monotonic()
|
||||
now = lambda: time.monotonic()
|
||||
while now() - t > timeout:
|
||||
# we don't want to wait until the end of time
|
||||
try:
|
||||
if self.user_multi_procs:
|
||||
break
|
||||
os.unlink(self.executable_path)
|
||||
logger.debug("successfully unlinked %s" % self.executable_path)
|
||||
break
|
||||
except (OSError, RuntimeError, PermissionError):
|
||||
time.sleep(0.01)
|
||||
continue
|
||||
except FileNotFoundError:
|
||||
break
|
@ -4,4 +4,7 @@ python-dotenv
|
||||
tls-client
|
||||
undetected-chromedriver
|
||||
selenium
|
||||
grpc_interceptor_headers
|
||||
grpc_interceptor_headers
|
||||
telethon
|
||||
schedule
|
||||
psycopg2-binary
|
14
runner.sh
14
runner.sh
@ -1,14 +0,0 @@
|
||||
#!/bin/bash
|
||||
|
||||
TARGET_DIR=$(python -c "import undetected_chromedriver as uc; print(uc.__path__[0])" 2>/dev/null)
|
||||
|
||||
if [ -d "$TARGET_DIR" ]; then
|
||||
echo "patcher.py в $TARGET_DIR"
|
||||
cp patcher.py "$TARGET_DIR"
|
||||
else
|
||||
echo "undetected_chromedriver не найден"
|
||||
fi
|
||||
|
||||
pip install -r requirements.txt
|
||||
|
||||
python initiator.py
|
73
tg/tg_crawler.py
Normal file
73
tg/tg_crawler.py
Normal file
@ -0,0 +1,73 @@
|
||||
import logging
|
||||
import psycopg2
|
||||
from datetime import datetime
|
||||
from telethon.sync import TelegramClient
|
||||
from telethon.tl.functions.messages import GetHistoryRequest
|
||||
|
||||
logging.basicConfig(
|
||||
level=logging.INFO,
|
||||
format='%(asctime)s - %(levelname)s - %(message)s',
|
||||
handlers=[
|
||||
logging.FileHandler('tg_nodes.log'),
|
||||
logging.StreamHandler()
|
||||
]
|
||||
)
|
||||
|
||||
class TelegramChannelMonitor:
|
||||
db_config = None
|
||||
|
||||
def __init__(self, session_name, api_id, api_hash, channel_username, source_name):
|
||||
self.session_name = session_name
|
||||
self.api_id = api_id
|
||||
self.api_hash = api_hash
|
||||
self.channel_username = channel_username
|
||||
self.source_name = source_name
|
||||
|
||||
@classmethod
|
||||
def set_db_config(cls, config):
|
||||
cls.db_config = config
|
||||
|
||||
def fetch_last_post(self):
|
||||
logging.info(f"[{self.source_name}] checking a new post...")
|
||||
|
||||
try:
|
||||
with TelegramClient(self.session_name, self.api_id, self.api_hash) as client:
|
||||
entity = client.get_entity(self.channel_username)
|
||||
history = client(GetHistoryRequest(
|
||||
peer=entity,
|
||||
limit=1,
|
||||
offset_date=None,
|
||||
offset_id=0,
|
||||
max_id=0,
|
||||
min_id=0,
|
||||
add_offset=0,
|
||||
hash=0
|
||||
))
|
||||
|
||||
if history.messages:
|
||||
msg = history.messages[0]
|
||||
logging.info(f"[{self.source_name}] received a post: {msg.message[:60]}...")
|
||||
self.save_to_db(self.source_name, msg.message)
|
||||
else:
|
||||
logging.info(f"[{self.source_name}] there is no new messages")
|
||||
except Exception as e:
|
||||
logging.error(f"[{self.source_name}] error when receiving a post: {e}")
|
||||
|
||||
def save_to_db(self, source, message):
|
||||
if not self.db_config:
|
||||
logging.error("DB config is not set")
|
||||
return
|
||||
|
||||
try:
|
||||
conn = psycopg2.connect(**self.db_config)
|
||||
cur = conn.cursor()
|
||||
cur.execute(
|
||||
"INSERT INTO leaks (source, message) VALUES (%s, %s)",
|
||||
(source, message)
|
||||
)
|
||||
conn.commit()
|
||||
cur.close()
|
||||
conn.close()
|
||||
logging.info(f"[{self.source_name}] message is recorded in the database")
|
||||
except Exception as e:
|
||||
logging.error(f"[{self.source_name}] error when writing to the database: {e}")
|
34
tg/tg_node_0.py
Normal file
34
tg/tg_node_0.py
Normal file
@ -0,0 +1,34 @@
|
||||
import asyncio
|
||||
import os
|
||||
from apscheduler.schedulers.asyncio import AsyncIOScheduler
|
||||
from pytz import timezone
|
||||
from tg_crawler import TelegramChannelMonitor
|
||||
from dotenv import load_dotenv
|
||||
|
||||
load_dotenv()
|
||||
|
||||
TelegramChannelMonitor.set_db_config({
|
||||
'host': os.getenv("HOST"),
|
||||
'port': os.getenv("PORT"),
|
||||
'database': os.getenv("DBNAME"),
|
||||
'user': os.getenv("USER"),
|
||||
'password': os.getenv("PASSWORD")
|
||||
})
|
||||
|
||||
monitor = TelegramChannelMonitor(
|
||||
session_name='session_trueosint',
|
||||
api_id=os.getenv("TELETHON_API_ID"),
|
||||
api_hash=os.getenv("TELETHON_API_HASH"),
|
||||
channel_username='trueosint',
|
||||
source_name='trueosint'
|
||||
)
|
||||
|
||||
def main():
|
||||
scheduler = AsyncIOScheduler()
|
||||
scheduler.add_job(monitor.fetch_last_post, "cron", hour=9, minute=0, timezone=timezone("Europe/Moscow"))
|
||||
scheduler.start()
|
||||
|
||||
asyncio.get_event_loop().run_forever()
|
||||
|
||||
if __name__ == '__main__':
|
||||
main()
|
34
tg/tg_node_1.py
Normal file
34
tg/tg_node_1.py
Normal file
@ -0,0 +1,34 @@
|
||||
import asyncio
|
||||
import os
|
||||
from apscheduler.schedulers.asyncio import AsyncIOScheduler
|
||||
from pytz import timezone
|
||||
from tg_crawler import TelegramChannelMonitor
|
||||
from dotenv import load_dotenv
|
||||
|
||||
load_dotenv()
|
||||
|
||||
TelegramChannelMonitor.set_db_config({
|
||||
'host': os.getenv("HOST"),
|
||||
'port': os.getenv("PORT"),
|
||||
'database': os.getenv("DBNAME"),
|
||||
'user': os.getenv("USER"),
|
||||
'password': os.getenv("PASSWORD")
|
||||
})
|
||||
|
||||
monitor = TelegramChannelMonitor(
|
||||
session_name='session_dataleak',
|
||||
api_id=os.getenv("TELETHON_API_ID"),
|
||||
api_hash=os.getenv("TELETHON_API_HASH"),
|
||||
channel_username='dataleak',
|
||||
source_name='dataleak'
|
||||
)
|
||||
|
||||
def main():
|
||||
scheduler = AsyncIOScheduler()
|
||||
scheduler.add_job(monitor.fetch_last_post, "cron", hour=9, minute=0, timezone=timezone("Europe/Moscow"))
|
||||
scheduler.start()
|
||||
|
||||
asyncio.get_event_loop().run_forever()
|
||||
|
||||
if __name__ == '__main__':
|
||||
main()
|
34
web/app.py
Normal file
34
web/app.py
Normal file
@ -0,0 +1,34 @@
|
||||
import os
|
||||
from flask import Flask, render_template
|
||||
import psycopg2
|
||||
|
||||
app = Flask(__name__)
|
||||
|
||||
DB_CONFIG = {
|
||||
'host': os.getenv("HOST"),
|
||||
'port': os.getenv("PORT"),
|
||||
'database': os.getenv("DBNAME"),
|
||||
'user': os.getenv("USER"),
|
||||
'password': os.getenv("PASSWORD")
|
||||
}
|
||||
|
||||
@app.route("/")
|
||||
def index():
|
||||
with psycopg2.connect(**DB_CONFIG) as conn:
|
||||
with conn.cursor() as cur:
|
||||
cur.execute("SELECT source, message, created_at FROM leaks ORDER BY created_at DESC LIMIT 50")
|
||||
leaks = cur.fetchall()
|
||||
return render_template("index.html", leaks=leaks)
|
||||
|
||||
@app.route("/logs")
|
||||
def logs():
|
||||
log_path = os.path.join(os.path.dirname(__file__), '..', 'tg_nodes.log')
|
||||
try:
|
||||
with open(log_path, 'r', encoding='utf-8') as f:
|
||||
lines = f.readlines()[-100:]
|
||||
except FileNotFoundError:
|
||||
lines = ["Лог-файл не найден"]
|
||||
return render_template("logs.html", logs=lines)
|
||||
|
||||
if __name__ == "__main__":
|
||||
app.run(debug=True)
|
368
web/templates/index.html
Normal file
368
web/templates/index.html
Normal file
@ -0,0 +1,368 @@
|
||||
<!DOCTYPE html>
|
||||
<html lang="ru">
|
||||
<head>
|
||||
<meta charset="UTF-8">
|
||||
<meta name="viewport" content="width=device-width, initial-scale=1.0">
|
||||
<title>Система мониторинга утечек данных</title>
|
||||
<link rel="stylesheet" href="https://unpkg.com/leaflet@1.7.1/dist/leaflet.css" />
|
||||
<style>
|
||||
body {
|
||||
background-color: #1e1e1e;
|
||||
color: #ffffff;
|
||||
font-family: 'Arial', sans-serif;
|
||||
margin: 0;
|
||||
padding: 0;
|
||||
display: flex;
|
||||
transition: margin-left 0.3s ease;
|
||||
min-height: 100vh;
|
||||
overflow: hidden;
|
||||
}
|
||||
.sidebar {
|
||||
width: 250px;
|
||||
background-color: #2e2e2e;
|
||||
padding: 20px;
|
||||
box-shadow: 2px 0 5px rgba(0, 0, 0, 0.3);
|
||||
transition: width 0.3s ease;
|
||||
overflow-y: auto;
|
||||
position: fixed;
|
||||
top: 0;
|
||||
left: 0;
|
||||
bottom: 0;
|
||||
z-index: 1;
|
||||
}
|
||||
.sidebar.collapsed {
|
||||
width: 60px;
|
||||
}
|
||||
.sidebar.collapsed h2,
|
||||
.sidebar.collapsed ul li a span {
|
||||
display: none;
|
||||
}
|
||||
.sidebar h2 {
|
||||
color: #3399FF;
|
||||
text-align: center;
|
||||
margin-bottom: 20px;
|
||||
font-size: 24px;
|
||||
transition: opacity 0.3s ease;
|
||||
}
|
||||
.sidebar ul {
|
||||
list-style: none;
|
||||
padding: 0;
|
||||
}
|
||||
.sidebar ul li {
|
||||
margin: 15px 0;
|
||||
}
|
||||
.sidebar ul li a {
|
||||
color: #ffffff;
|
||||
text-decoration: none;
|
||||
font-size: 16px;
|
||||
transition: color 0.3s ease;
|
||||
display: flex;
|
||||
align-items: center;
|
||||
}
|
||||
.sidebar ul li a:hover {
|
||||
color: #3399FF;
|
||||
}
|
||||
.sidebar ul li a i {
|
||||
margin-right: 10px;
|
||||
font-size: 20px;
|
||||
}
|
||||
.sidebar ul li a span {
|
||||
transition: opacity 0.3s ease;
|
||||
}
|
||||
.toggle-btn {
|
||||
position: fixed;
|
||||
left: 10px;
|
||||
top: 10px;
|
||||
background-color: #3399FF;
|
||||
border: none;
|
||||
color: #fff;
|
||||
padding: 10px;
|
||||
border-radius: 5px;
|
||||
cursor: pointer;
|
||||
z-index: 1000;
|
||||
}
|
||||
.container {
|
||||
flex: 1;
|
||||
padding: 20px;
|
||||
margin-left: 250px;
|
||||
transition: margin-left 0.3s ease;
|
||||
overflow-y: auto;
|
||||
height: 100vh;
|
||||
position: relative;
|
||||
z-index: 0;
|
||||
}
|
||||
.container.collapsed {
|
||||
margin-left: 60px;
|
||||
}
|
||||
h1 {
|
||||
color: #3399FF;
|
||||
text-align: center;
|
||||
margin-bottom: 20px;
|
||||
}
|
||||
.grid {
|
||||
display: grid;
|
||||
grid-template-columns: repeat(2, 1fr);
|
||||
gap: 20px;
|
||||
margin-top: 20px;
|
||||
}
|
||||
.card {
|
||||
background-color: #2e2e2e;
|
||||
padding: 20px;
|
||||
border-radius: 8px;
|
||||
box-shadow: 0 0 5px rgba(0, 0, 0, 0.2);
|
||||
}
|
||||
#map {
|
||||
height: 400px;
|
||||
border-radius: 8px;
|
||||
grid-column: span 2;
|
||||
}
|
||||
.screenshots {
|
||||
display: flex;
|
||||
overflow-x: auto;
|
||||
gap: 10px;
|
||||
padding: 10px;
|
||||
}
|
||||
.screenshots img {
|
||||
max-height: 200px;
|
||||
border-radius: 5px;
|
||||
border: 2px solid #3399FF;
|
||||
}
|
||||
.logs {
|
||||
background-color: #2e2e2e;
|
||||
padding: 15px;
|
||||
border-radius: 8px;
|
||||
height: 200px;
|
||||
overflow-y: auto;
|
||||
font-family: 'Courier New', monospace;
|
||||
font-size: 14px;
|
||||
color: #3399FF;
|
||||
}
|
||||
.logs p {
|
||||
margin: 5px 0;
|
||||
}
|
||||
|
||||
.leaflet-marker-icon {
|
||||
background-color: #3399FF;
|
||||
border: 2px solid #ffffff;
|
||||
border-radius: 50%;
|
||||
width: 20px !important;
|
||||
height: 20px !important;
|
||||
box-shadow: 0 0 10px rgba(51, 153, 255, 0.5);
|
||||
}
|
||||
.leaflet-popup-content {
|
||||
color: #1e1e1e;
|
||||
font-size: 14px;
|
||||
}
|
||||
.leaflet-popup-content-wrapper {
|
||||
border-radius: 8px;
|
||||
box-shadow: 0 0 10px rgba(0, 0, 0, 0.3);
|
||||
}
|
||||
</style>
|
||||
<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.0.0-beta3/css/all.min.css">
|
||||
</head>
|
||||
<body>
|
||||
<!-- Боковое меню -->
|
||||
<div class="sidebar" id="sidebar">
|
||||
<h2>Меню</h2>
|
||||
<ul>
|
||||
<li><a href="#"><i class="fas fa-home"></i><span>Главная</span></a></li>
|
||||
<li><a href="#"><i class="fas fa-cog"></i><span>Настройки</span></a></li>
|
||||
<li><a href="#"><i class="fas fa-chart-line"></i><span>Отчеты</span></a></li>
|
||||
<li><a href="#"><i class="fas fa-code"></i><span>Парсеры</span></a></li>
|
||||
<li><a href="logs.html"><i class="fas fa-file-alt"></i><span>Логи</span></a></li>
|
||||
</ul>
|
||||
</div>
|
||||
|
||||
<!-- Кнопка для сворачивания/разворачивания меню -->
|
||||
<button class="toggle-btn" id="toggle-btn">
|
||||
<i class="fas fa-bars"></i>
|
||||
</button>
|
||||
|
||||
<!-- Основной контент -->
|
||||
<div class="container" id="main-content">
|
||||
<h1>Система мониторинга утечек данных</h1>
|
||||
|
||||
<!-- Карта -->
|
||||
<div class="card">
|
||||
<h2>Карта утечек</h2>
|
||||
<div id="map"></div>
|
||||
</div>
|
||||
|
||||
<!-- Графики, скриншоты и логи -->
|
||||
<div class="grid">
|
||||
<div class="card">
|
||||
<h2>Утечки за месяц</h2>
|
||||
<canvas id="monthlyLeaksChart"></canvas>
|
||||
</div>
|
||||
<div class="card">
|
||||
<h2>Состояние парсеров</h2>
|
||||
<canvas id="parsersStatusChart"></canvas>
|
||||
</div>
|
||||
<div class="card">
|
||||
<h2>Источники утечек</h2>
|
||||
<canvas id="sourcesChart"></canvas>
|
||||
</div>
|
||||
<div class="card">
|
||||
<h2>Скриншоты с форумов</h2>
|
||||
<div class="screenshots">
|
||||
<img src="https://via.placeholder.com/300x200.png?text=Скриншот+1" alt="Скриншот 1">
|
||||
<img src="https://via.placeholder.com/300x200.png?text=Скриншот+2" alt="Скриншот 2">
|
||||
<img src="https://via.placeholder.com/300x200.png?text=Скриншот+3" alt="Скриншот 3">
|
||||
<img src="https://via.placeholder.com/300x200.png?text=Скриншот+4" alt="Скриншот 4">
|
||||
<img src="https://via.placeholder.com/300x200.png?text=Скриншот+5" alt="Скриншот 5">
|
||||
</div>
|
||||
</div>
|
||||
<div class="card" style="grid-column: span 2;">
|
||||
<h2>Логи системы</h2>
|
||||
<div class="logs">
|
||||
<p>[2023-10-01 12:34] Парсер форума запущен.</p>
|
||||
<p>[2023-10-01 12:35] Найдена новая утечка на форуме X.</p>
|
||||
<p>[2023-10-01 12:36] Ошибка парсера Telegram: timeout.</p>
|
||||
<p>[2023-10-01 12:37] Утечка данных в Москве зафиксирована.</p>
|
||||
<p>[2023-10-01 12:38] Парсер даркнета завершил работу.</p>
|
||||
<p>[2023-10-01 12:39] Новый скриншот добавлен в базу.</p>
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<script src="https://cdn.jsdelivr.net/npm/chart.js"></script>
|
||||
<script src="https://unpkg.com/leaflet@1.7.1/dist/leaflet.js"></script>
|
||||
<script>
|
||||
// График утечек за месяц
|
||||
const monthlyLeaksCtx = document.getElementById('monthlyLeaksChart').getContext('2d');
|
||||
new Chart(monthlyLeaksCtx, {
|
||||
type: 'line',
|
||||
data: {
|
||||
labels: ['1', '2', '3', '4', '5', '6', '7', '8', '9', '10', '11', '12', '13', '14', '15'],
|
||||
datasets: [{
|
||||
label: 'Утечки',
|
||||
data: [12, 19, 3, 5, 2, 3, 15, 20, 10, 8, 12, 14, 18, 20, 22],
|
||||
borderColor: '#3399FF',
|
||||
tension: 0.1,
|
||||
fill: true,
|
||||
backgroundColor: 'rgba(51, 153, 255, 0.1)',
|
||||
}]
|
||||
},
|
||||
options: {
|
||||
responsive: true,
|
||||
plugins: {
|
||||
legend: {
|
||||
labels: {
|
||||
color: '#fff',
|
||||
}
|
||||
}
|
||||
},
|
||||
scales: {
|
||||
y: {
|
||||
beginAtZero: true,
|
||||
grid: {
|
||||
color: '#444',
|
||||
},
|
||||
ticks: {
|
||||
color: '#fff',
|
||||
}
|
||||
},
|
||||
x: {
|
||||
grid: {
|
||||
color: '#444',
|
||||
},
|
||||
ticks: {
|
||||
color: '#fff',
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
});
|
||||
|
||||
// График состояния парсеров
|
||||
const parsersStatusCtx = document.getElementById('parsersStatusChart').getContext('2d');
|
||||
new Chart(parsersStatusCtx, {
|
||||
type: 'doughnut',
|
||||
data: {
|
||||
labels: ['Активны', 'Ошибки', 'Неактивны'],
|
||||
datasets: [{
|
||||
label: 'Состояние',
|
||||
data: [8, 1, 1],
|
||||
backgroundColor: ['#3399FF', '#ff4444', '#666666'],
|
||||
}]
|
||||
},
|
||||
options: {
|
||||
responsive: true,
|
||||
plugins: {
|
||||
legend: {
|
||||
labels: {
|
||||
color: '#fff',
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
});
|
||||
|
||||
// График источников утечек
|
||||
const sourcesCtx = document.getElementById('sourcesChart').getContext('2d');
|
||||
new Chart(sourcesCtx, {
|
||||
type: 'bar',
|
||||
data: {
|
||||
labels: ['Форумы', 'Даркнет', 'Telegram'],
|
||||
datasets: [{
|
||||
label: 'Количество утечек',
|
||||
data: [45, 30, 25],
|
||||
backgroundColor: ['#3399FF', '#00cc99', '#0099cc'],
|
||||
}]
|
||||
},
|
||||
options: {
|
||||
responsive: true,
|
||||
plugins: {
|
||||
legend: {
|
||||
labels: {
|
||||
color: '#fff',
|
||||
}
|
||||
}
|
||||
},
|
||||
scales: {
|
||||
y: {
|
||||
beginAtZero: true,
|
||||
grid: {
|
||||
color: '#444',
|
||||
},
|
||||
ticks: {
|
||||
color: '#fff',
|
||||
}
|
||||
},
|
||||
x: {
|
||||
grid: {
|
||||
color: '#444',
|
||||
},
|
||||
ticks: {
|
||||
color: '#fff',
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
});
|
||||
|
||||
const map = L.map('map').setView([55.7558, 37.6176], 5);
|
||||
L.tileLayer('https://{s}.basemaps.cartocdn.com/dark_all/{z}/{x}/{y}{r}.png', {
|
||||
attribution: '© OpenStreetMap contributors, © CARTO'
|
||||
}).addTo(map);
|
||||
|
||||
const marker1 = L.marker([55.7558, 37.6176], {
|
||||
icon: L.divIcon({ className: 'leaflet-marker-icon' })
|
||||
}).addTo(map).bindPopup('Утечка данных в Москве');
|
||||
|
||||
const marker2 = L.marker([59.9343, 30.3351], {
|
||||
icon: L.divIcon({ className: 'leaflet-marker-icon' })
|
||||
}).addTo(map).bindPopup('Утечка данных в Санкт-Петербурге');
|
||||
|
||||
const sidebar = document.getElementById('sidebar');
|
||||
const mainContent = document.getElementById('main-content');
|
||||
const toggleBtn = document.getElementById('toggle-btn');
|
||||
|
||||
toggleBtn.addEventListener('click', () => {
|
||||
sidebar.classList.toggle('collapsed');
|
||||
mainContent.classList.toggle('collapsed');
|
||||
});
|
||||
</script>
|
||||
</body>
|
||||
</html>
|
246
web/templates/logs.html
Normal file
246
web/templates/logs.html
Normal file
@ -0,0 +1,246 @@
|
||||
<!DOCTYPE html>
|
||||
<html lang="ru">
|
||||
<head>
|
||||
<meta charset="UTF-8">
|
||||
<meta name="viewport" content="width=device-width, initial-scale=1.0">
|
||||
<title>Логи системы</title>
|
||||
<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.0.0-beta3/css/all.min.css">
|
||||
<style>
|
||||
body {
|
||||
margin: 0;
|
||||
padding: 0;
|
||||
font-family: 'Arial', sans-serif;
|
||||
color: #ffffff;
|
||||
overflow: hidden;
|
||||
display: flex;
|
||||
transition: margin-left 0.3s ease;
|
||||
}
|
||||
|
||||
/* Боковое меню */
|
||||
.sidebar {
|
||||
width: 250px;
|
||||
background-color: #2e2e2e;
|
||||
padding: 20px;
|
||||
box-shadow: 2px 0 5px rgba(0, 0, 0, 0.3);
|
||||
transition: width 0.3s ease;
|
||||
overflow-y: auto;
|
||||
position: fixed;
|
||||
top: 0;
|
||||
left: 0;
|
||||
bottom: 0;
|
||||
z-index: 2;
|
||||
}
|
||||
|
||||
.sidebar.collapsed {
|
||||
width: 60px;
|
||||
}
|
||||
|
||||
.sidebar.collapsed h2,
|
||||
.sidebar.collapsed ul li a span {
|
||||
display: none;
|
||||
}
|
||||
|
||||
.sidebar h2 {
|
||||
color: #3399FF;
|
||||
text-align: center;
|
||||
margin-bottom: 20px;
|
||||
font-size: 24px;
|
||||
transition: opacity 0.3s ease;
|
||||
}
|
||||
|
||||
.sidebar ul {
|
||||
list-style: none;
|
||||
padding: 0;
|
||||
}
|
||||
|
||||
.sidebar ul li {
|
||||
margin: 15px 0;
|
||||
}
|
||||
|
||||
.sidebar ul li a {
|
||||
color: #ffffff;
|
||||
text-decoration: none;
|
||||
font-size: 16px;
|
||||
transition: color 0.3s ease;
|
||||
display: flex;
|
||||
align-items: center;
|
||||
}
|
||||
|
||||
.sidebar ul li a:hover {
|
||||
color: #3399FF;
|
||||
}
|
||||
|
||||
.sidebar ul li a i {
|
||||
margin-right: 10px;
|
||||
font-size: 20px;
|
||||
}
|
||||
|
||||
.sidebar ul li a span {
|
||||
transition: opacity 0.3s ease;
|
||||
}
|
||||
|
||||
/* Кнопка для сворачивания/разворачивания меню */
|
||||
.toggle-btn {
|
||||
position: fixed;
|
||||
left: 10px;
|
||||
top: 10px;
|
||||
background-color: #3399FF;
|
||||
border: none;
|
||||
color: #fff;
|
||||
padding: 10px;
|
||||
border-radius: 5px;
|
||||
cursor: pointer;
|
||||
z-index: 1000;
|
||||
}
|
||||
|
||||
/* Основной контент */
|
||||
.container {
|
||||
flex: 1;
|
||||
padding: 20px;
|
||||
margin-left: 250px;
|
||||
transition: margin-left 0.3s ease;
|
||||
position: relative;
|
||||
z-index: 1;
|
||||
}
|
||||
|
||||
.container.collapsed {
|
||||
margin-left: 60px;
|
||||
}
|
||||
|
||||
/* Видео на фоне */
|
||||
.background-video {
|
||||
position: fixed;
|
||||
top: 0;
|
||||
left: 0;
|
||||
width: 100%;
|
||||
height: 100%;
|
||||
object-fit: cover;
|
||||
z-index: -1;
|
||||
opacity: 0.8; /* Полупрозрачность видео */
|
||||
}
|
||||
|
||||
/* Затемнение поверх видео */
|
||||
.overlay {
|
||||
position: fixed;
|
||||
top: 0;
|
||||
left: 0;
|
||||
width: 100%;
|
||||
height: 100%;
|
||||
background: rgba(0, 0, 0, 0.7); /* Черный полупрозрачный слой */
|
||||
z-index: -1;
|
||||
}
|
||||
|
||||
/* Контейнер для логов */
|
||||
.logs-container {
|
||||
position: absolute;
|
||||
top: 50%;
|
||||
left: 20px;
|
||||
transform: translateY(-50%);
|
||||
width: 40%;
|
||||
max-width: 600px;
|
||||
background-color: rgba(46, 46, 46, 0.9); /* Полупрозрачный фон */
|
||||
padding: 20px;
|
||||
border-radius: 10px;
|
||||
box-shadow: 0 0 20px rgba(51, 153, 255, 0.5);
|
||||
z-index: 1;
|
||||
}
|
||||
|
||||
.logs-container h2 {
|
||||
color: #3399FF;
|
||||
margin-bottom: 20px;
|
||||
font-size: 24px;
|
||||
}
|
||||
|
||||
/* Стили для логов */
|
||||
.logs {
|
||||
height: 60vh;
|
||||
overflow-y: auto;
|
||||
font-family: 'Courier New', monospace;
|
||||
font-size: 14px;
|
||||
color: #3399FF;
|
||||
padding-right: 10px;
|
||||
}
|
||||
|
||||
.logs p {
|
||||
margin: 10px 0;
|
||||
padding: 5px;
|
||||
background-color: rgba(0, 0, 0, 0.3);
|
||||
border-radius: 5px;
|
||||
}
|
||||
|
||||
/* Стили для скроллбара */
|
||||
.logs::-webkit-scrollbar {
|
||||
width: 8px;
|
||||
}
|
||||
|
||||
.logs::-webkit-scrollbar-track {
|
||||
background: rgba(0, 0, 0, 0.2);
|
||||
border-radius: 5px;
|
||||
}
|
||||
|
||||
.logs::-webkit-scrollbar-thumb {
|
||||
background: #00ffcc;
|
||||
border-radius: 5px;
|
||||
}
|
||||
|
||||
.logs::-webkit-scrollbar-thumb:hover {
|
||||
background: #00cc99;
|
||||
}
|
||||
</style>
|
||||
</head>
|
||||
<body>
|
||||
<!-- Боковое меню -->
|
||||
<div class="sidebar" id="sidebar">
|
||||
<h2>Меню</h2>
|
||||
<ul>
|
||||
<li><a href="index.html"><i class="fas fa-home"></i><span>Главная</span></a></li>
|
||||
<li><a href="#"><i class="fas fa-cog"></i><span>Настройки</span></a></li>
|
||||
<li><a href="#"><i class="fas fa-chart-line"></i><span>Отчеты</span></a></li>
|
||||
<li><a href="#"><i class="fas fa-code"></i><span>Парсеры</span></a></li>
|
||||
<li><a href="logs.html"><i class="fas fa-file-alt"></i><span>Логи</span></a></li>
|
||||
</ul>
|
||||
</div>
|
||||
|
||||
<!-- Кнопка для сворачивания/разворачивания меню -->
|
||||
<button class="toggle-btn" id="toggle-btn">
|
||||
<i class="fas fa-bars"></i>
|
||||
</button>
|
||||
|
||||
<!-- Основной контент -->
|
||||
<div class="container" id="main-content">
|
||||
<!-- Видео на фоне -->
|
||||
<video class="background-video" autoplay loop muted>
|
||||
<source src="{{ url_for('static', filename='alb_glob0411_1080p_24fps.mp4') }}" type="video/mp4">
|
||||
Ваш браузер не поддерживает видео.
|
||||
</video>
|
||||
<!-- Затемнение поверх видео -->
|
||||
<div class="overlay"></div>
|
||||
|
||||
<!-- Контейнер для логов -->
|
||||
<div class="logs-container">
|
||||
<h2>Логи системы</h2>
|
||||
<div class="logs">
|
||||
<p>[2023-10-01 12:34] Парсер форума запущен.</p>
|
||||
<p>[2023-10-01 12:35] Найдена новая утечка на форуме X.</p>
|
||||
<p>[2023-10-01 12:36] Ошибка парсера Telegram: timeout.</p>
|
||||
<p>[2023-10-01 12:37] Утечка данных в Москве зафиксирована.</p>
|
||||
<p>[2023-10-01 12:38] Парсер даркнета завершил работу.</p>
|
||||
<p>[2023-10-01 12:39] Новый скриншот добавлен в базу.</p>
|
||||
<!-- Добавьте больше логов по необходимости -->
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<script>
|
||||
// Сворачивание/разворачивание бокового меню
|
||||
const sidebar = document.getElementById('sidebar');
|
||||
const mainContent = document.getElementById('main-content');
|
||||
const toggleBtn = document.getElementById('toggle-btn');
|
||||
|
||||
toggleBtn.addEventListener('click', () => {
|
||||
sidebar.classList.toggle('collapsed');
|
||||
mainContent.classList.toggle('collapsed');
|
||||
});
|
||||
</script>
|
||||
</body>
|
||||
</html>
|
Loading…
Reference in New Issue
Block a user