Telegram bot: Gemini retells all voice messages that you receive in DM

MALWARE · Aug 24, 2024

Gemini пересказывает все голосовые сообщения, которые вам приходят
Возможность подключить этого бота к аккаунту есть только у Premium-пользователей! Но использовать его, пересылая ГС боту, можно и без Premium.

Это скриншоты уже из моего ЛС с людьми:
# --- User configuration -----------------------------------------------------
# Gemini API key, passed to gemini.configure() below. The URL is only a
# placeholder and must be replaced with a real key.
gemini_token = 'https://lolz.live/threads/6818835/'
# Telegram bot token, passed to Bot(token=...) in main(). The URL is only a
# placeholder and must be replaced with a real token.
bot_token = 'https://t.me/botfather'
# IDs the handlers compare against: the business-connection owner, the sender
# of a private text message, or the chat a voice/video note arrived in.
# The first entry also receives error reports from the handlers.
allowed_users = [657195904, -1001537487920]

# Nothing below this line needs to be edited

import asyncio
from aiogram import Router, Bot, Dispatcher, F, types
import logging
from io import BytesIO
from pydub import AudioSegment
import google.generativeai as gemini
from google.api_core.exceptions import InternalServerError
from google.api_core.exceptions import ResourceExhausted
from ssl import SSLError
from os import remove
from asyncio import sleep

# Bot instance; assigned in main() and read by the handlers through this global.
bot = None
# Router on which every handler in this module is registered.
router = Router(name=__name__)
# Each handler body runs under this lock, so updates are processed one at a time.
lock = asyncio.Lock()
logger = logging.getLogger(__name__)
logging.basicConfig(level=logging.INFO)

# Hand the API key from the configuration section to the Gemini SDK.
gemini.configure(api_key=gemini_token)

def _summarize_recording(source, format: str, wav_path: str) -> str:
    """Convert a recording to WAV, upload it to Gemini and return the retelling.

    This helper is fully blocking (pydub conversion, file upload, model call)
    and is meant to be run in a worker thread.

    Args:
        source: File-like object holding the downloaded Telegram media.
        format: Container format of ``source``; ``"ogg"`` selects the
            voice-message wording of the prompt, anything else the
            video-message wording.
        wav_path: Path of the temporary WAV file to create; it is removed
            before the function returns, whether or not it succeeded.

    Returns:
        The text of the model's answer.

    Raises:
        ValueError: Raised by ``response.text`` when the answer has no text
            (callers treat this as a safety block).
        Exception: Any pydub, I/O or Gemini SDK error is propagated unchanged.
    """
    media_kind = "голосовом сообщении" if format == "ogg" else "видеосообщении"
    prompt = (
        'Перескажи голосовое сообщение на русском языке. '
        'Сообщи об эмоциях автора. '
        f'В случае, если ты услышал речь, начни свой ответ со слов "В {media_kind} говорится". '
        f'В случае, если ты не услышал в записи речь, сообщи о том, что в {media_kind} нет речи.'
    )
    safety_settings = [
        {"category": "HARM_CATEGORY_HARASSMENT", "threshold": "BLOCK_NONE"},
        {"category": "HARM_CATEGORY_HATE_SPEECH", "threshold": "BLOCK_NONE"},
        {"category": "HARM_CATEGORY_SEXUALLY_EXPLICIT", "threshold": "BLOCK_NONE"},
        {"category": "HARM_CATEGORY_DANGEROUS_CONTENT", "threshold": "BLOCK_NONE"},
    ]
    try:
        wav_io = BytesIO()
        AudioSegment.from_file(source, format=format).export(wav_io, format="wav")
        with open(wav_path, 'wb') as f:
            f.write(wav_io.getvalue())
        # The upload is inside the try block so that a failed upload still
        # cleans up the temporary file.
        # NOTE(review): the uploaded Gemini file is never deleted here.
        audio_file = gemini.upload_file(wav_path, mime_type='audio/wav')
        response = gemini.GenerativeModel(model_name="gemini-1.5-flash").generate_content(
            [prompt, audio_file],
            safety_settings=safety_settings,
        )
        return response.text
    finally:
        try:
            remove(wav_path)
        except FileNotFoundError:
            # Conversion failed before the file was created; nothing to clean up.
            pass


async def telegram_voice_gemini_tts(file_id: str, format: str, message_id: int) -> str:
    """Download a Telegram voice/video note and return Gemini's retelling of it.

    Args:
        file_id: Telegram file identifier of the voice message or video note.
        format: ``"ogg"`` for voice messages, ``"mp4"`` for video notes.
        message_id: Used to name the temporary ``vm<message_id>.wav`` file.

    Returns:
        The text produced by the model.

    Raises:
        ValueError: When the model response contains no text.
        Exception: Telegram, pydub and Gemini errors are propagated unchanged.
    """
    telegram_file = await bot.get_file(file_id)
    source = await bot.download_file(telegram_file.file_path)
    # Conversion, upload and generation are blocking calls; run them in a
    # worker thread so the event loop (polling, other handlers) keeps running.
    return await asyncio.to_thread(
        _summarize_recording, source, format, f'vm{message_id}.wav'
    )

@router.business_message(F.voice | F.video_note)
async def handle_message(message: types.Message):
    """Retell a voice message or video note received through a business connection.

    The handler replies with a "recognising" status message and then edits it
    with the Gemini retelling, or with an error text. Transient failures are
    retried a bounded number of times with a real (awaited) delay.

    Args:
        message: The incoming business message containing a voice or video note.
    """
    from html import escape  # local import: keeps this block self-contained

    max_attempts = 5  # upper bound so a persistent error cannot hold the lock forever

    async with lock:
        connection = await bot.get_business_connection(message.business_connection_id)
        if connection.user.id not in allowed_users:
            return
        logger.info(f"Received voice message from {message.from_user.id}")

        # NOTE(review): several <tg-emoji> tags below have no fallback emoji
        # inside them - confirm they were not lost when the code was copied.
        recognition_message = await bot.send_message(
            message.chat.id,
            '<tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini распознаёт голосовое сообщение<tg-emoji emoji-id="5220046725493828505">✍</tg-emoji>' if message.voice else '<tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini распознаёт видеосообщение<tg-emoji emoji-id="5220070652756635426"></tg-emoji>',
            business_connection_id=message.business_connection_id,
            reply_to_message_id=message.message_id,
            parse_mode='HTML',
        )
        await bot.send_chat_action(
            message.chat.id,
            'upload_voice' if message.voice else 'upload_video_note',
            business_connection_id=message.business_connection_id,
        )

        for _ in range(max_attempts):
            try:
                tts_result = await telegram_voice_gemini_tts(
                    message.voice.file_id if message.voice else message.video_note.file_id,
                    'ogg' if message.voice else 'mp4',
                    message.message_id,
                )
                # The text is sent with parse_mode='HTML', so the model output
                # must be escaped or a stray '<' or '&' makes Telegram reject it.
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='<tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini: ' + escape(tts_result, quote=False),
                    business_connection_id=message.business_connection_id,
                    parse_mode='HTML',
                )
            except ValueError:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='<tg-emoji emoji-id="5807626765874499116"></tg-emoji><tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini посчитал этот запрос небезопасным.',
                    business_connection_id=message.business_connection_id,
                    parse_mode='HTML',
                )
            except (InternalServerError, SSLError):
                # Transient failure: wait (the coroutine must be awaited) and retry.
                await sleep(3)
            except ResourceExhausted:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='<tg-emoji emoji-id="5456670136121434320"></tg-emoji><tg-emoji emoji-id="5296262629558340179"></tg-emoji>Достигнут лимит запросов к Gemini :(',
                    business_connection_id=message.business_connection_id,
                    parse_mode='HTML',
                )
            except Exception as e:
                # Unknown failure: record the traceback, tell the owner, back off, retry.
                logger.exception(e)
                await bot.send_message(allowed_users[0], str(e))
                await sleep(10)

        logger.error(
            "Giving up on message %s after %d attempts", message.message_id, max_attempts
        )

# @router.message()
# async def echo(message: types.Message):
# print(message.html_text)

@router.message(F.chat.type == 'private', F.text)
async def handle_message(message: types.Message):
    """Answer a private text message from an allowed user with Gemini.

    Args:
        message: The incoming private text message.
    """
    async with lock:
        if message.from_user.id not in allowed_users:
            return
        await bot.send_chat_action(message.chat.id, 'typing')
        model = gemini.GenerativeModel(model_name="gemini-1.5-pro")
        # generate_content is a blocking call; run it in a worker thread so the
        # event loop is not stalled while the model is answering.
        response = await asyncio.to_thread(model.generate_content, message.text)
        try:
            answer = response.text
        except ValueError:
            # The sibling handlers treat ValueError as a blocked answer;
            # report it the same way instead of failing silently.
            answer = 'Gemini посчитал этот запрос небезопасным.'
        await message.reply(answer)

@router.message(F.voice | F.video_note)
async def handle_message(message: types.Message):
    """Retell a voice message or video note sent in an allowed chat.

    The handler replies with a "recognising" status message and then edits it
    with the Gemini retelling, or with an error text. Transient failures are
    retried a bounded number of times with a real (awaited) delay.

    Args:
        message: The incoming message containing a voice or video note.
    """
    from html import escape  # local import: keeps this block self-contained

    max_attempts = 5  # upper bound so a persistent error cannot hold the lock forever

    async with lock:
        if message.chat.id not in allowed_users:
            return
        logger.info(f"Received voice message from {message.from_user.id}")
        recognition_message = await message.reply(
            'Gemini распознаёт голосовое сообщение...' if message.voice else 'Gemini распознаёт видеосообщение...'
        )
        await bot.send_chat_action(
            message.chat.id,
            'upload_voice' if message.voice else 'upload_video_note',
        )

        for _ in range(max_attempts):
            try:
                tts_result = await telegram_voice_gemini_tts(
                    message.voice.file_id if message.voice else message.video_note.file_id,
                    'ogg' if message.voice else 'mp4',
                    message.message_id,
                )
                # The text is sent with parse_mode='HTML', so the model output
                # must be escaped or a stray '<' or '&' makes Telegram reject it.
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='Gemini: ' + escape(tts_result, quote=False),
                    parse_mode='HTML',
                )
            except ValueError:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='Gemini посчитал этот запрос небезопасным.',
                    parse_mode='HTML',
                )
            except (InternalServerError, SSLError):
                # Transient failure: wait (the coroutine must be awaited) and retry.
                await sleep(3)
            except ResourceExhausted:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='Достигнут лимит запросов к Gemini :(',
                )
            except Exception as e:
                # Unknown failure: record the traceback, tell the owner, back off, retry.
                logger.exception(e)
                await bot.send_message(allowed_users[0], str(e))
                await sleep(10)

        logger.error(
            "Giving up on message %s after %d attempts", message.message_id, max_attempts
        )

async def main():
    """Create the bot, attach the router and poll Telegram for updates.

    The created Bot is stored in the module-level ``bot`` variable because the
    handlers read it from there. Updates that queued up while the bot was
    offline are dropped before polling starts.
    """
    global bot

    bot = Bot(token=bot_token)

    dispatcher = Dispatcher()
    dispatcher.include_router(router)

    await bot.delete_webhook(drop_pending_updates=True)
    await dispatcher.start_polling(bot)

# Script entry point: start an event loop and run main() until polling stops.
asyncio.run(main())

Python
# --- User configuration -----------------------------------------------------
# Gemini API key, passed to gemini.configure() below. The URL is only a
# placeholder and must be replaced with a real key.
gemini_token = 'https://lolz.live/threads/6818835/'

# Telegram bot token, passed to Bot(token=...) in main(). The URL is only a
# placeholder and must be replaced with a real token.
bot_token = 'https://t.me/botfather'

# IDs the handlers compare against: the business-connection owner, the sender
# of a private text message, or the chat a voice/video note arrived in.
# The first entry also receives error reports from the handlers.
allowed_users = [657195904, -1001537487920]



# Nothing below this line needs to be edited



import asyncio

from aiogram import Router, Bot, Dispatcher, F, types

import logging

from io import BytesIO

from pydub import AudioSegment

import google.generativeai as gemini

from google.api_core.exceptions import InternalServerError

from google.api_core.exceptions import ResourceExhausted

from ssl import SSLError

from os import remove

from asyncio import sleep



# Bot instance; assigned in main() and read by the handlers through this global.
bot = None

# Router on which every handler in this module is registered.
router = Router(name=__name__)

# Each handler body runs under this lock, so updates are processed one at a time.
lock = asyncio.Lock()

logger = logging.getLogger(__name__)

logging.basicConfig(level=logging.INFO)



# Hand the API key from the configuration section to the Gemini SDK.
gemini.configure(api_key=gemini_token)



def _summarize_recording(source, format: str, wav_path: str) -> str:
    """Convert a recording to WAV, upload it to Gemini and return the retelling.

    This helper is fully blocking (pydub conversion, file upload, model call)
    and is meant to be run in a worker thread.

    Args:
        source: File-like object holding the downloaded Telegram media.
        format: Container format of ``source``; ``"ogg"`` selects the
            voice-message wording of the prompt, anything else the
            video-message wording.
        wav_path: Path of the temporary WAV file to create; it is removed
            before the function returns, whether or not it succeeded.

    Returns:
        The text of the model's answer.

    Raises:
        ValueError: Raised by ``response.text`` when the answer has no text
            (callers treat this as a safety block).
        Exception: Any pydub, I/O or Gemini SDK error is propagated unchanged.
    """
    media_kind = "голосовом сообщении" if format == "ogg" else "видеосообщении"
    prompt = (
        'Перескажи голосовое сообщение на русском языке. '
        'Сообщи об эмоциях автора. '
        f'В случае, если ты услышал речь, начни свой ответ со слов "В {media_kind} говорится". '
        f'В случае, если ты не услышал в записи речь, сообщи о том, что в {media_kind} нет речи.'
    )
    safety_settings = [
        {"category": "HARM_CATEGORY_HARASSMENT", "threshold": "BLOCK_NONE"},
        {"category": "HARM_CATEGORY_HATE_SPEECH", "threshold": "BLOCK_NONE"},
        {"category": "HARM_CATEGORY_SEXUALLY_EXPLICIT", "threshold": "BLOCK_NONE"},
        {"category": "HARM_CATEGORY_DANGEROUS_CONTENT", "threshold": "BLOCK_NONE"},
    ]
    try:
        wav_io = BytesIO()
        AudioSegment.from_file(source, format=format).export(wav_io, format="wav")
        with open(wav_path, 'wb') as f:
            f.write(wav_io.getvalue())
        # The upload is inside the try block so that a failed upload still
        # cleans up the temporary file.
        # NOTE(review): the uploaded Gemini file is never deleted here.
        audio_file = gemini.upload_file(wav_path, mime_type='audio/wav')
        response = gemini.GenerativeModel(model_name="gemini-1.5-flash").generate_content(
            [prompt, audio_file],
            safety_settings=safety_settings,
        )
        return response.text
    finally:
        try:
            remove(wav_path)
        except FileNotFoundError:
            # Conversion failed before the file was created; nothing to clean up.
            pass


async def telegram_voice_gemini_tts(file_id: str, format: str, message_id: int) -> str:
    """Download a Telegram voice/video note and return Gemini's retelling of it.

    Args:
        file_id: Telegram file identifier of the voice message or video note.
        format: ``"ogg"`` for voice messages, ``"mp4"`` for video notes.
        message_id: Used to name the temporary ``vm<message_id>.wav`` file.

    Returns:
        The text produced by the model.

    Raises:
        ValueError: When the model response contains no text.
        Exception: Telegram, pydub and Gemini errors are propagated unchanged.
    """
    telegram_file = await bot.get_file(file_id)
    source = await bot.download_file(telegram_file.file_path)
    # Conversion, upload and generation are blocking calls; run them in a
    # worker thread so the event loop (polling, other handlers) keeps running.
    return await asyncio.to_thread(
        _summarize_recording, source, format, f'vm{message_id}.wav'
    )



@router.business_message(F.voice | F.video_note)
async def handle_message(message: types.Message):
    """Retell a voice message or video note received through a business connection.

    The handler replies with a "recognising" status message and then edits it
    with the Gemini retelling, or with an error text. Transient failures are
    retried a bounded number of times with a real (awaited) delay.

    Args:
        message: The incoming business message containing a voice or video note.
    """
    from html import escape  # local import: keeps this block self-contained

    max_attempts = 5  # upper bound so a persistent error cannot hold the lock forever

    async with lock:
        connection = await bot.get_business_connection(message.business_connection_id)
        if connection.user.id not in allowed_users:
            return
        logger.info(f"Received voice message from {message.from_user.id}")

        # NOTE(review): several <tg-emoji> tags below have no fallback emoji
        # inside them - confirm they were not lost when the code was copied.
        recognition_message = await bot.send_message(
            message.chat.id,
            '<tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini распознаёт голосовое сообщение<tg-emoji emoji-id="5220046725493828505">✍</tg-emoji>' if message.voice else '<tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini распознаёт видеосообщение<tg-emoji emoji-id="5220070652756635426"></tg-emoji>',
            business_connection_id=message.business_connection_id,
            reply_to_message_id=message.message_id,
            parse_mode='HTML',
        )
        await bot.send_chat_action(
            message.chat.id,
            'upload_voice' if message.voice else 'upload_video_note',
            business_connection_id=message.business_connection_id,
        )

        for _ in range(max_attempts):
            try:
                tts_result = await telegram_voice_gemini_tts(
                    message.voice.file_id if message.voice else message.video_note.file_id,
                    'ogg' if message.voice else 'mp4',
                    message.message_id,
                )
                # The text is sent with parse_mode='HTML', so the model output
                # must be escaped or a stray '<' or '&' makes Telegram reject it.
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='<tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini: ' + escape(tts_result, quote=False),
                    business_connection_id=message.business_connection_id,
                    parse_mode='HTML',
                )
            except ValueError:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='<tg-emoji emoji-id="5807626765874499116"></tg-emoji><tg-emoji emoji-id="5296262629558340179"></tg-emoji>Gemini посчитал этот запрос небезопасным.',
                    business_connection_id=message.business_connection_id,
                    parse_mode='HTML',
                )
            except (InternalServerError, SSLError):
                # Transient failure: wait (the coroutine must be awaited) and retry.
                await sleep(3)
            except ResourceExhausted:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='<tg-emoji emoji-id="5456670136121434320"></tg-emoji><tg-emoji emoji-id="5296262629558340179"></tg-emoji>Достигнут лимит запросов к Gemini :(',
                    business_connection_id=message.business_connection_id,
                    parse_mode='HTML',
                )
            except Exception as e:
                # Unknown failure: record the traceback, tell the owner, back off, retry.
                logger.exception(e)
                await bot.send_message(allowed_users[0], str(e))
                await sleep(10)

        logger.error(
            "Giving up on message %s after %d attempts", message.message_id, max_attempts
        )



# @router.message()

# async def echo(message: types.Message):

# print(message.html_text)



@router.message(F.chat.type == 'private', F.text)
async def handle_message(message: types.Message):
    """Answer a private text message from an allowed user with Gemini.

    Args:
        message: The incoming private text message.
    """
    async with lock:
        if message.from_user.id not in allowed_users:
            return
        await bot.send_chat_action(message.chat.id, 'typing')
        model = gemini.GenerativeModel(model_name="gemini-1.5-pro")
        # generate_content is a blocking call; run it in a worker thread so the
        # event loop is not stalled while the model is answering.
        response = await asyncio.to_thread(model.generate_content, message.text)
        try:
            answer = response.text
        except ValueError:
            # The sibling handlers treat ValueError as a blocked answer;
            # report it the same way instead of failing silently.
            answer = 'Gemini посчитал этот запрос небезопасным.'
        await message.reply(answer)



@router.message(F.voice | F.video_note)
async def handle_message(message: types.Message):
    """Retell a voice message or video note sent in an allowed chat.

    The handler replies with a "recognising" status message and then edits it
    with the Gemini retelling, or with an error text. Transient failures are
    retried a bounded number of times with a real (awaited) delay.

    Args:
        message: The incoming message containing a voice or video note.
    """
    from html import escape  # local import: keeps this block self-contained

    max_attempts = 5  # upper bound so a persistent error cannot hold the lock forever

    async with lock:
        if message.chat.id not in allowed_users:
            return
        logger.info(f"Received voice message from {message.from_user.id}")
        recognition_message = await message.reply(
            'Gemini распознаёт голосовое сообщение...' if message.voice else 'Gemini распознаёт видеосообщение...'
        )
        await bot.send_chat_action(
            message.chat.id,
            'upload_voice' if message.voice else 'upload_video_note',
        )

        for _ in range(max_attempts):
            try:
                tts_result = await telegram_voice_gemini_tts(
                    message.voice.file_id if message.voice else message.video_note.file_id,
                    'ogg' if message.voice else 'mp4',
                    message.message_id,
                )
                # The text is sent with parse_mode='HTML', so the model output
                # must be escaped or a stray '<' or '&' makes Telegram reject it.
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='Gemini: ' + escape(tts_result, quote=False),
                    parse_mode='HTML',
                )
            except ValueError:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='Gemini посчитал этот запрос небезопасным.',
                    parse_mode='HTML',
                )
            except (InternalServerError, SSLError):
                # Transient failure: wait (the coroutine must be awaited) and retry.
                await sleep(3)
            except ResourceExhausted:
                return await bot.edit_message_text(
                    chat_id=recognition_message.chat.id,
                    message_id=recognition_message.message_id,
                    text='Достигнут лимит запросов к Gemini :(',
                )
            except Exception as e:
                # Unknown failure: record the traceback, tell the owner, back off, retry.
                logger.exception(e)
                await bot.send_message(allowed_users[0], str(e))
                await sleep(10)

        logger.error(
            "Giving up on message %s after %d attempts", message.message_id, max_attempts
        )



async def main():
    """Create the bot, attach the router and poll Telegram for updates.

    The created Bot is stored in the module-level ``bot`` variable because the
    handlers read it from there. Updates that queued up while the bot was
    offline are dropped before polling starts.
    """
    global bot

    bot = Bot(token=bot_token)

    dispatcher = Dispatcher()
    dispatcher.include_router(router)

    await bot.delete_webhook(drop_pending_updates=True)
    await dispatcher.start_polling(bot)





# Script entry point: start an event loop and run main() until polling stops.
asyncio.run(main())
Бота можно хостить только на нероссийских серверах: API Gemini нельзя использовать с ру айпи.
Для установки:
1. Заполняем конфиг:
gemini_token — API ключ Gemini. Получать тут: https://aistudio.google.com/app/apikey

1. Включаем *** (или Comss DNS): https://lolz.live/threads/7025472/
2. Заходим на AI Studio
3. Create API Key
4. В окне с полем поиска тыкаем кнопку выше поля. Копируем ключ.

bot_token — токен бота Telegram

allowed_users — список [ID пользователей, которые смогут привязать бота к бизнесу, либо использовать его в ЛС с ботом] и [ID чатов, в котором бот будет автоматически распознавать все ГС]. Для определения ID используйте https://t.me/myidbot.

2. Включаем Business Mode в BotFather

3. Идём в настройки ТГ -> Telegram для бизнеса -> Чат-боты. Вставляем ссылку на своего бота.

4. Всё, ждём голосовых сообщений!

k1erry · Aug 24, 2024

Годная статья, теперь не придётся покупать премку чтобы не слушать гски

Копировать · Aug 24, 2024

мама я попала в телевизора, ну как тестер могу сказать что хорошая задумка, мне понравилось

Loss · Aug 24, 2024

мне слишком лень его ставить, поетому отложу на потом, лайк

RendixMars · Aug 25, 2024

Имба

llimonix · Aug 27, 2024

Задумка прикольная, но нахуя.
Боты которые расшифровывают гс - есть. Чтобы привязать бота к акку нужен премиум. Если у тебя премиум, то у тебя и так уже есть расшифровка от телеграм.

Использовать ИИ, чтобы он выдал комплексный ответ по голосовой, прикольно. Но может потеряться какая-то информация и простой расшифровки гс хватит с головой

Vova_Burry · Aug 27, 2024

Интересно, но бессмысленно. За старания

Кастория · Jul 21, 2025 at 12:39 AM

Hidden content. You need to be registered to see it.
Click to expand...

Crypto Casino - casino in telegram with Cryptobot

Unconfirmed orders - remark for fpc

Hello, help decrypt .db

Help with Python

Software for generating Octobrowser and acting proys

Software for changing passwords firstmail

[TG DRAIN] Telegram drainer

Autostatus in VK and autobio in Telegram with the current Spotify song

Script for cleaning friends VK

The simplest eternal online VKontakte

Playerok Universal - the first free bot for the Playerok trading platform

Bot for feedback from the admin panel | Bypassing spamblock.

Bot assistant for buying advertising | Checking statuses/pins + avatars

DICEBOT for forum | AIOGRAM bot with a beautiful menu

How to send premium emoji through the SUB?

Guys help with the script

How to send TG Prem Emoji through a bot?

Quick country change on multiple VK accounts

Smartvol - clamp and volume indicator

Pyanty - Web automation, module for managing dolphin via Selenium, and Dolphin API

Emunium - module for simulating human behavior in Selenium/Pyppeteer

Gram_tools | Utilities for simplified development of bots on aiogram 3

Cryptoscan - Python Library for Monitoring (Reception) Crypto Payments

Advise the cloud platform so that the most simple bot on python in TG works

Notifications that the user is online in VK

Telegram Parsing Benefit offers on LZT Market

[Actual] User Bot Auto Buying gifts telegrams

Scam BUSINESS BOOK GRABER GHUTAROV through TG BUSINESS

How can you work with PSD?

We delete all the libraries that we pumped (if there is another solution tell me)

Telegram bot: Gemini retells all voice messages that you receive in DM