insert2-cogs/transcription.py

import nextcord
from nextcord.ext import commands
import os
from os import path
import asyncio
from pydub import AudioSegment
import numpy as np
import speech_recognition as sr

def prepaudio(audiofile, wav_path="audio.wav"):
    """Convert an OGG recording to WAV and load it for speech recognition.

    The OGG input is decoded with pydub, exported as a WAV file at
    ``wav_path``, and that WAV file is then read back through
    ``speech_recognition`` so it can be handed to one of the
    ``Recognizer.recognize_*`` methods.

    Args:
        audiofile: The OGG audio to convert, as accepted by
            ``AudioSegment.from_ogg`` (callers in this file pass a path).
        wav_path: Where to write the intermediate WAV file. Defaults to
            ``"audio.wav"`` in the current working directory, which is the
            location existing callers expect and clean up.

    Returns:
        The audio data object produced by ``Recognizer.record``.

    Note:
        The WAV file written to ``wav_path`` is not deleted here; removing
        it is the caller's responsibility.
    """
    # Decode the OGG input and write it back out as WAV, which is the
    # format handed to sr.AudioFile below.
    AudioSegment.from_ogg(audiofile).export(wav_path, format="wav")

    # A throwaway Recognizer is enough here: it is only used to read the
    # file into an audio data object, not to run any recognition.
    with sr.AudioFile(wav_path) as source:
        return sr.Recognizer().record(source)

class transcription(commands.Cog):
    """Cog adding message context-menu commands that transcribe audio.

    Two commands are registered, differing only in the speech recognition
    backend they use (Sphinx or Google). Each one saves the first attachment
    of the target message as ``audio.ogg``, converts it through
    ``prepaudio`` (which writes ``audio.wav``), and replies with an
    ephemeral embed containing the recognised text.
    """

    # Scratch files written in the working directory during a transcription:
    # the downloaded attachment and the WAV file that prepaudio produces.
    _OGG_PATH = "audio.ogg"
    _WAV_PATH = "audio.wav"

    def __init__(self, bot: commands.Bot):
        self.bot = bot
        # Shared recognizer used by both commands.
        self.st = sr.Recognizer()

    @classmethod
    def _remove_scratch_files(cls):
        """Delete the scratch audio files, ignoring ones that do not exist."""
        for scratch in (cls._OGG_PATH, cls._WAV_PATH):
            try:
                os.remove(scratch)
            except FileNotFoundError:
                # The run failed before this file was written; nothing to do.
                pass

    async def _transcribe(self, interaction, message, recognize):
        """Transcribe the first attachment of ``message`` and reply with it.

        Args:
            interaction: The interaction that triggered the command; the
                reply is sent by editing its deferred response.
            message: The message whose first attachment is transcribed.
            recognize: Callable taking the audio data returned by
                ``prepaudio`` and returning the transcription text.
        """
        try:
            await interaction.response.defer(ephemeral=True)

            # Message commands can be invoked on any message, including
            # ones without attachments; answer clearly instead of failing
            # with an IndexError.
            if not message.attachments:
                await interaction.edit_original_message(
                    content="That message has no audio attachment to transcribe."
                )
                return

            await message.attachments[0].save(self._OGG_PATH)
            text = recognize(prepaudio(self._OGG_PATH))

            embed = nextcord.Embed(
                title="Audio Transcription",
                description=text,
                color=0x3584e4,
            )
            embed.set_author(
                name=message.author.display_name,
                url=message.jump_url,
                icon_url=message.author.display_avatar,
            )
            embed.set_footer(text="Accuracy not guaranteed")
            await interaction.edit_original_message(embed=embed)
        except Exception as e:
            # Top-level boundary for the command: report the failure to the
            # invoking user rather than leaving the deferred reply hanging.
            await interaction.edit_original_message(content=f'an error appears to have occoured please report it to the developer: {e}')
        finally:
            # Always clean up, including when download, conversion or
            # recognition raised part-way through.
            self._remove_scratch_files()

    @nextcord.message_command(name="Transcribe Using Sphinx")
    async def transcribesphinx(self, interaction: nextcord.Interaction, message: nextcord.Message):
        """Transcribe the message's first attachment with the Sphinx backend."""
        await self._transcribe(interaction, message, self.st.recognize_sphinx)

    @nextcord.message_command(name="Transcribe Using Google")
    async def transcribegoogle(self, interaction: nextcord.Interaction, message: nextcord.Message):
        """Transcribe the message's first attachment with the Google backend."""
        # WARNING: the Google recognizer is proprietary; consider disabling
        # it. It is kept because Sphinx is currently not very accurate, so
        # this provides an alternative.
        await self._transcribe(interaction, message, self.st.recognize_google)

def setup(bot: commands.Bot):
    """Create a ``transcription`` cog bound to ``bot`` and add it to the bot."""
    cog = transcription(bot)
    bot.add_cog(cog)
rewrite transcription 2024-08-07 18:44:50 +00:00			`import nextcord`
			`from nextcord.ext import commands`
Update 8-05-24 15:11 2024-08-05 19:12:11 +00:00			`import os`
			`from os import path`
			`import asyncio`
			`from pydub import AudioSegment`
			`import numpy as np`
			`import speech_recognition as sr`

			`def prepaudio(audiofile):`
			`st = sr.Recognizer()`
			`oggfile = AudioSegment.from_ogg(audiofile)`
			`oggfile.export("audio.wav", format="wav")`
			`convertemessage = sr.AudioFile("audio.wav")`
			`with convertemessage as sounds:`
			`transcribeaudo = st.record(sounds)`
			`return transcribeaudo`

			`class transcription(commands.Cog):`

			`def __init__(self, bot: commands.Bot):`
			`self.bot = bot`
			`self.st = sr.Recognizer()`


revert 5feb9e0adcc64a4fabce9741c9cb5d100814846e revert Update 2024-08-12 12:53:52 +00:00			`@nextcord.message_command(name="Transcribe Using Sphinx")`
			`async def transcribesphinx(self, interaction: nextcord.Interaction, message: nextcord.Message):`
			`try:`
			`await interaction.response.defer(ephemeral='true')`
			`await message.attachments[0].save("audio.ogg")`
			`embed=nextcord.Embed(title="Audio Transcription",description=self.st.recognize_sphinx(prepaudio("audio.ogg")), color=0x3584e4)`
			`embed.set_author(name=message.author.display_name, url=message.jump_url, icon_url=message.author.display_avatar)`
			`embed.set_footer(text="Accuracy not guaranteed")`
			`await interaction.edit_original_message(embed=embed)`
			`os.remove("audio.ogg")`
			`os.remove("audio.wav")`
			`except Exception as e:`
			`await interaction.edit_original_message(content=f'an error appears to have occoured please report it to the developer: {e}')`
Update 8-05-24 15:11 2024-08-05 19:12:11 +00:00
rewrite transcription 2024-08-07 18:44:50 +00:00			`@nextcord.message_command(name="Transcribe Using Google")`
			`async def transcribegoogle(self, interaction: nextcord.Interaction, message: nextcord.Message):`
Update 8-05-24 15:11 2024-08-05 19:12:11 +00:00			`try:`
rewrite transcription 2024-08-07 18:44:50 +00:00			`await interaction.response.defer(ephemeral='true')`
Update 8-05-24 15:11 2024-08-05 19:12:11 +00:00			`await message.attachments[0].save("audio.ogg")`
			`# WARNING Google is propritary, consider disabling however sphynix is currently not very good so this provides an option`
rewrite transcription 2024-08-07 18:44:50 +00:00			`embed=nextcord.Embed(title="Audio Transcription",description=self.st.recognize_google(prepaudio("audio.ogg")), color=0x3584e4)`
Update 8-05-24 15:11 2024-08-05 19:12:11 +00:00			`embed.set_author(name=message.author.display_name, url=message.jump_url, icon_url=message.author.display_avatar)`
			`embed.set_footer(text="Accuracy not guaranteed")`
rewrite transcription 2024-08-07 18:44:50 +00:00			`await interaction.edit_original_message(embed=embed)`
Update 8-05-24 15:11 2024-08-05 19:12:11 +00:00			`await asyncio.sleep(3)`
			`os.remove("audio.ogg")`
			`os.remove("audio.wav")`
			`except Exception as e:`
rewrite transcription 2024-08-07 18:44:50 +00:00			`await interaction.edit_original_message(content=f'an error appears to have occoured please report it to the developer: {e}')`
Update 8-05-24 15:11 2024-08-05 19:12:11 +00:00
			`def setup(bot: commands.Bot):`
			`bot.add_cog(transcription(bot))`