transcribe voice message command

2025-06-08 06:03:04 -04:00 · 2023-04-15 19:17:40 +02:00 · 2023-04-15 19:17:40 +02:00 · f408733d83
commit f408733d83
parent 26a305ea8b
3 changed files with 61 additions and 0 deletions
--- a/commands/message/google/transcribe.js
+++ b/commands/message/google/transcribe.js
@ -0,0 +1,54 @@
 const { createEmbed } = require('../../../labscore/utils/embed')
 const { editOrReply } = require('../../../labscore/utils/message')
 const { searchAudio, googleSpeechRecognition } = require('../../../labscore/api');
 const { getRecentVideo } = require('../../../labscore/utils/attachment');
 const { renderMusicButtons } = require('../../../labscore/utils/buttons');
 const superagent = require('superagent');
 const { STATICS } = require('../../../labscore/utils/statics');
 const { codeblock } = require('../../../labscore/utils/markdown');
 const urlr = /(https?:\/\/(?:www\.|(?!www))[a-zA-Z0-9][a-zA-Z0-9-]+[a-zA-Z0-9]\.[^\s]{2,}|www\.[a-zA-Z0-9][a-zA-Z0-9-]+[a-zA-Z0-9]\.[^\s]{2,}|https?:\/\/(?:www\.|(?!www))[a-zA-Z0-9]+\.[^\s]{2,}|www\.[a-zA-Z0-9]+\.[^\s]{2,})/g
 module.exports = {
  name: 'transcribe',
  aliases: ['tcr'],
  metadata: {
    description: '__Replying__ to a voice message when using this command will transcribe the contents of the voice message.',
    description_short: 'Discord voice message transcription',
    examples: ['tcr'],
    category: 'search',
    usage: 'transcribe'
  },
  run: async (context) => {
    context.triggerTyping();
    if (!context.message.messageReference) return editOrReply(context, { embeds: [createEmbed("warning", context, "You need to reply to a voice message.")] })
    try {
      let msg;
      try {
        msg = await context.message.channel.fetchMessage(context.message.messageReference.messageId)
      } catch (e) {
        return editOrReply(context, { embeds: [createEmbed("error", context, "Unable to fetch message.")] })
      }
      if(!msg.attachments.first()) return editOrReply(context, { embeds: [createEmbed("warning", context, "No voice message found.")] })
      if(!msg.attachments.first().url.endsWith('voice-message.ogg')) return editOrReply(context, { embeds: [createEmbed("warning", context, "No voice message found.")] })
      const recog = await googleSpeechRecognition(context, msg.attachments.first().url)
      return editOrReply(context, createEmbed("default", context, {
        description: codeblock("ansi", [ recog.response.body.transcription ]),
        footer: {
          iconUrl: STATICS.google,
          text: `Google Cloud • Confidence: ${(recog.response.body.confidence* 100).toFixed(1)}% • ${context.application.name}`
        }
      }))
    } catch (e) {
      console.log(e)
      if(e.response?.body?.status && e.response.body.status == 2) return editOrReply(context, {embeds:[createEmbed("warning", context, e.response.body.message)]})
      return editOrReply(context, { embeds: [createEmbed("error", context, `Unable to transcribe audio.`)] })
    }
  },
 };
--- a/labscore/api/endpoints.js
+++ b/labscore/api/endpoints.js
@ -8,6 +8,7 @@ const Api = Object.freeze({
  HOST: Hosts.prod,
  GOOGLE_PERSPECTIVE: '/google/perspective/analyze',
  GOOGLE_SPEECH_RECOGNIZE: '/google/speech/recognize',
  GOOGLE_TRANSLATE: '/google/translate/text',
  GOOGLE_VISION_COLORS: '/google/vision/colors',
  GOOGLE_VISION_FACES: '/google/vision/faces',
--- a/labscore/api/index.js
+++ b/labscore/api/index.js
@ -48,6 +48,12 @@ module.exports.googlePerspective = async function(context, text){
  })
 }
 module.exports.googleSpeechRecognition = async function(context, url){
  return await request(Api.GOOGLE_SPEECH_RECOGNIZE, "GET", {}, {
    url
  })
 }
 module.exports.googleTranslate = async function(context, text, to, from){
  return await request(Api.GOOGLE_TRANSLATE, "GET", {}, {
    text: text,