transcribe voice message command

This commit is contained in:
derpystuff 2023-04-15 19:17:40 +02:00
parent 26a305ea8b
commit f408733d83
3 changed files with 61 additions and 0 deletions

View file

@ -0,0 +1,54 @@
const { createEmbed } = require('../../../labscore/utils/embed')
const { editOrReply } = require('../../../labscore/utils/message')
const { searchAudio, googleSpeechRecognition } = require('../../../labscore/api');
const { getRecentVideo } = require('../../../labscore/utils/attachment');
const { renderMusicButtons } = require('../../../labscore/utils/buttons');
const superagent = require('superagent');
const { STATICS } = require('../../../labscore/utils/statics');
const { codeblock } = require('../../../labscore/utils/markdown');
const urlr = /(https?:\/\/(?:www\.|(?!www))[a-zA-Z0-9][a-zA-Z0-9-]+[a-zA-Z0-9]\.[^\s]{2,}|www\.[a-zA-Z0-9][a-zA-Z0-9-]+[a-zA-Z0-9]\.[^\s]{2,}|https?:\/\/(?:www\.|(?!www))[a-zA-Z0-9]+\.[^\s]{2,}|www\.[a-zA-Z0-9]+\.[^\s]{2,})/g
module.exports = {
name: 'transcribe',
aliases: ['tcr'],
metadata: {
description: '__Replying__ to a voice message when using this command will transcribe the contents of the voice message.',
description_short: 'Discord voice message transcription',
examples: ['tcr'],
category: 'search',
usage: 'transcribe'
},
run: async (context) => {
context.triggerTyping();
if (!context.message.messageReference) return editOrReply(context, { embeds: [createEmbed("warning", context, "You need to reply to a voice message.")] })
try {
let msg;
try {
msg = await context.message.channel.fetchMessage(context.message.messageReference.messageId)
} catch (e) {
return editOrReply(context, { embeds: [createEmbed("error", context, "Unable to fetch message.")] })
}
if(!msg.attachments.first()) return editOrReply(context, { embeds: [createEmbed("warning", context, "No voice message found.")] })
if(!msg.attachments.first().url.endsWith('voice-message.ogg')) return editOrReply(context, { embeds: [createEmbed("warning", context, "No voice message found.")] })
const recog = await googleSpeechRecognition(context, msg.attachments.first().url)
return editOrReply(context, createEmbed("default", context, {
description: codeblock("ansi", [ recog.response.body.transcription ]),
footer: {
iconUrl: STATICS.google,
text: `Google Cloud • Confidence: ${(recog.response.body.confidence* 100).toFixed(1)}% • ${context.application.name}`
}
}))
} catch (e) {
console.log(e)
if(e.response?.body?.status && e.response.body.status == 2) return editOrReply(context, {embeds:[createEmbed("warning", context, e.response.body.message)]})
return editOrReply(context, { embeds: [createEmbed("error", context, `Unable to transcribe audio.`)] })
}
},
};

View file

@ -8,6 +8,7 @@ const Api = Object.freeze({
HOST: Hosts.prod, HOST: Hosts.prod,
GOOGLE_PERSPECTIVE: '/google/perspective/analyze', GOOGLE_PERSPECTIVE: '/google/perspective/analyze',
GOOGLE_SPEECH_RECOGNIZE: '/google/speech/recognize',
GOOGLE_TRANSLATE: '/google/translate/text', GOOGLE_TRANSLATE: '/google/translate/text',
GOOGLE_VISION_COLORS: '/google/vision/colors', GOOGLE_VISION_COLORS: '/google/vision/colors',
GOOGLE_VISION_FACES: '/google/vision/faces', GOOGLE_VISION_FACES: '/google/vision/faces',

View file

@ -48,6 +48,12 @@ module.exports.googlePerspective = async function(context, text){
}) })
} }
module.exports.googleSpeechRecognition = async function(context, url){
return await request(Api.GOOGLE_SPEECH_RECOGNIZE, "GET", {}, {
url
})
}
module.exports.googleTranslate = async function(context, text, to, from){ module.exports.googleTranslate = async function(context, text, to, from){
return await request(Api.GOOGLE_TRANSLATE, "GET", {}, { return await request(Api.GOOGLE_TRANSLATE, "GET", {}, {
text: text, text: text,