natural-language-api-google/utils/speechToTextJob.js

// Imports the Google Cloud client library
const speech = require('@google-cloud/speech')
const path = require('path')
const fs = require('fs')
const getAudioDuration = require('./getAudioDuration')
const audioUploadToBucket = require('./audioUploadToBucket')
const { StatusCodes } = require("http-status-codes")


async function speechToTextJob(filename, languageCode = 'pt-Br', bucket = 'speect-to-text-bucket', sampleRateHertz = 16000, encoding = 'LINEAR16') {

    const client = new speech.SpeechClient()

    let audio

    const config = {
        encoding: encoding,
        sampleRateHertz: sampleRateHertz,
        languageCode: languageCode,
    }

    const seconds = await getAudioDuration(filename)

    if (seconds >= 28800) {
        return { msg: 'Audio file is higher than 480 minute', status: StatusCodes.BAD_REQUEST }
    }
    else if (seconds <= 59) {
        audio = {
            content: fs.readFileSync(filename).toString('base64'),
        }
    } else if (seconds >= 60) {
        const uploaded = await audioUploadToBucket(bucket, filename, path.basename(filename))

        if (uploaded) {
            audio = {
                uri: `gs://${bucket}/${path.basename(filename)}`,
            }
        }
    }

    if (!audio) return { msg: `Error on try upload the file to google cloud bucket(${bucket}) storage`, status: StatusCodes.INTERNAL_SERVER_ERROR }

    const request = {
        config: config,
        audio: audio,
    }

    try {
        // Detects speech in the audio file. This creates a recognition job that you
        // can wait for now, or get its result later.
        const [operation] = await client.longRunningRecognize(request)

        console.log('===========> operationName: ', operation.name)

        return { msg: `success`, status: StatusCodes.OK, operationName: operation.name }
    } catch (error) {
        console.log('ERROR ON TRY TRANSCRIPT: ', error)
        return { msg: `Error on try transcript the file`, status: StatusCodes.INTERNAL_SERVER_ERROR }
    }
}

module.exports = speechToTextJob