Update app.mjs: start the Transcribe job from an S3 event record instead of an `audio_url` in the request body

Avs163 · web-flow · commit b9120a0916ba · 2025-03-11T12:47:40.000+05:30
diff --git a/apigw-lambda-transcribe-sam-js/src/app.mjs b/apigw-lambda-transcribe-sam-js/src/app.mjs
@@ -1,37 +1,106 @@
-import { TranscribeClient, StartTranscriptionJobCommand } from "@aws-sdk/client-transcribe";
-import { randomUUID } from 'crypto';
+import { S3Client, GetObjectCommand } from '@aws-sdk/client-s3';
+import { TranscribeClient, StartTranscriptionJobCommand } from '@aws-sdk/client-transcribe';
 
-export const lambda_handler = async (event, context) => {
-    try {
-        const requestBody = JSON.parse(event.body);
-        const s3_url = requestBody.audio_url;
-        
-        const transcribe = new TranscribeClient();
-        const job_name = `transcribe-${randomUUID()}`;
-        
-        const command = new StartTranscriptionJobCommand({
-            TranscriptionJobName: job_name,
-            Media: { MediaFileUri: s3_url },
-            MediaFormat: 'mp3',  // Adjust based on your needs
-            LanguageCode: 'en-US'  // Adjust based on your needs
-        });
-        
-        await transcribe.send(command);
-        
-        return {
-            statusCode: 200,
-            body: JSON.stringify({
-                job_name: job_name,
-                status: 'IN_PROGRESS'
-            })
-        };
-        
-    } catch (e) {
-        return {
-            statusCode: 500,
-            body: JSON.stringify({
-                error: e.toString()
-            })
-        };
+const s3Client = new S3Client({ region: process.env.REGION });
+const transcribeClient = new TranscribeClient({ region: process.env.REGION });
+
+// Transcribe only accepts job names matching ^[0-9a-zA-Z._-]+ with at most 200 characters.
+const UNSAFE_NAME_CHARS = /[^0-9a-zA-Z._-]/g;
+const MAX_JOB_NAME_LENGTH = 200;
+
+/**
+ * Starts an Amazon Transcribe job for the object named by the first record
+ * of an S3 event.
+ *
+ * The transcript is requested at `transcriptions/<name>.json` in the bucket
+ * that holds the media file. Only `.mp3`, `.wav` and `.flac` keys are accepted.
+ *
+ * @param {object} event - Event whose `Records[0].s3` carries `bucket.name` and `object.key`.
+ * @returns {Promise<{statusCode: number, body: string}>} 200 with the job name
+ *   and status once the job has been started, otherwise 500 with the error
+ *   message. Failures are logged and reported in the response, not rethrown.
+ */
+export const handler = async (event) => {
+  try {
+    const record = event && event.Records && event.Records[0];
+    if (!record || !record.s3) {
+      throw new Error('Event does not contain an S3 record');
+    }
+
+    // Get the S3 bucket and key from the event; the key is URL-decoded and
+    // every '+' is treated as a space.
+    const bucket = record.s3.bucket.name;
+    const key = decodeURIComponent(record.s3.object.key.replace(/\+/g, ' '));
+
+    console.log(`Processing file: s3://${bucket}/${key}`);
+
+    // Extract file name and extension for the transcription job
+    const fileName = key.split('/').pop();
+    const fileNameWithoutExt = fileName.substring(0, fileName.lastIndexOf('.')) || fileName;
+    const fileExt = fileName.substring(fileName.lastIndexOf('.') + 1).toLowerCase();
+
+    // Determine media format based on file extension
+    let mediaFormat;
+    switch (fileExt) {
+      case 'mp3':
+        mediaFormat = 'mp3';
+        break;
+      case 'wav':
+        mediaFormat = 'wav';
+        break;
+      case 'flac':
+        mediaFormat = 'flac';
+        break;
+      default:
+        throw new Error(`Unsupported file format: ${fileExt}`);
     }
-};
+
+    // The decoded file name can hold spaces and other characters that are not
+    // valid in a job name; replace them and leave room for the timestamp
+    // suffix that keeps job names unique.
+    const uniqueSuffix = `-${Date.now()}`;
+    const safeBaseName = fileNameWithoutExt
+      .replace(UNSAFE_NAME_CHARS, '_')
+      .slice(0, MAX_JOB_NAME_LENGTH - uniqueSuffix.length);
+    const transcriptionJobName = `${safeBaseName}${uniqueSuffix}`;
+
+    const mediaFileUri = `s3://${bucket}/${key}`;
+
+    const startTranscriptionParams = {
+      TranscriptionJobName: transcriptionJobName,
+      LanguageCode: 'en-US',
+      MediaFormat: mediaFormat,
+      Media: {
+        MediaFileUri: mediaFileUri
+      },
+      OutputBucketName: bucket,
+      // Reuse the sanitized name so the output key stays within the same safe character set.
+      OutputKey: `transcriptions/${safeBaseName}.json`
+    };
+
+    const transcriptionCommand = new StartTranscriptionJobCommand(startTranscriptionParams);
+    const transcriptionResponse = await transcribeClient.send(transcriptionCommand);
+
+    console.log(`Started transcription job: ${transcriptionJobName}`);
+    console.log(`Transcription job response: ${JSON.stringify(transcriptionResponse)}`);
+
+    return {
+      statusCode: 200,
+      body: JSON.stringify({
+        message: 'Transcription job started successfully',
+        jobName: transcriptionJobName,
+        jobStatus: transcriptionResponse.TranscriptionJob.TranscriptionJobStatus
+      })
+    };
+  } catch (error) {
+    console.error('Error processing the file:', error);
+
+    return {
+      statusCode: 500,
+      body: JSON.stringify({
+        message: 'Error starting transcription job',
+        error: error.message
+      })
+    };
+  }
+};