add cmd flags

aashish-joshi · aashish-joshi · commit c9e7f542c21f · 2024-08-05T18:48:04.000+05:30
diff --git a/README.md b/README.md
@@ -7,9 +7,31 @@ The project is written in Go and executables are provided for Windows, MacOS, an
 ## Usage
 
 1. Get an API key from [Deepgram](https://www.deepgram.com/) and add it to your environment variables as `DEEPGRAM_API_KEY`.
-2. Create a CSV file with the following columns:
+2. Create a CSV file with the following columns (use the provided `sample-scripts.csv` as a template):
     - `label`: The label for the script. This will be used as the file name.
     - `script`: The text to be converted to speech.
-3. Run the executable. It will try and read the csv locally from `./scripts.csv`. If it doesn't exist, it will ask for the path to the CSV file.
-4. The audio files will be saved in the `audio/` directory.
+3. Download the executable for your OS from the [releases](https://github.com/aashish-joshi/tts-bulk/releases) page.
+4. Run the tool. By default it reads the CSV from `scripts.csv` in the current directory. If the file doesn't exist, the tool prints an error and exits; use the `-csv` flag to point it at a different file.
 
+### Command-line flags
+
+The following flags are supported at the moment.
+
+- `-format`: The format of the audio file. Supported formats are `wav` and `mp3`. Default is `mp3`.
+- `-output`: The output directory where the audio files will be saved. Default is `audio/`.
+- `-csv`: The path to the CSV file. Default is `scripts.csv`.
+- `-model`: The Deepgram model name used to generate the audio. Default is `aura-asteria-en`.
+
+### Example
+
+1. Generate mp3 files in the default location.
+    
+    ```bash
+    ./tts-bulk
+    ```
+
+2. Generate wav files in a custom location.
+
+    ```bash
+    ./tts-bulk -format=wav -output=/path/to/output
+    ```
diff --git a/tts-bulk.go b/tts-bulk.go
@@ -3,9 +3,11 @@ package main
 import (
 	"context"
 	"encoding/csv"
+	"flag"
 	"fmt"
 	"os"
 	"path/filepath"
+	"strings"
 	"sync"
 	"time"
 
@@ -24,6 +26,29 @@ func checkDeepgramKey() error {
 
 func main() {
 
+	var dgContainer, dgEncoding string
+
+	// Define the commandline flags
+	dgModelName := flag.String("model", "aura-asteria-en", "Deepgram model name. Defaults to aura-asteria-en")
+	dgFileFormat := flag.String("format", "mp3", "File format for the generated audio files. Defaults to mp3")
+	outputFolder := flag.String("output", "audio", "Output folder for the generated audio files.")
+	csvLocation := flag.String("csv", "scripts.csv", "Location of the CSV file containing the scripts to convert to audio.")
+	// parse the commandline flags
+	flag.Parse()
+
+	// If the DG file format is neither wav nor mp3, raise error.
+	if strings.ToLower(*dgFileFormat) != "wav" && strings.ToLower(*dgFileFormat) != "mp3" {
+		fmt.Println("Invalid file format. Only wav and mp3 are supported.")
+		return
+	}
+
+	if strings.ToLower(*dgFileFormat) == "wav" {
+		dgContainer = "wav"
+		dgEncoding = "linear16"
+	} else {
+		dgContainer = ""
+		dgEncoding = "mp3"
+	}
 	// First check if the Deepgram API key is set
 	if dgErr := checkDeepgramKey(); dgErr != nil {
 		fmt.Println(dgErr)
@@ -38,22 +63,23 @@ func main() {
 
 	// set the Transcription options
 	options := &interfaces.SpeakOptions{
-		Model: "aura-asteria-en",
+		Model:     strings.ToLower(*dgModelName),
+		Container: dgContainer,
+		Encoding:  dgEncoding,
 	}
 
 	// create a Deepgram client
 	c := client.NewRESTWithDefaults()
 	dg := api.New(c)
 
 	// Check if the file exists
-	fileName := "scripts.csv"
-	if _, err := os.Stat(fileName); os.IsNotExist(err) {
-		fmt.Print("Enter the name of the CSV file: ")
-		fmt.Scanln(&fileName)
+	if _, err := os.Stat(*csvLocation); os.IsNotExist(err) {
+		fmt.Print("The file does not exist. Please enter the correct file path.")
+		return
 	}
 
 	// Open the CSV file
-	file, err := os.Open(fileName)
+	file, err := os.Open(*csvLocation)
 	if err != nil {
 		fmt.Printf("Error opening CSV file: %s\n", err)
 		return
@@ -71,7 +97,7 @@ func main() {
 	}
 
 	// Create the "audio" directory if it doesn't exist
-	audioDir := "audio"
+	audioDir := strings.ToLower(*outputFolder)
 	if _, err := os.Stat(audioDir); os.IsNotExist(err) {
 		err := os.Mkdir(audioDir, 0755)
 		if err != nil {
@@ -101,7 +127,7 @@ func main() {
 			defer wg.Done()
 
 			// Perform TTS and save to disk
-			audioPath := filepath.Join(audioDir, fmt.Sprintf("%s.mp3", label))
+			audioPath := filepath.Join(audioDir, fmt.Sprintf("%s.%s", label, *dgFileFormat))
 			err := generateTTSAndSave(ctx, dg, script, options, audioPath)
 			if err != nil {
 				fmt.Printf("Could not generate TTS for row %v - %v: %v\n", i, label, err)