Change default output filename in the audiogen app

gmiodice · kshitij-sisodia-arm · commit e5dcc9d1ff3f · 2025-09-09T13:10:42.000+01:00
- The new default output filename is <prompt>_<seed>.wav

Signed-off-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
diff --git a/kleidiai-examples/audiogen/app/README.md b/kleidiai-examples/audiogen/app/README.md
@@ -68,10 +68,10 @@ From there, you can then run the `audiogen` application, which requires just thr
 - **CPU Threads (-t)**: The number of CPU threads to use (e.g., `4`)
 
 ```bash
-./audiogen -m . -p "warm arpeggios on house beats 120BPM with drums effect" -t 4
+./audiogen -m $LITERT_MODELS_PATH -p "warm arpeggios on house beats 120BPM with drums effect" -t 4
 ```
 
-If everything runs successfully, the generated audio will be saved in `.wav` format (`output.wav`) in the `audiogen_app` folder. At this point, you can play it on your laptop or PC.
+If everything runs successfully, the generated audio will be saved in `.wav` format (`warm_arpeggios_on_house_beats_120bpm_with_drums_effect_99.wav`) in the `audiogen_app` folder. At this point, you can play it on your laptop or PC.
 
 ### Build the audiogen app on Linux® (HOST) or macOS® (HOST) for Android™ (TARGET)
 
@@ -168,8 +168,8 @@ From there, you can then run the `audiogen` application, which requires just thr
 ./audiogen -m . -p "warm arpeggios on house beats 120BPM with drums effect" -t 4
 ```
 
-If everything runs successfully, the generated audio will be saved in `.wav` format (`output.wav`) in the same directory as the `audiogen` binary. At this point, you can then retrieve it using the `adb` tool from a different Terminal and play it on your laptop or PC.
+If everything runs successfully, the generated audio will be saved in `.wav` format (`warm_arpeggios_on_house_beats_120bpm_with_drums_effect_99.wav`) in the same directory as the `audiogen` binary. At this point, you can then retrieve it using the `adb` tool from a different Terminal and play it on your laptop or PC.
 
 ```bash
-adb pull data/local/tmp/output.wav
+adb pull data/local/tmp/warm_arpeggios_on_house_beats_120bpm_with_drums_effect_99.wav
 ```
diff --git a/kleidiai-examples/audiogen/app/audiogen.cpp b/kleidiai-examples/audiogen/app/audiogen.cpp
@@ -43,7 +43,6 @@
 constexpr size_t k_seed_default = 99;
 constexpr size_t k_audio_len_sec_default = 10;
 constexpr size_t k_num_steps_default = 8;
-const std::string k_output_file_default = "output.wav";
 
 // -- Update the tensor index based on your model configuration.
 constexpr size_t k_t5_ids_in_idx = 0;
@@ -85,13 +84,23 @@ static void print_usage(const char *name) {
         "  -s <seed>               (Optional) Random seed for reproducibility. Different seeds generate different audio samples (Default: %zu)\n"
         "  -l <audio_len_sec>      (Optional) Length of generated audio (Default: %zu s)\n"
         "  -n <num_steps>          (Optional) Number of steps (Default: %zu)\n"
-        "  -o <output_file>        (Optional) Output audio file name (Default: %s)\n"
+        "  -o <output_file>        (Optional) Output audio file name (Default: <prompt>_<seed>.wav)\n"
         "  -h                      Show this help message\n",
         name,
         k_seed_default,
         k_audio_len_sec_default,
-        k_num_steps_default,
-        k_output_file_default.c_str());
+        k_num_steps_default);
+}
+
+static std::string get_filename(std::string prompt, size_t seed) {
+    // Convert spaces to underscores
+    std::replace(prompt.begin(), prompt.end(), ' ', '_');
+
+    // Convert to lowercase
+    std::transform(prompt.begin(), prompt.end(), prompt.begin(),
+                   [](unsigned char c) { return std::tolower(c); });
+
+    return prompt + "_" + std::to_string(seed) + ".wav";
 }
 
 static std::vector<int32_t> convert_prompt_to_ids(const std::string& prompt, const std::string& spiece_model_path) {
@@ -220,7 +229,7 @@ int main(int32_t argc, char** argv) {
     std::string prompt           = "";
     size_t num_threads           = 0;
     // Optional arguments
-    std::string output_file      = k_output_file_default;
+    std::string output_file      = "";
     size_t seed                  = k_seed_default;
     size_t num_steps             = k_num_steps_default;
     float audio_len_sec          = static_cast<float>(k_audio_len_sec_default);
@@ -436,6 +445,11 @@ int main(int32_t argc, char** argv) {
     const float* left_ch = autoencoder_out_data;
     const float* right_ch = autoencoder_out_data + num_audio_samples;
 
+    // If output filename empty -> filename = <prompt>_<seed>.wav
+    if (output_file.empty()) {
+        output_file = get_filename(prompt, seed);
+    }
+
     save_as_wav(output_file.c_str(), left_ch, right_ch, num_audio_samples);
 
     // Save the file