Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -476,6 +476,14 @@ STANDARD_TEXT_MODELS = [
|
|
| 476 |
"openai/custom_model",
|
| 477 |
]
|
| 478 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 479 |
STANDARD_AUDIO_MODELS = [
|
| 480 |
"tts-1",
|
| 481 |
"tts-1-hd",
|
|
@@ -536,27 +544,29 @@ def get_mp3(text: str, voice: str, audio_model: str, api_key: str = None,
|
|
| 536 |
|
| 537 |
from functools import wraps
|
| 538 |
|
| 539 |
-
def conditional_llm(model, api_base=None, api_key=None):
|
| 540 |
"""
|
| 541 |
Conditionally apply the @llm decorator based on the api_base parameter.
|
| 542 |
If api_base is provided, it applies the @llm decorator with api_base.
|
| 543 |
Otherwise, it applies the @llm decorator without api_base.
|
| 544 |
"""
|
| 545 |
-
|
| 546 |
-
#for o-x reasoning models (o1, o3, o4, ...)
|
| 547 |
-
reasoning_effort="high"
|
| 548 |
|
| 549 |
def decorator(func):
|
| 550 |
if api_base:
|
| 551 |
-
return llm(model=model, api_base=api_base,
|
| 552 |
else:
|
| 553 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 554 |
return decorator
|
| 555 |
|
| 556 |
def generate_audio(
|
| 557 |
files: list,
|
| 558 |
openai_api_key: str = None,
|
| 559 |
text_model: str = "o4-mini", #o1-2024-12-17", #"o1-preview-2024-09-12",
|
|
|
|
| 560 |
audio_model: str = "tts-1",
|
| 561 |
speaker_1_voice: str = "alloy",
|
| 562 |
speaker_2_voice: str = "echo",
|
|
@@ -781,6 +791,13 @@ with gr.Blocks(title="PDF to Audio", css="""
|
|
| 781 |
value="o3-mini", #"o4-mini", #"o1-preview-2024-09-12", #"gpt-4o-mini",
|
| 782 |
info="Select the model to generate the dialogue text.",
|
| 783 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 784 |
audio_model = gr.Dropdown(
|
| 785 |
label="Audio Generation Model",
|
| 786 |
choices=STANDARD_AUDIO_MODELS,
|
|
@@ -890,7 +907,7 @@ with gr.Blocks(title="PDF to Audio", css="""
|
|
| 890 |
submit_btn.click(
|
| 891 |
fn=validate_and_generate_audio,
|
| 892 |
inputs=[
|
| 893 |
-
files, openai_api_key, text_model, audio_model,
|
| 894 |
speaker_1_voice, speaker_2_voice, speaker_1_instructions, speaker_2_instructions,
|
| 895 |
api_base,
|
| 896 |
intro_instructions, text_instructions, scratch_pad_instructions,
|
|
@@ -920,7 +937,7 @@ with gr.Blocks(title="PDF to Audio", css="""
|
|
| 920 |
),
|
| 921 |
inputs=[
|
| 922 |
use_edited_transcript, edited_transcript,
|
| 923 |
-
files, openai_api_key, text_model, audio_model,
|
| 924 |
speaker_1_voice, speaker_2_voice, speaker_1_instructions, speaker_2_instructions,
|
| 925 |
api_base,
|
| 926 |
intro_instructions, text_instructions, scratch_pad_instructions,
|
|
|
|
| 476 |
"openai/custom_model",
|
| 477 |
]
|
| 478 |
|
| 479 |
+
REASONING_EFFORTS = [
|
| 480 |
+
"N/A",
|
| 481 |
+
"low",
|
| 482 |
+
"medium",
|
| 483 |
+
"high",
|
| 484 |
+
]
|
| 485 |
+
|
| 486 |
+
|
| 487 |
STANDARD_AUDIO_MODELS = [
|
| 488 |
"tts-1",
|
| 489 |
"tts-1-hd",
|
|
|
|
| 544 |
|
| 545 |
from functools import wraps
|
| 546 |
|
| 547 |
+
def conditional_llm(model, api_base=None, api_key=None, reasoning_effort=None):
    """
    Conditionally apply the @llm decorator based on the api_base parameter.

    If api_base is provided, the @llm decorator is applied with api_base
    (reasoning_effort is not forwarded on this path — NOTE(review): confirm
    whether custom endpoints should also receive it).
    Otherwise the decorator is applied with api_key, and reasoning_effort
    is forwarded only when it is an actual effort level ("low"/"medium"/
    "high"), not the "N/A" placeholder or an unset value.
    """
    def decorator(func):
        if api_base:
            return llm(model=model, api_base=api_base)(func)
        # Treat both the "N/A" dropdown choice and an unset value (None) as
        # "do not send reasoning_effort". Previously None fell through to the
        # else branch and reasoning_effort=None was passed to llm(), even
        # though the UI dropdown defaults to value=None.
        if reasoning_effort in (None, "N/A"):
            return llm(model=model, api_key=api_key)(func)
        return llm(model=model, api_key=api_key, reasoning_effort=reasoning_effort)(func)
    return decorator
|
| 564 |
|
| 565 |
def generate_audio(
|
| 566 |
files: list,
|
| 567 |
openai_api_key: str = None,
|
| 568 |
text_model: str = "o4-mini", #o1-2024-12-17", #"o1-preview-2024-09-12",
|
| 569 |
+
    reasoning_effort: str = None,
|
| 570 |
audio_model: str = "tts-1",
|
| 571 |
speaker_1_voice: str = "alloy",
|
| 572 |
speaker_2_voice: str = "echo",
|
|
|
|
| 791 |
value="o3-mini", #"o4-mini", #"o1-preview-2024-09-12", #"gpt-4o-mini",
|
| 792 |
info="Select the model to generate the dialogue text.",
|
| 793 |
)
|
| 794 |
+
reasoning_effort = gr.Dropdown(
|
| 795 |
+
label="Reasoning effort (for reasoning models, e.g. o1, o3, o4)",
|
| 796 |
+
choices=REASONING_EFFORTS,
|
| 797 |
+
value=None,  #"o3-mini", #"o4-mini", #"o1-preview-2024-09-12", #"gpt-4o-mini",
|
| 798 |
+
info="Select reasoning effort used.",
|
| 799 |
+
)
|
| 800 |
+
|
| 801 |
audio_model = gr.Dropdown(
|
| 802 |
label="Audio Generation Model",
|
| 803 |
choices=STANDARD_AUDIO_MODELS,
|
|
|
|
| 907 |
submit_btn.click(
|
| 908 |
fn=validate_and_generate_audio,
|
| 909 |
inputs=[
|
| 910 |
+
files, openai_api_key, text_model, reasoning_effort, audio_model,
|
| 911 |
speaker_1_voice, speaker_2_voice, speaker_1_instructions, speaker_2_instructions,
|
| 912 |
api_base,
|
| 913 |
intro_instructions, text_instructions, scratch_pad_instructions,
|
|
|
|
| 937 |
),
|
| 938 |
inputs=[
|
| 939 |
use_edited_transcript, edited_transcript,
|
| 940 |
+
files, openai_api_key, text_model, reasoning_effort, audio_model,
|
| 941 |
speaker_1_voice, speaker_2_voice, speaker_1_instructions, speaker_2_instructions,
|
| 942 |
api_base,
|
| 943 |
intro_instructions, text_instructions, scratch_pad_instructions,
|