Spaces:

gabrielchua
/

open-notebooklm

Running on T4

App Files Files Community

knowsuchagency commited on Jul 20

Commit

3cf1f43

•

1 Parent(s): 8729c75

replace gemini with gpt 4o-mini

Browse files

Files changed (1) hide show

main.py +5 -14

main.py CHANGED Viewed

@@ -60,24 +60,19 @@ def get_mp3(text: str, voice: str, api_key: str = None) -> bytes:
             return file.getvalue()
-def generate_audio(
-    file: str,
-    openai_api_key: str = None,
-    gemini_api_key: str = None,
-) -> bytes:
     if not os.getenv("OPENAI_API_KEY", openai_api_key):
         raise gr.Error("OpenAI API key is required")
-    if not os.getenv("GEMINI_API_KEY", gemini_api_key):
-        raise gr.Error("Gemini API key is required")
     with Path(file).open("rb") as f:
         reader = PdfReader(f)
         text = "\n\n".join([page.extract_text() for page in reader.pages])
     @retry(retry=retry_if_exception_type(ValidationError))
-    @llm(model="gemini/gemini-1.5-flash", max_tokens=8192, api_key=gemini_api_key)
     def generate_dialogue(text: str) -> Dialogue:
         """
         Your task is to take the input text provided and turn it into an engaging, informative podcast dialogue. The input text may be messy or unstructured, as it could come from a variety of sources like PDFs or web pages. Don't worry about the formatting issues or any irrelevant information; your goal is to extract the key points and interesting facts that could be discussed in a podcast.
@@ -166,16 +161,12 @@ demo = gr.Interface(
             label="OpenAI API Key",
             visible=not os.getenv("OPENAI_API_KEY"),
         ),
-        gr.Textbox(
-            label="Gemini API Key",
-            visible=not os.getenv("GEMINI_API_KEY"),
-        ),
     ],
     outputs=[
         gr.Audio(label="Audio", format="mp3"),
         gr.Textbox(label="Transcript"),
     ],
-    allow_flagging=False,
     clear_btn=None,
     head=os.getenv("HEAD", "") + Path("head.html").read_text(),
     cache_examples="lazy",

             return file.getvalue()
+def generate_audio(file: str, openai_api_key: str = None) -> bytes:
     if not os.getenv("OPENAI_API_KEY", openai_api_key):
         raise gr.Error("OpenAI API key is required")
     with Path(file).open("rb") as f:
         reader = PdfReader(f)
         text = "\n\n".join([page.extract_text() for page in reader.pages])
     @retry(retry=retry_if_exception_type(ValidationError))
+    @llm(
+        model="gpt-4o-mini",
+    )
     def generate_dialogue(text: str) -> Dialogue:
         """
         Your task is to take the input text provided and turn it into an engaging, informative podcast dialogue. The input text may be messy or unstructured, as it could come from a variety of sources like PDFs or web pages. Don't worry about the formatting issues or any irrelevant information; your goal is to extract the key points and interesting facts that could be discussed in a podcast.
             label="OpenAI API Key",
             visible=not os.getenv("OPENAI_API_KEY"),
         ),
     ],
     outputs=[
         gr.Audio(label="Audio", format="mp3"),
         gr.Textbox(label="Transcript"),
     ],
+    allow_flagging="never",
     clear_btn=None,
     head=os.getenv("HEAD", "") + Path("head.html").read_text(),
     cache_examples="lazy",