Spaces:
Running
on
T4
Running
on
T4
""" | |
constants.py | |
""" | |
import os | |
from pathlib import Path | |
# Key constants | |
APP_TITLE = "Open NotebookLM" | |
CHARACTER_LIMIT = 100_000 | |
# Gradio-related constants | |
GRADIO_CACHE_DIR = "./gradio_cached_examples/tmp/" | |
GRADIO_CLEAR_CACHE_OLDER_THAN = 1 * 24 * 60 * 60 # 1 day | |
# Error messages-related constants | |
ERROR_MESSAGE_NO_INPUT = "Please provide at least one PDF file or a URL." | |
ERROR_MESSAGE_NOT_PDF = "The provided file is not a PDF. Please upload only PDF files." | |
ERROR_MESSAGE_NOT_SUPPORTED_IN_MELO_TTS = "The selected language is not supported without advanced audio generation. Please enable advanced audio generation or choose a supported language." | |
ERROR_MESSAGE_READING_PDF = "Error reading the PDF file" | |
ERROR_MESSAGE_TOO_LONG = "The total content is too long. Please ensure the combined text from PDFs and URL is fewer than {CHARACTER_LIMIT} characters." | |
# Fireworks API-related constants | |
FIREWORKS_API_KEY = os.getenv("FIREWORKS_API_KEY") | |
FIREWORKS_BASE_URL = "https://api.fireworks.ai/inference/v1" | |
FIREWORKS_MAX_TOKENS = 16_384 | |
FIREWORKS_MODEL_ID = "accounts/fireworks/models/llama-v3p1-405b-instruct" | |
FIREWORKS_TEMPERATURE = 0.1 | |
FIREWORKS_JSON_RETRY_ATTEMPTS = 3 | |
# MeloTTS | |
MELO_API_NAME = "/synthesize" | |
MELO_TTS_SPACES_ID = "mrfakename/MeloTTS" | |
MELO_RETRY_ATTEMPTS = 3 | |
MELO_RETRY_DELAY = 5 # in seconds | |
MELO_TTS_LANGUAGE_MAPPING = { | |
"en": "EN", | |
"es": "ES", | |
"fr": "FR", | |
"zh": "ZJ", | |
"ja": "JP", | |
"ko": "KR", | |
} | |
# Suno related constants | |
SUNO_LANGUAGE_MAPPING = { | |
"English": "en", | |
"Chinese": "zh", | |
"French": "fr", | |
"German": "de", | |
"Hindi": "hi", | |
"Italian": "it", | |
"Japanese": "ja", | |
"Korean": "ko", | |
"Polish": "pl", | |
"Portuguese": "pt", | |
"Russian": "ru", | |
"Spanish": "es", | |
"Turkish": "tr", | |
} | |
# General audio-related constants | |
NOT_SUPPORTED_IN_MELO_TTS = list( | |
set(SUNO_LANGUAGE_MAPPING.values()) - set(MELO_TTS_LANGUAGE_MAPPING.keys()) | |
) | |
NOT_SUPPORTED_IN_MELO_TTS = [ | |
key for key, id in SUNO_LANGUAGE_MAPPING.items() if id in NOT_SUPPORTED_IN_MELO_TTS | |
] | |
# Jina Reader-related constants | |
JINA_READER_URL = "https://r.jina.ai/" | |
JINA_RETRY_ATTEMPTS = 3 | |
JINA_RETRY_DELAY = 5 # in seconds | |
# UI-related constants | |
UI_DESCRIPTION = """ | |
<table style="border-collapse: collapse; border: none; padding: 20px;"> | |
<tr style="border: none;"> | |
<td style="border: none; vertical-align: top; padding-right: 30px; padding-left: 30px;"> | |
<img src="https://raw.githubusercontent.com/gabrielchua/daily-ai-papers/main/_includes/icon.png" alt="Open NotebookLM" width="120" style="margin-bottom: 10px;"> | |
</td> | |
<td style="border: none; vertical-align: top; padding: 10px;"> | |
<p style="margin-bottom: 15px;">Convert your PDFs into podcasts with open-source AI models (<a href="https://huggingface.co/meta-llama/Llama-3.1-405B">Llama 3.1 405B</a>, <a href="https://huggingface.co/myshell-ai/MeloTTS-English">MeloTTS</a>, <a href="https://huggingface.co/suno/bark">Bark</a>).</p> | |
<p style="margin-top: 15px;">Note: Only the text content of the PDFs will be processed. Images and tables are not included. The total content should be no more than 100,000 characters due to the context length of Llama 3.1 405B.</p> | |
</td> | |
</tr> | |
</table> | |
""" | |
UI_AVAILABLE_LANGUAGES = list(set(SUNO_LANGUAGE_MAPPING.keys())) | |
UI_INPUTS = { | |
"file_upload": { | |
"label": "1. π Upload your PDF(s)", | |
"file_types": [".pdf"], | |
"file_count": "multiple", | |
}, | |
"url": { | |
"label": "2. π Paste a URL (optional)", | |
"placeholder": "Enter a URL to include its content", | |
}, | |
"question": { | |
"label": "3. π€ Do you have a specific question or topic in mind?", | |
"placeholder": "Enter a question or topic", | |
}, | |
"tone": { | |
"label": "4. π Choose the tone", | |
"choices": ["Fun", "Formal"], | |
"value": "Fun", | |
}, | |
"length": { | |
"label": "5. β±οΈ Choose the length", | |
"choices": ["Short (1-2 min)", "Medium (3-5 min)"], | |
"value": "Medium (3-5 min)", | |
}, | |
"language": { | |
"label": "6. π Choose the language", | |
"choices": UI_AVAILABLE_LANGUAGES, | |
"value": "English", | |
}, | |
"advanced_audio": { | |
"label": "7. π Use advanced audio generation? (Experimental)", | |
"value": False, | |
}, | |
} | |
UI_OUTPUTS = { | |
"audio": {"label": "π Podcast", "format": "mp3"}, | |
"transcript": { | |
"label": "π Transcript", | |
}, | |
} | |
UI_API_NAME = "generate_podcast" | |
UI_ALLOW_FLAGGING = "never" | |
UI_CONCURRENCY_LIMIT = 3 | |
UI_EXAMPLES = [ | |
[ | |
[str(Path("examples/1310.4546v1.pdf"))], | |
"", | |
"Explain this paper to me like I'm 5 years old", | |
"Fun", | |
"Short (1-2 min)", | |
"English", | |
True, | |
], | |
[ | |
[], | |
"https://en.wikipedia.org/wiki/Hugging_Face", | |
"How did Hugging Face become so successful?", | |
"Fun", | |
"Short (1-2 min)", | |
"English", | |
False, | |
], | |
[ | |
[], | |
"https://simple.wikipedia.org/wiki/Taylor_Swift", | |
"Why is Taylor Swift so popular?", | |
"Fun", | |
"Short (1-2 min)", | |
"English", | |
False, | |
], | |
] | |
UI_CACHE_EXAMPLES = True | |
UI_SHOW_API = True | |