Spaces:

hsienchen
/

todo

Sleeping

App Files Files Community

todo / app.py

hsienchen

Update app.py

128b53d verified 9 months ago

raw

history blame

3.79 kB

	# refer to repo https://github.com/gradio-app/gradio/blob/main/demo/chatbot_multimodal/run.ipynb for enhancement

	import PIL.Image
	import gradio as gr
	import base64
	import time
	import os
	import google.generativeai as genai
	import requests

	import pathlib

	# --- Gemini configuration ---
	# Read the API key from the environment and register it with the SDK before
	# any model object is created, so configuration visibly precedes use.
	# `os` and `genai` are already imported at the top of the file.
	GOOGLE_API_KEY = os.getenv('GOOGLE_API_KEY')
	genai.configure(api_key=GOOGLE_API_KEY)

	# Text-only model and image-capable model; both are used by app1_response.
	txt_model = genai.GenerativeModel('gemini-pro')
	vis_model = genai.GenerativeModel('gemini-pro-vision')

	# Prompt sent with every request: asks for a "# Sender and Subject #" header
	# followed by three numbered action items, and includes one worked example.
	txt_prompt_1 = """The image contains the contents of a letter. I'd like to follow the request mentioned in the letter. Please provide 3 actionable items to assist me. When responding, use the following format:

	# Sender and Subject #
	1- Action 1 (no more than 20 words)
	2- Action 2 (no more than 20 words)
	3- Action 3 (no more than 20 words)

	For example:
	# From Richard regarding 'Shipping to Customer ABC' #
	1- Pack Product A
	2- Ship before 3:00 PM today
	3- Notify Richard after shipment
	"""

	# Not referenced anywhere else in the visible code.
	txt_display_1 = 'content of the letter: '

	# --- SMS gateway configuration ---
	# Endpoint URL and Authorization header value read by send_SMS; each is None
	# when the corresponding environment variable is unset.
	SMS_URL = os.getenv('SMS_URL')
	SMS_TOK = os.getenv('SMS_TOK')

	# Placeholder; not referenced anywhere else in the visible code.
	sms_text = "..."
	# Image to Base 64 Converter
	def image_to_base64(image_path):
	    """Return the bytes of the file at ``image_path`` as a Base64 text string."""
	    # Read everything first, then encode, so the file is closed before encoding.
	    with open(image_path, 'rb') as source:
	        raw_bytes = source.read()
	    return base64.b64encode(raw_bytes).decode('utf-8')

	# Sends the letter prompt (plus the screenshot, when one is provided) to Gemini and returns its reply for the output textbox
	def app1_response(img):
	    """Ask Gemini for the action items requested by ``txt_prompt_1``.

	    Args:
	        img: Path of the screenshot to analyse (the image boxes in this file
	            are created with ``type="filepath"``), or a falsy value when no
	            image was supplied.

	    Returns:
	        The text of the model's reply.
	    """
	    if not img:
	        # No screenshot: use the text-only model. Return the reply text, not
	        # the response object, so both branches hand the Textbox a string.
	        return txt_model.generate_content(txt_prompt_1).text

	    # The context manager closes the image file once the request has been made.
	    with PIL.Image.open(img) as image:
	        response = vis_model.generate_content([txt_prompt_1, image])
	    return response.text

	# NOTE: the SMS service ended in March 2024; to restore it, re-enable the service with Sinch Simple Text
	def send_SMS(resp_text):
	    """POST ``resp_text`` to the SMS gateway and return the gateway's reply.

	    Args:
	        resp_text: Message body to send.

	    Returns:
	        The body of the gateway's HTTP response, or a short error message
	        when the gateway URL is not configured or the request fails, so the
	        output textbox always receives readable text.
	    """
	    if not SMS_URL:
	        # SMS_URL comes from the environment and is None when unset.
	        return "SMS gateway is not configured (SMS_URL is not set)."

	    headers = {
	        "Authorization": SMS_TOK,
	        "Content-Type": "application/json",
	    }
	    # Sender and recipient numbers are hard-coded.
	    payload = {
	        "from": "12085686834",
	        "to": ["18587331029"],
	        "body": resp_text,
	    }

	    try:
	        # requests does not time out by default; bound the wait so an
	        # unresponsive gateway cannot block the handler forever.
	        response = requests.post(SMS_URL, json=payload, headers=headers, timeout=10)
	    except requests.RequestException as err:
	        return f"SMS request failed: {err}"
	    return response.text

	# gradio block
	# "To-Dos" tab: paste a screenshot, generate action items, optionally text them.
	with gr.Blocks() as app1:
	    with gr.Column():
	        gr.Markdown("```for email and/or instruction, paste screenshot here...```")
	        image_box = gr.Image(type="filepath")
	        btn1 = gr.Button("generate To-Dos")
	        out1 = gr.Textbox(label="here are the actionables...")
	        btn2 = gr.Button("Send to Mobile")
	        out2 = gr.Textbox(label="response from SMS gateway...")

	    # btn1: screenshot path -> app1_response -> out1.
	    # btn2: text currently in out1 -> send_SMS -> out2.
	    btn1.click(fn=app1_response, inputs=[image_box], outputs=out1)
	    btn2.click(fn=send_SMS, inputs=out1, outputs=out2)

	    # Usage notes shown under the controls. The click step names the actual
	    # button label ("generate To-Dos"); no control here is called "Make a Plan".
	    gr.Markdown("""
	# Make a Plan #

	- screen capture (Win + shift + S)
	- click "generate To-Dos" to submit the screenshot
	- await LLM Bot (Gemini, in this case) response
	- receive THREE actionable items

	[demo](https://youtu.be/lJ4jIAEVRNY)

	""")

	# "SOS" tab: paste an inventory screenshot, generate a list, optionally text it.
	# NOTE(review): this tab reuses app1_response, which always sends the
	# letter-oriented txt_prompt_1 - confirm that is intended for inventory
	# screenshots.
	with gr.Blocks() as app2:
	    with gr.Column():
	        gr.Markdown("```Stock-Out Shamer, paste ERP Inv screenshot here...```")
	        image_box = gr.Image(type="filepath")
	        btn1 = gr.Button("check ROQ")
	        out1 = gr.Textbox(label="here is the watch list...")
	        btn2 = gr.Button("send out reminders")
	        out2 = gr.Textbox(label="response or feed back?")

	    # btn1: screenshot path -> app1_response -> out1.
	    # btn2: text currently in out1 -> send_SMS -> out2.
	    btn1.click(fn=app1_response, inputs=[image_box], outputs=out1)
	    btn2.click(fn=send_SMS, inputs=out1, outputs=out2)

	    # Usage notes shown under the controls. The click step names the actual
	    # button label ("check ROQ"); no control here is called "Make a Plan".
	    gr.Markdown("""
	# Make a Plan #

	- screen capture (Win + shift + S)
	- click "check ROQ" to submit the screenshot
	- await LLM Bot (Gemini, in this case) response
	- receive THREE actionable items

	[demo](https://youtu.be/lJ4jIAEVRNY)

	""")

	# Top-level page: a heading plus one tab per sub-app defined above.
	with gr.Blocks() as demo:
	    gr.Markdown("## Workflow Bot ##")
	    gr.TabbedInterface(
	        interface_list=[app1, app2],
	        tab_names=["To-Dos", "SOS"],
	    )

	# queue() returns the same Blocks object, so enabling the queue and launching
	# can be chained into one statement.
	demo.queue().launch()