modified summarization to openai

joshsoftware · Aug 23, 2024 · 2a245d5 · 2a245d5
1 parent 64d01be
commit 2a245d5
Show file tree

Hide file tree

Showing 5 changed files with 56 additions and 23 deletions.
diff --git a/app.py b/app.py
@@ -2,57 +2,84 @@
 import whisper
 import gradio as gr
 import ollama
+import logging
+from logger import logger
+import openai
+
+# Load environment variables
+load_dotenv()
 
 # Import configurations and functions from modules
 from config import openai_api_key, model_id, model_path
 from load_model import load_model
 #from extract_entities import extract_entities
 
-# Load environment variables
-load_dotenv()
-
+openai.api_key = openai_api_key
 #Load whisher model
 model = load_model(model_id, model_path)
 
+
 #transcripe the audio to its original language
+def process_all_steps(audio):
+    #transcription =transcribe(audio)
+    translation = translate_with_whisper(audio)
+    #translation = translate_with_ollama(transcription)
+    #summary = summarize_using_llama(translation)
+    summary = summarize_using_openai(translation)
+    #return [transcription, translation, summary]
+    return [translation, summary]
+
 def transcribe(audio):
-    result = model.transcribe(audio)
+    logger.info("Started transciption")
+    result = model.transcribe(audio,fp16=False)
     transcription = result["text"]
-    #translation = translate_with_whisper(audio)
-    translation = translate_with_ollama(transcription)
-    summary = summarize(translation)
-    return [transcription, translation, summary]
+    return transcription
 
 #translate the audio file to English language using whisper model
 def translate_with_whisper(audio): 
+    logger.info("Started transciption through whishper")
     options = dict(beam_size=5, best_of=5)
     translate_options = dict(task="translate", **options)
     result = model.transcribe(audio,**translate_options)
     return result["text"]
 
 #translate the text from transciption to English language
 def translate_with_ollama(text):
-    #Uncomment any of the below line to test the translation if don't have an audio file
-    #text = "मुलाखतकार: आम्ही जेनीशी बोलत आहोत. तर तुमचा सध्याचा व्यवसाय काय आहे?\nमुलाखत घेणारा: मी एक सहाय्यक दिग्दर्शक आहे [???] मुळात [???].\nमुलाखतकर्ता: आणि म्हणून तुम्ही या विशिष्ट पदावर किती काळ आहात?\nमुलाखत घेणारा: आम्ही जेनीशी बोलत आहोत. . तर तुमचा सध्याचा व्यवसाय काय आहे?\nमुलाखत घेणारा: मी एक सहाय्यक दिग्दर्शक आहे [???] मुळात [???].\nमुलाखत घेणारा: आणि म्हणून तुम्ही या विशिष्ट पदावर किती काळ आहात?\nमुलाखत घेणारा: मी या विशिष्ट पदावर आहे. स्थिती - ४ वर्षे झाली आहेत.\nमुलाखतकार: तुम्ही आजपर्यंतच्या तुमच्या कामाचे किंवा करिअरच्या इतिहासाचे थोडक्यात वर्णन करू शकता का?\nमुलाखत घेणारा: माझी कारकीर्द अशी आहे की, सुरुवातीच्या काळात ती स्पेशलायझेशनच्या वेगवेगळ्या क्षेत्रात अनेक क्लिनिकल भूमिकांसह सुरू झाली. नर्सिंग [???] उद्योग आणि [???] प्लॅस्टिक [???] संपूर्ण भिन्न प्रकार आणि नंतर मी पुनर्वसन मध्ये हलविले. मी 15 वर्षे [???] होतो आणि नंतर मुळात मी 26 वर्षांचा होतो तेव्हा व्यवस्थापनाच्या भूमिकेत गेलो आणि गेली 27 वर्षे व्यवस्थापनाच्या भूमिकेत काम करत होतो आणि होय, सुमारे 20 वर्षे मी व्यवस्थापनात काम करत आहे आणि मुळात ते केले पुनर्वसन समुपदेशनातील एक पुनर्वसन पदवी, जी मला वाटते [???] खेळली, त्यामुळे [???] नर्सिंगच्या पारंपारिक क्लिनिकल भूमिकेपासून काही बाबतीत भिन्न विलंब.\nमुलाखतकार: होय, मला पहिली गोष्ट वाटते [???] व्यापकपणे सांगायचे तर, तुम्ही नर्सिंगमध्ये जाण्याचे का निवडले?\nमुलाखत घेणारा: कारण मला प्रशिक्षण आणि नोकरीसाठी एकाच वेळी पैसे दिले गेले. 70 च्या दशकात, नोकऱ्या आणि नोकरीमध्ये गोष्टी खूप वेगळ्या होत्या... मुलाखत घेणारा: मी या विशिष्ट स्थितीत आहे - त्याला 4 वर्षे झाली आहेत.]n मुलाखतकार: तुम्ही तुमच्या कामाचे किंवा करिअरच्या इतिहासाचे थोडक्यात वर्णन करू शकता का? आजपर्यंत?\nमुलाखत घेणारा: माझी कारकीर्द अशी आहे की, सुरुवातीला नर्सिंग [???] उद्योग आणि [???] प्लॅस्टिक [???] ते संपूर्ण भिन्न क्षेत्रात विशेषीकरणाच्या विविध क्षेत्रांमध्ये क्लिनिकल भूमिकांपासून सुरुवात झाली. विविधता आणि नंतर मी पुनर्वसन मध्ये हलविले. मी 15 वर्षे [???] होतो आणि नंतर मुळात मी 26 वर्षांचा होतो तेव्हा व्यवस्थापनाच्या भूमिकेत गेलो आणि गेली 27 वर्षे व्यवस्थापनाच्या भूमिकेत काम करत होतो आणि होय, सुमारे 20 वर्षे मी व्यवस्थापनात काम करत आहे आणि मुळात ते केले पुनर्वसन समुपदेशनातील एक पुनर्वसन पदवी, जी मला वाटते [???] खेळली, त्यामुळे [???] नर्सिंगच्या पारंपारिक क्लिनिकल भूमिकेपासून काही बाबतीत भिन्न विलंब.\nमुलाखतकार: होय, मला पहिली गोष्ट वाटते [???] व्यापकपणे सांगायचे तर, तुम्ही नर्सिंगमध्ये जाण्याचे का निवडले?\nमुलाखत घेणारा: कारण मला प्रशिक्षण आणि नोकरीसाठी एकाच वेळी पैसे दिले गेले. 70 च्या दशकात, नोकऱ्या आणि रोजगारामध्ये गोष्टी खूप वेगळ्या होत्या..."
-    #text="नागपूर:महाविकास आघाडीचा मुंबईत मोठा मेळावा झाला. या मेळाव्यात मुख्यमंत्रिपदाचा उमेदवार कोण? हा विषय जास्त गाजला. उद्धव ठाकरेंनी मुख्यमंत्रिपदाचा उमेदवार कोण हे जाहीर करा, मी पाठींबा देतो असे वक्तव्य केले. पण त्याला राष्ट्रवादी काँग्रेसचे अध्यक्ष शरद पवार यांनी प्रतिसाद दिला नाही. त्यांना यावर बोलणेच टाळले. तर काँग्रेस प्रदेशाध्यक्ष नाना पटोलेंनी मात्र आधी निवडणूक जिंकू नंतर मुख्यमंत्री ठरवू अशी भूमिका मांडली. यावर आता संजय राऊत यांनी प्रतिक्रिया दिली आहे. मला मुख्यमंत्री व्हायचे आहे असे उद्धव ठाकरे कधीच बोलले नाहीत असं राऊत यांनी स्पष्ट केले आहे. मात्र त्या पुढे जे वक्तव्य त्यांनी केलं त्यामुळे मविआमध्ये पुन्हा एकदा ठिणगी पडण्याची शक्यता आहे. "
+    logger.info("Started transciption through llama")
     response = ollama.generate(model= "llama3.1", prompt = "Translate the following text to English:"+text+"\n SUMMARY:\n")
     translation = response["response"]
     return translation
 
-
 #Using Ollama and llama3.1 modle, summarize the English translation
-def summarize(text):
-    #Uncomment the following line to test the summarization if don't the audio file
-    #text = "Interviewer: We are talking with Jenny. So what is your current occupation?\nInterviewee: I am an assistant director [???] basically [???].\nInterviewer: And so how long you have been in this particular position?\nInterviewer: We are talking with Jenny. So what is your current occupation?\nInterviewee: I am an assistant director [???] basically [???].\nInterviewer: And so how long you have been in this particular position?\nInterviewee: I am in this particular position - it has been 4 years.\nInterviewer: Are you able to briefly describe your work or career history to date?\nInterviewee: My career has been, it initially started with a lot of clinical roles in very different areas of specialization within the nursing [???] industry and [???] plastics [???] to whole different variety and then I moved into rehabs. I was [???] for 15 years and then basically moved into management role when I was 26 and had been working in the management role for the last 27 years and yeah, about 20 years I have been working in management, and basically did a rehab degree in rehab counseling, which I think played a [???], so [???] sort of varying delay in some respects from the traditional clinical role of nursing.\nInterviewer: Yeah, sort of I guess first thing [???] broadly speaking, why did you choose to go into nursing?\nInterviewee: Because I was paid to train and employed at the same time. In the 70s, things were very different in [???] of jobs and employment...nterviewee: I am in this particular position - it has been 4 years.]nInterviewer: Are you able to briefly describe your work or career history to date?\nInterviewee: My career has been, it initially started with a lot of clinical roles in very different areas of specialization within the nursing [???] industry and [???] plastics [???] to whole different variety and then I moved into rehabs. I was [???] for 15 years and then basically moved into management role when I was 26 and had been working in the management role for the last 27 years and yeah, about 20 years I have been working in management, and basically did a rehab degree in rehab counseling, which I think played a [???], so [???] sort of varying delay in some respects from the traditional clinical role of nursing.\nInterviewer: Yeah, sort of I guess first thing [???] broadly speaking, why did you choose to go into nursing?\nInterviewee: Because I was paid to train and employed at the same time. In the 70s, things were very different in [???] of jobs and employment..."
-    #response = ollama.generate(model='llama3.1', prompt="Write a concise summary of the text that cover the key points of the textspacing_size=gr.themes.sizes.spacing_sm, radius_size=gr.themes.sizes.radius_none.\n SUMMARY: \N"+text)
-    response = ollama.generate(model= "llama3.1", prompt = "summarize the following text:"+text+"\n SUMMARY:\n")
+def summarize_using_llama(text):
+    response = ollama.generate(model= "llama3.1", prompt = "Provide the summary wiht bullet points:"+text+"\n SUMMARY:\n")
     summary = response["response"]
     return summary
 
 
+#Using openaie, summarize the English translation
+def summarize_using_openai(text):
+    logger.info("Started summarization")
+    prompt = "Summarize the following text: " +text
+    try:
+        response = openai.chat.completions.create(
+            model="gpt-4o",
+            messages=[
+                {"role": "system", "content": "You are a helpful assistant that extracts information from Indian multilingual text."},
+                {"role": "user", "content": prompt}
+            ],
+            max_tokens=500
+        )
+        summary  = response.choices[0].message.content
+    except Exception as e:
+        logger.error(e)
+        summary = "Unable to  exract summary"
+    return summary
+
+
 #UI with tabs, 
 theme = gr.themes.Glass(spacing_size="lg", radius_size="lg",primary_hue="blue", font=["Optima","Candara"])
-with gr.Blocks(theme) as block:
+with gr.Blocks(theme, title="Voice Summarization") as block:
     #Tab for recording the audio and upload it for transription, translation and summarization
     with gr.Tab("Record"):
         with gr.Row():
@@ -64,14 +91,15 @@ def summarize(text):
                 elem_classes=["primary"]
             )
         with gr.Row():
-            out_transcribe = gr.TextArea(label="Transcipt")
+            #out_transcribe = gr.TextArea(label="Transcipt")
             out_translate = gr.TextArea(label="Translate")
         with gr.Row():
             out_summary = gr.TextArea(label="Call Summary")
         with gr.Row():   
             submit_btn = gr.Button("Submit")
 
-        submit_btn.click(transcribe, inputs=[inp_audio], outputs=[out_transcribe,out_translate, out_summary])
+        #submit_btn.click(transcribe, inputs=[inp_audio], outputs=[out_transcribe,out_translate, out_summary])
+        submit_btn.click(process_all_steps, inputs=[inp_audio], outputs=[out_translate, out_summary])
 
     #Tab for uploading the audio file for transription, translation and summarization
     with gr.Tab("Upload"):

diff --git a/audio.mp4 b/audio.mp4
diff --git a/config.py b/config.py
@@ -4,5 +4,6 @@
 load_dotenv()
 
 openai_api_key = os.getenv("OPENAI_KEY")
-model_id = os.getenv('MODEL_ID', 'large-v3')
-model_path = os.getenv('MODEL_PATH', 'whisper_model')
+#model_id = os.getenv('MODEL_ID', 'large-v3')
+model_id = os.getenv('MODEL_ID')
+model_path = os.getenv('MODEL_PATH')
diff --git a/load_model.py b/load_model.py
@@ -4,7 +4,8 @@
 #load the whisper model from net if it isn't stored locally
 def load_model(model_id, model_path):
     #check GPU is avaialbe
-    device = "cuda" if torch.cuda.is_available() else "cpu"
+    #device = "cuda" if torch.cuda.is_available() else "cpu"
+    device = "cpu"
     model = whisper.load_model(model_id, device=device, download_root=model_path)
     print(
         f"Model will be run on {device}\n"

diff --git a/requirements.txt b/requirements.txt
@@ -2,3 +2,6 @@ openai-whisper
 ollama
 gradio
 load_dotenv
+openai
+logging
+logging-conf
-Original file line number
+Diff line change
@@ Expand Up / @@ -2,3 +2,6 @@ openai-whisper @@
     ollama
     gradio
     load_dotenv
+    openai
+    logging
+    logging-conf