Spaces:

seiching
/

ainotes

Sleeping

App Files Files Community

seiching committed on Feb 29

Commit

5e5f20d

•

1 Parent(s): 44d039c

add summary

Browse files

Files changed (1) hide show

app.py +27 -5

app.py CHANGED Viewed

@@ -41,6 +41,24 @@ def call_openai_api(openaiobj,transcription):
         ]
     )
     return response.choices[0].message.content
 def split_into_chunks(text, tokens=3500):
@@ -70,8 +88,11 @@ def process_chunks(openaikeystr,inputtext):
     chunks = split_into_chunks(text)
     response=''
     for chunk in chunks:
-       response=response+call_openai_api(openaiobj,chunk)
-    return response
     # # Processes chunks in parallel
     # with ThreadPoolExecutor() as executor:
     #     responses = list(executor.map(call_openai_api, [openaiobj,chunks]))
@@ -188,7 +209,8 @@ def writenotes( apikeystr,inputscript):
   print('ok')
   if len(inputscript)>10:
     transcribe_text=inputscript
-    ainotestext=process_chunks(apikeystr,transcribe_text)
    # ainotestext=inputscript
   #ainotestext=""
   # with open('asr_resul.txt', 'w') as f:
@@ -200,13 +222,13 @@ def writenotes( apikeystr,inputscript):
   return ainotestext
 ainotes = gr.Interface(
     fn=writenotes,
-    inputs=[gr.Textbox(label="OPEN AI API KEY",placeholder="請輸入sk..."),gr.Textbox(label="逐字稿",placeholder="請輸入逐字稿")],
     outputs="text",
     layout="horizontal",
     theme="huggingface",
     title="會議紀錄小幫手AINotes",
     description=(
-        "可由麥克風錄音或上傳語音檔"
         f" 使用這個模型 [{MODEL_NAME}](https://huggingface.co/{MODEL_NAME}) 先做語音辨識再做會議紀錄摘要"
         " 長度沒有限制"
     ),

         ]
     )
     return response.choices[0].message.content
+def call_openai_summary(openaiobj,transcription):
+    response = openaiobj.chat.completions.create(
+        model="gpt-3.5-turbo",
+        temperature=0,
+        messages=[
+            {
+                "role": "system",
+                "content": "你是專業的文書處理員，請根據由語音辨識軟體將會議錄音所轉錄的逐字稿，摘錄重點，要用比較正式及容易閱讀的寫法，避免口語化"
+            },
+            {
+                "role": "user",
+                "content": transcription
+            }
+        ]
+    )
+    return response.choices[0].message.content
 def split_into_chunks(text, tokens=3500):
     chunks = split_into_chunks(text)
     response=''
     for chunk in chunks:
+      #response=response+call_openai_api(openaiobj,chunk)
+       response=response+call_openai_summary(openaiobj,chunk)
+    finalresponse=response+' summary \n\n' +call_openai_api(openaiobj,response)
+    return finalresponse
     # # Processes chunks in parallel
     # with ThreadPoolExecutor() as executor:
     #     responses = list(executor.map(call_openai_api, [openaiobj,chunks]))
   print('ok')
   if len(inputscript)>10:
     transcribe_text=inputscript
+  ainotestext=process_chunks(apikeystr,transcribe_text)
    # ainotestext=inputscript
   #ainotestext=""
   # with open('asr_resul.txt', 'w') as f:
   return ainotestext
 ainotes = gr.Interface(
     fn=writenotes,
+    inputs=[gr.Textbox(label="OPEN AI API KEY",placeholder="請輸入sk..."),gr.Textbox(label="逐字稿",placeholder="若沒有做語音辨識，請輸入逐字稿")],
     outputs="text",
     layout="horizontal",
     theme="huggingface",
     title="會議紀錄小幫手AINotes",
     description=(
+        "可由麥克風錄音或上傳語音檔若有逐字稿可以直接貼在逐字稿"
         f" 使用這個模型 [{MODEL_NAME}](https://huggingface.co/{MODEL_NAME}) 先做語音辨識再做會議紀錄摘要"
         " 長度沒有限制"
     ),