update summary generation prompt and remove common answer prefixes

2026-03-10 08:51:17 +00:00 · 2023-08-05 12:32:47 -04:00
parent d198eda582
commit 2e9444b426
1 changed files with 11 additions and 4 deletions
--- a/roller-vllm.py
+++ b/roller-vllm.py
@@ -30,11 +30,16 @@ Consider the current context when summarizing the given transcription part.
 Respond ONLY with a JSON object with 3 keys in the following format:
 {
 Speaker-Map: A map of speakers to their names, for example { "SPEAKER 1": "Bob Dole", "SPEAKER 2": "Jane Doe" }.  Once a speaker is identified, it must not change.
- Summary: "A detailed, point-by-point summary of the current transcription.  Write at least five sentences, including details of all major points.",
+ Summary: "A detailed, point-by-point summary of the current transcription.  Include details of major points.  Write at least 3 sentences but no more then 6 sentences.",
 Next-Context: "List of topics from the transcription Summary above."
 }
 """

+answer_prefixes = [
+   "In this part of the transcription, ",
+   "In this transcription part, " 
+]
+
 import sys
 sys.path.append('../can-ai-code/')
 from interview_cuda import InterviewVLLM
@@ -82,6 +87,8 @@ def main(prefix: str, model_name: str, gpu_split: str = "", init_speakers: str =

        # the trailing } is sometimes lost
        if not answer.endswith('}'): answer += '}'
+        for prefix in answer_prefixes:
+            answer = answer.replace(prefix, '')

        #print(answer)
        answer_json = {}
@@ -96,9 +103,9 @@ def main(prefix: str, model_name: str, gpu_split: str = "", init_speakers: str =
            print(answer)
            print('Error parsing response: ', str(e))
        
-        summary = answer_json.get('Summary')
-        new_context = str(answer_json.get('Next-Context'))
-        new_speakers = str(answer_json.get('Speaker-Map'))
+        summary = answer_json.get('Summary','')
+        new_context = str(answer_json.get('Next-Context',''))
+        new_speakers = str(answer_json.get('Speaker-Map',''))

        if summary == '' or new_context == '' or new_speakers == '':
            print('extraction failed:', new_context, new_speakers, summary)