Robert
2024-05-09 18:12:23 -07:00
parent ed966d2fb7
commit 828665d9c6
43 changed files with 101 additions and 102 deletions

.gitignore (vendored): binary file not shown.

View File

@@ -65,6 +65,7 @@ GUI
4. Llama.cpp
5. Kobold.cpp
6. Oobabooga
7. HuggingFace
- **Planned to Support**
1. TabbyAPI
@@ -203,6 +204,11 @@ By default videos, transcriptions and summaries are stored in a folder with the
* `llama3-8b-8192`
* `llama3-70b-8192`
* `mixtral-8x7b-32768`
- HuggingFace:
* `CohereForAI/c4ai-command-r-plus`
* `meta-llama/Meta-Llama-3-70B-Instruct`
* `meta-llama/Meta-Llama-3-8B-Instruct`
* Any model hosted there should work; these are the ones the free demo instance uses, listed for reference in case you'd like to host your own (a minimal call sketch follows the list below).
- OpenAI:
* `gpt-4-turbo`
* `gpt-4-turbo-preview`
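For self-hosting, here is a minimal sketch of calling the Hugging Face serverless Inference API with one of the models listed above. The endpoint and payload shape follow the Inference API docs; the token and prompt are placeholders:

import requests

API_URL = "https://api-inference.huggingface.co/models/meta-llama/Meta-Llama-3-8B-Instruct"
headers = {"Authorization": "Bearer <huggingface_api_token>"}  # placeholder token
payload = {"inputs": "Summarize: <transcript text>", "parameters": {"max_new_tokens": 512}}

response = requests.post(API_URL, headers=headers, json=payload)
response.raise_for_status()
print(response.json())  # text-generation models return [{"generated_text": ...}]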

View File

@@ -7,6 +7,9 @@ groq_api_key = idk
groq_model = FIXME
openai_api_key = <openai_api_key>
openai_model = gpt-4-turbo
huggingface_api_token = <huggingface_api_token>
huggingface_model = CohereForAI/c4ai-command-r-plus
[Local-API]
kobold_api_key = <kobold api key>
@@ -16,9 +19,11 @@ llama_api_IP = http://127.0.0.1:8080/completion
ooba_api_key = <ooba api key>
ooba_api_IP = http://127.0.0.1:5000/v1/chat/completions
[Paths]
output_path = Results
logging_file = Logs
[Processing]
processing_choice = cuda

View File

@@ -70,12 +70,14 @@ anthropic_api_key = config.get('API', 'anthropic_api_key', fallback=None)
cohere_api_key = config.get('API', 'cohere_api_key', fallback=None)
groq_api_key = config.get('API', 'groq_api_key', fallback=None)
openai_api_key = config.get('API', 'openai_api_key', fallback=None)
huggingface_api_token = config.get('API', 'huggingface_api_token', fallback=None)
# Models
anthropic_model = config.get('API', 'anthropic_model', fallback='claude-3-sonnet-20240229')
cohere_model = config.get('API', 'cohere_model', fallback='command-r-plus')
groq_model = config.get('API', 'groq_model', fallback='FIXME')
openai_model = config.get('API', 'openai_model', fallback='gpt-4-turbo')
huggingface_model = config.get('API', 'huggingface_model', fallback='CohereForAI/c4ai-command-r-plus')
# Local-Models
kobold_api_IP = config.get('Local-API', 'kobold_api_IP', fallback='http://127.0.0.1:5000/api/v1/generate')
@@ -329,6 +331,27 @@ def process_local_file(file_path):
# Video Download/Handling
#
def process_url(input_path, api_name=None, api_key=None, num_speakers=2, whisper_model="small.en", offset=0, vad_filter=False, download_video_flag=False):
try:
results = main(input_path, api_name=api_name, api_key=api_key, num_speakers=num_speakers, whisper_model=whisper_model, offset=offset, vad_filter=vad_filter, download_video_flag=download_video_flag)
if results:
transcription_result = results[0]
json_file_path = transcription_result['audio_file'].replace('.wav', '.segments.json')
with open(json_file_path, 'r') as file:
json_data = json.load(file)
summary = transcription_result.get('summary', '')
return json_data, summary, json_file_path, json_file_path.replace('.segments.json', '_summary.txt')
else:
return None, "No results found.", None, None
except Exception as e:
error_message = f"An error occurred: {str(e)}"
return None, error_message, None, None
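A hedged usage sketch of the function above; the URL is a placeholder, and on failure the second slot of the returned four-tuple carries the error message:

segments, summary, segments_path, summary_path = process_url(
    "https://www.example.com/some-video",  # placeholder URL
    api_name="huggingface",
    api_key="<huggingface_api_token>",
)
if segments is None:
    print("Processing failed:", summary)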
def create_download_directory(title):
base_dir = "Results"
# Remove characters that are illegal in Windows filenames and normalize
@@ -1110,24 +1133,43 @@ def save_summary_to_file(summary, file_path):
# Gradio UI
#
(Removed: the duplicate process_url definition that previously lived here; the surviving copy is the one added above.)
# Only to be used when configured with Gradio for HF Space
def summarize_with_huggingface(api_key, file_path):
    try:
        logging.debug("huggingface: Loading json data for summarization")
        with open(file_path, 'r') as file:
            segments = json.load(file)
        logging.debug("huggingface: Extracting text from the segments")
        text = extract_text_from_segments(segments)
        # Prefer the key passed in; fall back to the token from the config file
        API_TOKEN = api_key or huggingface_api_token
        headers = {"Authorization": f"Bearer {API_TOKEN}"}
        logging.debug("huggingface: Creating query...")
        # The Inference API expects a JSON body of the form {"inputs": ...}
        data = {"inputs": text, "parameters": {"max_new_tokens": 4096}}
        API_URL = f"https://api-inference.huggingface.co/models/{huggingface_model}"
        response = requests.post(API_URL, headers=headers, json=data)
        if response.status_code == 200:
            # Text-generation models return a list: [{"generated_text": ...}]
            summary = response.json()[0]['generated_text'].strip()
            logging.debug("huggingface: Summarization successful")
            print("Summarization successful.")
            return summary
        else:
            logging.debug("huggingface: Summarization failed")
            print("Failed to process summary:", response.text)
            return None
    except Exception as e:
        logging.debug("huggingface: Error in processing: %s", str(e))
        print("Error occurred while processing summary with huggingface:", str(e))
        return None
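A minimal usage sketch, assuming a segments file produced by an earlier process_url run (paths are hypothetical):

summary = summarize_with_huggingface(huggingface_api_token, "Results/video.segments.json")
if summary:
    save_summary_to_file(summary, "Results/video.segments.json")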
def same_auth(username, password):
return username == password
@@ -1142,7 +1184,7 @@ def launch_ui():
fn=process_url,
inputs=[
gr.components.Textbox(label="URL"),
gr.components.Dropdown(choices=["openai", "anthropic", "cohere", "groq", "llama", "kobold", "ooba"], label="API Name"),
gr.components.Dropdown(choices=["huggingface", "openai", "anthropic", "cohere", "groq", "llama", "kobold", "ooba"], label="API Name"),
gr.components.Textbox(label="API Key"),
gr.components.Number(value=2, label="Number of Speakers"),
gr.components.Dropdown(choices=whisper_models, value="small.en", label="Whisper Model"),
@@ -1161,64 +1203,8 @@ def launch_ui():
allow_flagging="never"
)
# FIXME - c/p from openai - only to be used when configured with Gradio for HF Space
def summarize_with_huggingface(api_key, file_path):
try:
logging.debug("openai: Loading json data for summarization")
with open(file_path, 'r') as file:
segments = json.load(file)
logging.debug("openai: Extracting text from the segments")
text = extract_text_from_segments(segments)
headers = {
'Authorization': f'Bearer {api_key}',
'Content-Type': 'application/json'
}
logging.debug("openai: Preparing data + prompt for submittal")
prompt_text = f"{text} \n\n\n\nPlease provide a detailed, bulleted list of the points made throughout the transcribed video and any supporting arguments made for said points"
data = {
"model": "CohereForAI/c4ai-command-r-plus",
"messages": [
{
"role": "system",
"content": "You are a professional summarizer."
},
{
"role": "user",
"content": prompt_text
}
],
"max_tokens": 4096, # Adjust tokens as needed
"temperature": 0.7
}
logging.debug("openai: Posting request")
response = requests.post('https://api.openai.com/v1/chat/completions', headers=headers, json=data)
if response.status_code == 200:
summary = response.json()['choices'][0]['message']['content'].strip()
logging.debug("openai: Summarization successful")
print("Summarization successful.")
return summary
else:
logging.debug("openai: Summarization failed")
print("Failed to process summary:", response.text)
return None
except Exception as e:
logging.debug("openai: Error in processing: %s", str(e))
print("Error occurred while processing summary with openai:", str(e))
return None
def same_auth(username, password):
return username == password
iface.launch(auth=same_auth,share=True)
#iface.launch(auth=same_auth,share=False)
iface.launch()
#
#
@@ -1235,6 +1221,8 @@ def summarize_with_huggingface(api_key, file_path):
#
def main(input_path, api_name=None, api_key=None, num_speakers=2, whisper_model="small.en", offset=0, vad_filter=False, download_video_flag=False):
if input_path is None and args.user_interface:
return []
start_time = time.monotonic()
paths = [] # Initialize paths as an empty list
if os.path.isfile(input_path) and input_path.endswith('.txt'):
@@ -1373,40 +1361,40 @@ if __name__ == "__main__":
if args.user_interface:
launch_ui()
else:
if not args.input_path:
parser.print_help()
sys.exit(1)
logging.basicConfig(level=getattr(logging, args.log_level), format='%(asctime)s - %(levelname)s - %(message)s')
logging.info('Starting the transcription and summarization process.')
logging.info(f'Input path: {args.input_path}')
logging.info(f'API Name: {args.api_name}')
logging.debug(f'API Key: {args.api_key}') # ehhhhh
logging.info(f'Number of speakers: {args.num_speakers}')
logging.info(f'Whisper model: {args.whisper_model}')
logging.info(f'Offset: {args.offset}')
logging.info(f'VAD filter: {args.vad_filter}')
logging.info(f'Log Level: {args.log_level}') #lol
if args.api_name and args.api_key:
logging.info(f'API: {args.api_name}')
logging.info('Summarization will be performed.')
else:
logging.info('No API specified. Summarization will not be performed.')
logging.debug("Platform check being performed...")
platform_check()
logging.debug("CUDA check being performed...")
cuda_check()
logging.debug("ffmpeg check being performed...")
check_ffmpeg()
logging.debug("Platform check being performed...")
platform_check()
logging.debug("CUDA check being performed...")
cuda_check()
logging.debug("ffmpeg check being performed...")
check_ffmpeg()
try:
results = main(args.input_path, api_name=args.api_name, api_key=args.api_key, num_speakers=args.num_speakers, whisper_model=args.whisper_model, offset=args.offset, vad_filter=args.vad_filter, download_video_flag=args.video)
logging.info('Transcription process completed.')
except Exception as e:
logging.error('An error occurred during the transcription process.')
logging.error(str(e))
sys.exit(1)