Eh

rmusser01 · May 10, 2024 · 828665d · 828665d
1 parent ed966d2
commit 828665d
Show file tree

Hide file tree

Showing 43 changed files with 103 additions and 104 deletions.
diff --git a/.gitignore b/.gitignore
diff --git a/README.md b/README.md
@@ -65,6 +65,7 @@ GUI
   4. Llama.cpp
   5. Kobold.cpp
   6. Oobabooga
+  7. HuggingFace
 - **Planned to Support**
   1. TabbyAPI
 
@@ -203,6 +204,11 @@ By default videos, transcriptions and summaries are stored in a folder with the
       * `llama3-8b-8192`
       * `llama3-70b-8192`
       * `mixtral-8x7b-32768`
+    - HuggingFace:
+      * `CohereForAI/c4ai-command-r-plus`
+      * `meta-llama/Meta-Llama-3-70B-Instruct`
+      * `meta-llama/Meta-Llama-3-8B-Instruct`
+      * Supposedly any model hosted on HuggingFace can be used; the models above are listed as a reference for what the free demo instance uses, in case you'd like to host your own.
     - OpenAI:
       * `gpt-4-turbo`
       * `gpt-4-turbo-preview`

diff --git a/config.txt b/config.txt
@@ -7,6 +7,9 @@ groq_api_key = idk
 groq_model = FIXME
 openai_api_key = <openai_api_key>
 openai_model = gpt-4-turbo
+huggingface_api_token = <huggingface_api_token>
+huggingface_model = CohereForAI/c4ai-command-r-plus
+
 
 [Local-API]
 kobold_api_key = <kobold api key>
@@ -16,9 +19,11 @@ llama_api_IP = http://127.0.0.1:8080/completion
 ooba_api_key = <ooba api key>
 ooba_api_IP = http://127.0.0.1:5000/v1/chat/completions
 
+
 [Paths]
 output_path = Results
 logging_file = Logs
 
+
 [Processing]
 processing_choice = cuda
diff --git a/summarize.py b/summarize.py
@@ -70,12 +70,14 @@
 cohere_api_key = config.get('API', 'cohere_api_key', fallback=None)
 groq_api_key = config.get('API', 'groq_api_key', fallback=None)
 openai_api_key = config.get('API', 'openai_api_key', fallback=None)
+huggingface_api_token = config.get('API', 'huggingface_api_token', fallback=None)  # key must match the huggingface_api_token entry in config.txt
 
 # Models
 anthropic_model = config.get('API', 'anthropic_model', fallback='claude-3-sonnet-20240229')
 cohere_model = config.get('API', 'cohere_model', fallback='command-r-plus')
 groq_model = config.get('API', 'groq_model', fallback='FIXME')
 openai_model = config.get('API', 'openai_model', fallback='gpt-4-turbo')
+huggingface_model = config.get('API', 'huggingface_model', fallback='CohereForAI/c4ai-command-r-plus')
 
 # Local-Models
 kobold_api_IP = config.get('Local-API', 'kobold_api_IP', fallback='http://127.0.0.1:5000/api/v1/generate')
@@ -329,6 +331,27 @@ def process_local_file(file_path):
 # Video Download/Handling
 #
 
+def process_url(input_path, api_name=None, api_key=None, num_speakers=2, whisper_model="small.en", offset=0, vad_filter=False, download_video_flag=False):
+    try:
+        results = main(input_path, api_name=api_name, api_key=api_key, num_speakers=num_speakers, whisper_model=whisper_model, offset=offset, vad_filter=vad_filter, download_video_flag=download_video_flag)
+
+        if results:
+            transcription_result = results[0]
+            json_file_path = transcription_result['audio_file'].replace('.wav', '.segments.json')
+            with open(json_file_path, 'r') as file:
+                json_data = json.load(file)
+
+            summary = transcription_result.get('summary', '')
+
+            return json_data, summary, json_file_path, json_file_path.replace('.segments.json', '_summary.txt')
+        else:
+            return None, "No results found.", None, None
+    except Exception as e:
+        error_message = f"An error occurred: {str(e)}"
+        return None, error_message, None, None
+
+
+
 def create_download_directory(title):
     base_dir = "Results"
     # Remove characters that are illegal in Windows filenames and normalize
@@ -1110,24 +1133,43 @@ def save_summary_to_file(summary, file_path):
 # Gradio UI
 #
 
-def process_url(input_path, api_name=None, api_key=None, num_speakers=2, whisper_model="small.en", offset=0, vad_filter=False, download_video_flag=False):
+# Only to be used when configured with Gradio for HF Space
+def summarize_with_huggingface(api_key, file_path):
     try:
-        results = main(input_path, api_name=api_name, api_key=api_key, num_speakers=num_speakers, whisper_model=whisper_model, offset=offset, vad_filter=vad_filter, download_video_flag=download_video_flag)
+        logging.debug("huggingface: Loading json data for summarization")
+        with open(file_path, 'r') as file:
+            segments = json.load(file)
 
-        if results:
-            transcription_result = results[0]
-            json_file_path = transcription_result['audio_file'].replace('.wav', '.segments.json')
-            with open(json_file_path, 'r') as file:
-                json_data = json.load(file)
-
-            summary = transcription_result.get('summary', '')
-
-            return json_data, summary, json_file_path, json_file_path.replace('.segments.json', '_summary.txt')
+        logging.debug("huggingface: Extracting text from the segments")
+        text = extract_text_from_segments(segments)
+
+        API_TOKEN = huggingface_api_token
+        headers = {"Authorization": f"Bearer {API_TOKEN}"}
+
+        logging.debug("huggingface: Creating query...")
+        data = query("Can you please let us know more details about your ")
+
+        API_URL = f"https://api-inference.huggingface.co/models/{huggingface_model}"
+        response = requests.post(API_URL, headers=headers, json=data)
+
+        if response.status_code == 200:
+            summary = response.json()['choices'][0]['message']['content'].strip()
+            logging.debug("huggingface: Summarization successful")
+            print("Summarization successful.")
+            return summary
         else:
-            return None, "No results found.", None, None
+            logging.debug("huggingface: Summarization failed")
+            print("Failed to process summary:", response.text)
+            return None
     except Exception as e:
-        error_message = f"An error occurred: {str(e)}"
-        return None, error_message, None, None
+        logging.debug("huggingface: Error in processing: %s", str(e))
+        print("Error occurred while processing summary with huggingface:", str(e))
+        return None
+
+
+
+    def same_auth(username, password):
+        return username == password
 
 
 
@@ -1142,7 +1184,7 @@ def process_transcription(json_data):
         fn=process_url,
         inputs=[
             gr.components.Textbox(label="URL"),
-            gr.components.Dropdown(choices=["openai", "anthropic", "cohere", "groq", "llama", "kobold", "ooba"], label="API Name"),
+            gr.components.Dropdown(choices=["huggingface", "openai", "anthropic", "cohere", "groq", "llama", "kobold", "ooba"], label="API Name"),
             gr.components.Textbox(label="API Key"),
             gr.components.Number(value=2, label="Number of Speakers"),
             gr.components.Dropdown(choices=whisper_models, value="small.en", label="Whisper Model"),
@@ -1161,64 +1203,8 @@ def process_transcription(json_data):
         allow_flagging="never"
     )
 
-
-# FIXME - c/p from openai - only to be used when configured with Gradio for HF Space
-def summarize_with_huggingface(api_key, file_path):
-    try:
-        logging.debug("openai: Loading json data for summarization")
-        with open(file_path, 'r') as file:
-            segments = json.load(file)
-
-        logging.debug("openai: Extracting text from the segments")
-        text = extract_text_from_segments(segments)
-
-        headers = {
-            'Authorization': f'Bearer {api_key}',
-            'Content-Type': 'application/json'
-        }
-
-        logging.debug("openai: Preparing data + prompt for submittal")
-        prompt_text = f"{text} \n\n\n\nPlease provide a detailed, bulleted list of the points made throughout the transcribed video and any supporting arguments made for said points"
-        data = {
-            "model": "CohereForAI/c4ai-command-r-plus",
-            "messages": [
-                {
-                    "role": "system",
-                    "content": "You are a professional summarizer."
-                },
-                {
-                    "role": "user",
-                    "content": prompt_text
-                }
-            ],
-            "max_tokens": 4096,  # Adjust tokens as needed
-            "temperature": 0.7
-        }
-        logging.debug("openai: Posting request")
-        response = requests.post('https://api.openai.com/v1/chat/completions', headers=headers, json=data)
-
-        if response.status_code == 200:
-            summary = response.json()['choices'][0]['message']['content'].strip()
-            logging.debug("openai: Summarization successful")
-            print("Summarization successful.")
-            return summary
-        else:
-            logging.debug("openai: Summarization failed")
-            print("Failed to process summary:", response.text)
-            return None
-    except Exception as e:
-        logging.debug("openai: Error in processing: %s", str(e))
-        print("Error occurred while processing summary with openai:", str(e))
-        return None
-
-
-
-    def same_auth(username, password):
-        return username == password
-
-
-
-    iface.launch(auth=same_auth,share=True)
+    #iface.launch(auth=same_auth,share=False)
+    iface.launch()
 
 #
 #
@@ -1235,6 +1221,8 @@ def same_auth(username, password):
 #
 
 def main(input_path, api_name=None, api_key=None, num_speakers=2, whisper_model="small.en", offset=0, vad_filter=False, download_video_flag=False):
+    if input_path is None and args.user_interface:
+        return []
     start_time = time.monotonic()
     paths = []  # Initialize paths as an empty list
     if os.path.isfile(input_path) and input_path.endswith('.txt'):
@@ -1373,40 +1361,40 @@ def main(input_path, api_name=None, api_key=None, num_speakers=2, whisper_model=
     if args.user_interface:
         launch_ui()
     else:
-        if args.input_path is None:
+        if not args.input_path:
             parser.print_help()
             sys.exit(1)
 
-    logging.basicConfig(level=getattr(logging, args.log_level), format='%(asctime)s - %(levelname)s - %(message)s')
-
-    logging.info('Starting the transcription and summarization process.')
-    logging.info(f'Input path: {args.input_path}')
-    logging.info(f'API Name: {args.api_name}')
-    logging.debug(f'API Key: {args.api_key}') # ehhhhh
-    logging.info(f'Number of speakers: {args.num_speakers}')
-    logging.info(f'Whisper model: {args.whisper_model}')
-    logging.info(f'Offset: {args.offset}')
-    logging.info(f'VAD filter: {args.vad_filter}')
-    logging.info(f'Log Level: {args.log_level}') #lol
-
-    if args.api_name and args.api_key:
-        logging.info(f'API: {args.api_name}')
-        logging.info('Summarization will be performed.')
-    else:
-        logging.info('No API specified. Summarization will not be performed.')
+        logging.basicConfig(level=getattr(logging, args.log_level), format='%(asctime)s - %(levelname)s - %(message)s')
+
+        logging.info('Starting the transcription and summarization process.')
+        logging.info(f'Input path: {args.input_path}')
+        logging.info(f'API Name: {args.api_name}')
+        logging.debug(f'API Key: {args.api_key}') # ehhhhh
+        logging.info(f'Number of speakers: {args.num_speakers}')
+        logging.info(f'Whisper model: {args.whisper_model}')
+        logging.info(f'Offset: {args.offset}')
+        logging.info(f'VAD filter: {args.vad_filter}')
+        logging.info(f'Log Level: {args.log_level}') #lol
+
+        if args.api_name and args.api_key:
+            logging.info(f'API: {args.api_name}')
+            logging.info('Summarization will be performed.')
+        else:
+            logging.info('No API specified. Summarization will not be performed.')
 
-    logging.debug("Platform check being performed...")
-    platform_check()
-    logging.debug("CUDA check being performed...")
-    cuda_check()
-    logging.debug("ffmpeg check being performed...")
-    check_ffmpeg()
+        logging.debug("Platform check being performed...")
+        platform_check()
+        logging.debug("CUDA check being performed...")
+        cuda_check()
+        logging.debug("ffmpeg check being performed...")
+        check_ffmpeg()
 
-    try:
-        results = main(args.input_path, api_name=args.api_name, api_key=args.api_key, num_speakers=args.num_speakers, whisper_model=args.whisper_model, offset=args.offset, vad_filter=args.vad_filter, download_video_flag=args.video)
-        logging.info('Transcription process completed.')
-    except Exception as e:
-        logging.error('An error occurred during the transcription process.')
-        logging.error(str(e))
-        sys.exit(1)
+        try:
+            results = main(args.input_path, api_name=args.api_name, api_key=args.api_key, num_speakers=args.num_speakers, whisper_model=args.whisper_model, offset=args.offset, vad_filter=args.vad_filter, download_video_flag=args.video)
+            logging.info('Transcription process completed.')
+        except Exception as e:
+            logging.error('An error occurred during the transcription process.')
+            logging.error(str(e))
+            sys.exit(1)
 
diff --git a/Samples/compare/aoe-english.json → ...-scripts/Samples/compare/aoe-english.json b/Samples/compare/aoe-english.json → ...-scripts/Samples/compare/aoe-english.json
diff --git a/Samples/compare/aoe.yaml → ...original-scripts/Samples/compare/aoe.yaml b/Samples/compare/aoe.yaml → ...original-scripts/Samples/compare/aoe.yaml
diff --git a/Samples/compare/ufo-13b-english.json → ...ipts/Samples/compare/ufo-13b-english.json b/Samples/compare/ufo-13b-english.json → ...ipts/Samples/compare/ufo-13b-english.json
diff --git a/Samples/compare/ufo-13b.yaml → ...inal-scripts/Samples/compare/ufo-13b.yaml b/Samples/compare/ufo-13b.yaml → ...inal-scripts/Samples/compare/ufo-13b.yaml
diff --git a/Samples/compare/ufo-english.json → ...-scripts/Samples/compare/ufo-english.json b/Samples/compare/ufo-english.json → ...-scripts/Samples/compare/ufo-english.json
diff --git a/Samples/compare/ufo.yaml → ...original-scripts/Samples/compare/ufo.yaml b/Samples/compare/ufo.yaml → ...original-scripts/Samples/compare/ufo.yaml
diff --git a/...Carlson (2023) [zaB_20bkoA4].diarize.json → ...Carlson (2023) [zaB_20bkoA4].diarize.json b/...Carlson (2023) [zaB_20bkoA4].diarize.json → ...Carlson (2023) [zaB_20bkoA4].diarize.json
diff --git a/...er Carlson (2023) [zaB_20bkoA4].info.json → ...er Carlson (2023) [zaB_20bkoA4].info.json b/...er Carlson (2023) [zaB_20bkoA4].info.json → ...er Carlson (2023) [zaB_20bkoA4].info.json
diff --git a/...Carlson (2023) [zaB_20bkoA4].summary.json → ...Carlson (2023) [zaB_20bkoA4].summary.json b/...Carlson (2023) [zaB_20bkoA4].summary.json → ...Carlson (2023) [zaB_20bkoA4].summary.json
diff --git a/...tory interview [YRvf00NooN8].diarize.json → ...tory interview [YRvf00NooN8].diarize.json b/...tory interview [YRvf00NooN8].diarize.json → ...tory interview [YRvf00NooN8].diarize.json
diff --git a/...factory interview [YRvf00NooN8].info.json → ...factory interview [YRvf00NooN8].info.json b/...factory interview [YRvf00NooN8].info.json → ...factory interview [YRvf00NooN8].info.json
diff --git a/...tory interview [YRvf00NooN8].summary.json → ...tory interview [YRvf00NooN8].summary.json b/...tory interview [YRvf00NooN8].summary.json → ...tory interview [YRvf00NooN8].summary.json
diff --git a/...he Resurgence) [jnoxjLJind4].diarize.json → ...he Resurgence) [jnoxjLJind4].diarize.json b/...he Resurgence) [jnoxjLJind4].diarize.json → ...he Resurgence) [jnoxjLJind4].diarize.json
diff --git a/... (The Resurgence) [jnoxjLJind4].info.json → ... (The Resurgence) [jnoxjLJind4].info.json b/... (The Resurgence) [jnoxjLJind4].info.json → ... (The Resurgence) [jnoxjLJind4].info.json
diff --git a/...n Podcast #185 [4dC_nRYIDZU].diarize.json → ...n Podcast #185 [4dC_nRYIDZU].diarize.json b/...n Podcast #185 [4dC_nRYIDZU].diarize.json → ...n Podcast #185 [4dC_nRYIDZU].diarize.json
diff --git a/...dman Podcast #185 [4dC_nRYIDZU].info.json → ...dman Podcast #185 [4dC_nRYIDZU].info.json b/...dman Podcast #185 [4dC_nRYIDZU].info.json → ...dman Podcast #185 [4dC_nRYIDZU].info.json
diff --git a/...n Podcast #185 [4dC_nRYIDZU].summary.json → ...n Podcast #185 [4dC_nRYIDZU].summary.json b/...n Podcast #185 [4dC_nRYIDZU].summary.json → ...n Podcast #185 [4dC_nRYIDZU].summary.json
diff --git a/...ffairs Hearing [KQ7Dw-739VY].diarize.json → ...ffairs Hearing [KQ7Dw-739VY].diarize.json b/...ffairs Hearing [KQ7Dw-739VY].diarize.json → ...ffairs Hearing [KQ7Dw-739VY].diarize.json
diff --git a/...n Affairs Hearing [KQ7Dw-739VY].info.json → ...n Affairs Hearing [KQ7Dw-739VY].info.json b/...n Affairs Hearing [KQ7Dw-739VY].info.json → ...n Affairs Hearing [KQ7Dw-739VY].info.json
diff --git a/...boros-l2-13b-gpt4-1.4.1_1691017407.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017407.ndjson b/...boros-l2-13b-gpt4-1.4.1_1691017407.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017407.ndjson
diff --git a/...boros-l2-13b-gpt4-1.4.1_1691017434.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017434.ndjson b/...boros-l2-13b-gpt4-1.4.1_1691017434.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017434.ndjson
diff --git a/...boros-l2-13b-gpt4-1.4.1_1691017487.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017487.ndjson b/...boros-l2-13b-gpt4-1.4.1_1691017487.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017487.ndjson
diff --git a/...boros-l2-13b-gpt4-1.4.1_1691017596.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017596.ndjson b/...boros-l2-13b-gpt4-1.4.1_1691017596.ndjson → ...boros-l2-13b-gpt4-1.4.1_1691017596.ndjson
diff --git a/...t-300_english_airoboros-l2-context.ndjson → ...t-300_english_airoboros-l2-context.ndjson b/...t-300_english_airoboros-l2-context.ndjson → ...t-300_english_airoboros-l2-context.ndjson
diff --git a/...l-300_english_airoboros-l2-context.ndjson → ...l-300_english_airoboros-l2-context.ndjson b/...l-300_english_airoboros-l2-context.ndjson → ...l-300_english_airoboros-l2-context.ndjson
diff --git a/...n-300_english_airoboros-l2-context.ndjson → ...n-300_english_airoboros-l2-context.ndjson b/...n-300_english_airoboros-l2-context.ndjson → ...n-300_english_airoboros-l2-context.ndjson
diff --git a/...x-300_english_airoboros-l2-context.ndjson → ...x-300_english_airoboros-l2-context.ndjson b/...x-300_english_airoboros-l2-context.ndjson → ...x-300_english_airoboros-l2-context.ndjson
diff --git a/...o-300_english_airoboros-l2-context.ndjson → ...o-300_english_airoboros-l2-context.ndjson b/...o-300_english_airoboros-l2-context.ndjson → ...o-300_english_airoboros-l2-context.ndjson
diff --git a/Samples/prompts/airoboros-l2-context.txt → .../Samples/prompts/airoboros-l2-context.txt b/Samples/prompts/airoboros-l2-context.txt → .../Samples/prompts/airoboros-l2-context.txt
diff --git a/tldw-scripts/chunker.py → tldw-original-scripts/chunker.py b/tldw-scripts/chunker.py → tldw-original-scripts/chunker.py
diff --git a/tldw-scripts/compare-app.py → tldw-original-scripts/compare-app.py b/tldw-scripts/compare-app.py → tldw-original-scripts/compare-app.py
diff --git a/tldw-scripts/compare.py → tldw-original-scripts/compare.py b/tldw-scripts/compare.py → tldw-original-scripts/compare.py
diff --git a/tldw-scripts/merger.py → tldw-original-scripts/merger.py b/tldw-scripts/merger.py → tldw-original-scripts/merger.py
diff --git a/tldw-scripts/params/summary.json → tldw-original-scripts/params/summary.json b/tldw-scripts/params/summary.json → tldw-original-scripts/params/summary.json
diff --git a/tldw-scripts/pyannote.py → tldw-original-scripts/pyannote.py b/tldw-scripts/pyannote.py → tldw-original-scripts/pyannote.py
diff --git a/tldw-scripts/roller-chatgpt-v2.py → tldw-original-scripts/roller-chatgpt-v2.py b/tldw-scripts/roller-chatgpt-v2.py → tldw-original-scripts/roller-chatgpt-v2.py
diff --git a/tldw-scripts/roller-chatgpt.py → tldw-original-scripts/roller-chatgpt.py b/tldw-scripts/roller-chatgpt.py → tldw-original-scripts/roller-chatgpt.py
diff --git a/tldw-scripts/roller-exllama.py → tldw-original-scripts/roller-exllama.py b/tldw-scripts/roller-exllama.py → tldw-original-scripts/roller-exllama.py
diff --git a/tldw-scripts/roller-vllm.py → tldw-original-scripts/roller-vllm.py b/tldw-scripts/roller-vllm.py → tldw-original-scripts/roller-vllm.py