This commit is contained in:
Gigi
2025-03-29 19:43:42 +00:00
2 changed files with 133 additions and 8 deletions

View File

@@ -4,6 +4,7 @@ import os
import sys
from pathlib import Path
import ollama
import time
def read_transcript(transcript_file: Path) -> str:
"""Read the content of a transcript file."""
@@ -57,25 +58,44 @@ def main():
# Create summaries directory if it doesn't exist
summary_dir.mkdir(parents=True, exist_ok=True)
# Get list of all transcript files
transcript_files = list(transcript_dir.glob("*.txt"))
total_files = len(transcript_files)
print(f"Found {total_files} transcript(s) to process")
# Process all transcript files
for transcript_file in transcript_dir.glob("*.txt"):
print(f"Processing {transcript_file.name}...")
for idx, transcript_file in enumerate(transcript_files, 1):
print(f"\nProcessing {transcript_file.name} ({idx}/{total_files})...")
# Read transcript
transcript_text = read_transcript(transcript_file)
# Skip if summary already exists
summary_file = summary_dir / f"{transcript_file.stem}_summary.txt"
if summary_file.exists():
print(" Summary already exists, skipping...")
continue
# Generate summary
try:
# Read transcript
transcript_text = read_transcript(transcript_file)
print(f" Read transcript ({len(transcript_text)} characters)")
# Generate summary
summary = process_transcript(transcript_text)
# Save summary
summary_file = summary_dir / f"{transcript_file.stem}_summary.txt"
save_summary(summary, summary_file)
print(f" Summary saved to {summary_file}")
print(f"Summary saved to {summary_file}")
# Add a small delay between files to avoid overloading
if idx < total_files:
time.sleep(1)
except Exception as e:
print(f"Error processing {transcript_file.name}: {str(e)}")
print(f" Failed to process {transcript_file.name}")
print(f" Error: {str(e)}")
continue
print("\nDone! All transcripts processed.")
# Run the batch summarisation only when this file is executed as a script,
# so importing the module does not trigger any processing.
if __name__ == "__main__":
    main()