Untitled

mail@pastecode.io avatarunknown
plain_text
2 months ago
896 B
24
Indexable
Never
import re

# Matches a bracketed timestamp such as "[00:01:23]" or "[0:01:23]" together
# with any whitespace right after it, so removing it leaves no stray gap.
_TIMESTAMP_RE = re.compile(r'\[\d{1,2}:\d{2}:\d{2}\]\s*')


def process_zoom_transcript(transcript):
    """Strip timestamps from a transcript and merge it into one paragraph.

    Args:
        transcript: An iterable of transcript lines, or a single string
            holding the whole transcript (it is split on line breaks).

    Returns:
        One string with every ``[H:MM:SS]`` / ``[HH:MM:SS]`` timestamp
        removed, each line trimmed of surrounding whitespace, and the
        non-empty lines joined by a single space. Empty input yields ``""``.
    """
    # A bare string would otherwise be iterated character by character.
    if isinstance(transcript, str):
        transcript = transcript.splitlines()

    # Strip after substitution so the space that followed the timestamp does
    # not end up as a leading space or a doubled space in the joined output.
    cleaned_lines = (_TIMESTAMP_RE.sub('', line).strip() for line in transcript)

    # Skip lines that held nothing but a timestamp or whitespace; joining them
    # would introduce extra spaces between utterances.
    return ' '.join(line for line in cleaned_lines if line)

# Sample input: one list entry per transcript line, each beginning with a
# bracketed [HH:MM:SS] timestamp followed by the speaker label and utterance.
zoom_transcript = [
    "[00:01:23] Speaker 1: Good morning.",
    "[00:02:45] Speaker 2: Hello there.",
    "[00:03:10] Speaker 1: How are you?",
    "[00:04:55] Speaker 2: I'm doing well. Thanks for asking.",
    "[00:05:30] Speaker 1: That's great to hear.",
    "[00:06:15] Speaker 2: Yeah, indeed.",
    "[00:08:00] Speaker 1: Anyway, it was nice talking to you.",
    "[00:09:20] Speaker 2: Absolutely. Let's catch up again soon!",
]

# Run the sample through the processor and show the resulting paragraph.
processed_transcript = process_zoom_transcript(zoom_transcript)
print(processed_transcript)