Implemented an initial transcript merge stage

This commit is contained in:
2026-04-26 13:57:13 -05:00
parent c32349a017
commit 18f1873776
8 changed files with 535 additions and 28 deletions

View File

@@ -2,7 +2,15 @@ package model
// RawTranscript is a loaded input document before canonical normalization.
type RawTranscript struct {
Source string `json:"source"`
Source string `json:"source"`
Segments []RawSegment `json:"segments"`
}
// RawSegment is the supported WhisperX segment subset.
//
// Only the three fields below are decoded; each maps to the JSON key named in
// its struct tag.
type RawSegment struct {
	// Start is the segment's "start" value.
	// NOTE(review): presumably a time offset in seconds — confirm.
	Start float64 `json:"start"`
	// End is the segment's "end" value.
	// NOTE(review): presumably a time offset in seconds — confirm.
	End float64 `json:"end"`
	// Text is the segment's "text" value.
	Text string `json:"text"`
}
// CanonicalTranscript is a per-speaker transcript in seriatim's internal model.