From 5295001a54cc2d191159b00ce51c623f980ffd66 Mon Sep 17 00:00:00 2001
From: gamvo74 <gamalveo@gmail.com>
Date: Wed, 25 Feb 2026 11:37:43 -0500
Subject: [PATCH] Integrate actual S3 upload and OpenAI Whisper transcription
 in TranscribePage

---
 apps/web/app/transcribe/page.tsx | 325 ++++++++++++++++++++++---------
 1 file changed, 237 insertions(+), 88 deletions(-)
diff --git a/apps/web/app/transcribe/page.tsx b/apps/web/app/transcribe/page.tsx
index d3c27d5..d10cd7c 100644
--- a/apps/web/app/transcribe/page.tsx
+++ b/apps/web/app/transcribe/page.tsx
@@ -15,35 +15,46 @@ import {
   FileText,
   Upload,
   X,
-  FileAudio
+  FileAudio,
+  Bot // For speaker identification (if available in transcription)
 } from 'lucide-react';
+import { useRouter } from 'next/navigation';
+import { AxiosError } from 'axios'; // Import AxiosError for type checking
 
-// Mock transcription data for demonstration
-const mockTranscript = [
-  { id: 1, start: 0, end: 5, speaker: "Speaker 1", text: "Welcome to the evidentiary hearing for Barden versus State Farm." },
-  { id: 2, start: 5, end: 12, speaker: "Speaker 2", text: "Thank you, Your Honor. We are here today to discuss the lack of personal jurisdiction as outlined in our recent motion." },
-  { id: 3, start: 12, end: 18, speaker: "Speaker 1", text: "Proceed. Please state your primary grounds for this challenge." },
-  { id: 4, start: 18, end: 25, speaker: "Speaker 2", text: "The defendant has no minimum contacts with the state of North Carolina, as required by the long-arm statute." },
-  { id: 5, start: 25, end: 32, speaker: "Speaker 3", text: "Objection, Your Honor. The defendant has maintained an office in Charlotte for over five years." },
-  { id: 6, start: 32, end: 40, speaker: "Speaker 1", text: "Overruled. I will allow the defense to finish their opening statement before hearing your rebuttal." },
-];
+// Transcription Segment Type
+interface TranscriptionSegment {
+  id: number;
+  start: number;
+  end: number;
+  speaker: string;
+  text: string;
+}
 
 export default function TranscribePage() {
+  const router = useRouter();
   const [isPlaying, setIsPlaying] = useState(false);
   const [currentTime, setCurrentTime] = useState(0);
-  const [duration, setDuration] = useState(40);
+  const [mediaDuration, setMediaDuration] = useState(0);
   const [searchQuery, setSearchQuery] = useState("");
   const [playbackSpeed, setPlaybackSpeed] = useState(1);
   const [isUploading, setIsUploading] = useState(false);
-  const [uploadProgress, setUploadProgress] = useState(0);
+  const [uploadProgress, setUploadProgress] = useState(0); // Will be updated by polling
   const [selectedFile, setSelectedFile] = useState<File | null>(null);
-  
+  const [transcription, setTranscription] = useState<TranscriptionSegment[]>([]);
+  const [documentId, setDocumentId] = useState<string | null>(null);
+  const [mediaBlobUrl, setMediaBlobUrl] = useState<string | null>(null); // For uploaded media preview
+  const [transcriptionStatus, setTranscriptionStatus] = useState<string>('PENDING');
+
   const audioRef = useRef<HTMLAudioElement>(null);
   const transcriptRef = useRef<HTMLDivElement>(null);
   const activeLineRef = useRef<HTMLDivElement>(null);
   const fileInputRef = useRef<HTMLInputElement>(null);
 
-  // Auto-scroll logic
+  // Hardcoded matterId for now - MUST be replaced with dynamic value (e.g., from URL or user context)
+  // For initial testing, ensure you have a matter created in your DB for the user.
+  const MATTER_ID = 'your_matter_id_here'; 
+
+  // --- Auto-scroll and media player controls ---
   useEffect(() => {
     if (activeLineRef.current && transcriptRef.current) {
       activeLineRef.current.scrollIntoView({
@@ -53,30 +64,6 @@ export default function TranscribePage() {
     }
   }, [currentTime]);
 
-  const handleUpload = (event: React.ChangeEvent<HTMLInputElement>) => {
-    const file = event.target.files?.[0];
-    if (file) {
-      setSelectedFile(file);
-      simulateUpload();
-    }
-  };
-
-  const simulateUpload = () => {
-    setIsUploading(true);
-    let progress = 0;
-    const interval = setInterval(() => {
-      progress += 10;
-      setUploadProgress(progress);
-      if (progress >= 100) {
-        clearInterval(interval);
-        setTimeout(() => {
-          setIsUploading(false);
-          setUploadProgress(0);
-        }, 500);
-      }
-    }, 200);
-  };
-
   const formatTime = (seconds: number) => {
     const h = Math.floor(seconds / 3600);
     const m = Math.floor((seconds % 3600) / 60);
@@ -87,6 +74,7 @@ export default function TranscribePage() {
   const handleTimeUpdate = () => {
     if (audioRef.current) {
       setCurrentTime(audioRef.current.currentTime);
+      setMediaDuration(audioRef.current.duration);
     }
   };
 
@@ -97,6 +85,134 @@ export default function TranscribePage() {
     }
   };
 
+  // --- Real Upload and Transcription Polling Logic ---
+  const getAuthToken = () => {
+    // TODO: Implement actual JWT token retrieval (e.g., from localStorage, context, or auth hook)
+    // For now, return a placeholder. This MUST be replaced with a real token.
+    return 'YOUR_JWT_TOKEN_HERE'; 
+  };
+
+  const handleUpload = async (event: React.ChangeEvent<HTMLInputElement>) => {
+    const file = event.target.files?.[0];
+    if (!file) return;
+
+    setSelectedFile(file);
+    setMediaBlobUrl(URL.createObjectURL(file)); // Create URL for local preview
+    setIsUploading(true);
+    setUploadProgress(0);
+    setTranscription([]);
+    setTranscriptionStatus('PENDING');
+
+    const formData = new FormData();
+    formData.append('file', file);
+
+    const token = getAuthToken();
+    if (token === 'YOUR_JWT_TOKEN_HERE') {
+      alert('Please replace YOUR_JWT_TOKEN_HERE with a real token in transcribe/page.tsx and MATTER_ID with a valid matter.');
+      setIsUploading(false);
+      return;
+    }
+
+    try {
+      const response = await fetch(`${process.env.NEXT_PUBLIC_API_URL}/documents/${MATTER_ID}/upload`, {
+        method: 'POST',
+        body: formData,
+        headers: {
+          'Authorization': `Bearer ${token}`, 
+        },
+      });
+
+      if (!response.ok) {
+        const errorData = await response.json();
+        throw new Error(errorData.message || 'File upload failed');
+      }
+
+      const data = await response.json();
+      setDocumentId(data.id); // Set the document ID to start polling for transcription
+      // No longer simulating progress, actual progress will come from polling.
+
+    } catch (error: any) {
+      setIsUploading(false);
+      console.error('Upload error:', error);
+      alert(`Upload failed: ${error.message}`);
+    }
+  };
+
+  // Polling for Transcription Results
+  useEffect(() => {
+    let pollingInterval: NodeJS.Timeout;
+
+    const pollTranscription = async () => {
+      if (!documentId) return;
+
+      const token = getAuthToken();
+      if (token === 'YOUR_JWT_TOKEN_HERE') return;
+
+      try {
+        const response = await fetch(`${process.env.NEXT_PUBLIC_API_URL}/documents/${documentId}/transcription`, {
+          headers: {
+            'Authorization': `Bearer ${token}`, 
+          },
+        });
+        const data = await response.json();
+        
+        setTranscriptionStatus(data.transcriptionStatus);
+        // Simulate progress based on status (real backend would send progress %)
+        if (data.transcriptionStatus === 'PROCESSING') {
+          setUploadProgress(50); 
+        } else if (data.transcriptionStatus === 'COMPLETED') {
+          setUploadProgress(100);
+        }
+
+        if (data.transcriptionStatus === 'COMPLETED' && data.transcriptionText) {
+          const parsedTranscription = JSON.parse(data.transcriptionText);
+          // Assuming parsedTranscription.segments contains what we need from OpenAI verbose_json
+          setTranscription(parsedTranscription.segments.map((s: any, index: number) => ({
+            id: index, // Use index if OpenAI doesn't provide segment ID directly
+            start: s.start,
+            end: s.end,
+            speaker: s.speaker || `Speaker ${s.id || 0}`, // Whisper doesn't do speaker diarization by default, might need external lib
+            text: s.text.trim(),
+          })));
+          setMediaDuration(parsedTranscription.duration || audioRef.current?.duration || 0);
+          setIsUploading(false); // Stop progress once transcription is done
+          clearInterval(pollingInterval);
+        } else if (data.transcriptionStatus === 'FAILED') {
+          setIsUploading(false);
+          alert('Transcription failed.');
+          clearInterval(pollingInterval);
+        }
+      } catch (error) {
+        console.error('Error fetching transcription:', error);
+        setIsUploading(false);
+        alert('Error fetching transcription status.');
+        clearInterval(pollingInterval);
+      }
+    };
+
+    if (documentId && isUploading) {
+      pollingInterval = setInterval(pollTranscription, 3000); // Poll every 3 seconds
+    }
+
+    return () => clearInterval(pollingInterval); // Cleanup interval
+  }, [documentId, isUploading]);
+
+  const displayStatusMessage = () => {
+    switch (transcriptionStatus) {
+      case 'PENDING':
+        return 'Waiting to start transcription...';
+      case 'PROCESSING':
+        return 'Transcribing in progress...';
+      case 'COMPLETED':
+        return 'Transcription complete!';
+      case 'FAILED':
+        return 'Transcription failed!';
+      default:
+        return 'Unknown status';
+    }
+  };
+
+
   return (
     <div className="h-[calc(100vh-12rem)] flex flex-col gap-6 -m-4">
       <div className="flex justify-between items-center px-4">
@@ -136,15 +252,17 @@ export default function TranscribePage() {
         </div>
       </div>
 
-      {isUploading && (
+      {isUploading && (transcriptionStatus !== 'COMPLETED') && (
         <div className="mx-4 bg-blue-50 dark:bg-blue-900/20 border border-blue-100 dark:border-blue-800 p-4 rounded-xl flex items-center gap-4">
           <div className="w-10 h-10 rounded-full bg-blue-600 flex items-center justify-center text-white">
             <Upload size={20} className="animate-bounce" />
           </div>
           <div className="flex-1">
             <div className="flex justify-between items-center mb-1">
-              <p className="text-sm font-bold text-blue-900 dark:text-blue-100">Processing: {selectedFile?.name}</p>
-              <p className="text-xs font-bold text-blue-600">{uploadProgress}%</p>
+              <p className="text-sm font-bold text-blue-900 dark:text-blue-100">
+                {selectedFile ? `Uploading & Processing: ${selectedFile.name}` : 'Processing file...'}
+              </p>
+              <p className="text-xs font-bold text-blue-600">{transcriptionStatus === 'COMPLETED' ? '100%' : uploadProgress > 0 ? `${uploadProgress}%` : ''}</p>
             </div>
             <div className="w-full bg-blue-200 dark:bg-blue-800 h-2 rounded-full overflow-hidden">
               <div 
@@ -152,8 +270,9 @@ export default function TranscribePage() {
                 style={{ width: `${uploadProgress}%` }}
               ></div>
             </div>
+            <p className="text-xs text-blue-700 dark:text-blue-200 mt-1">{displayStatusMessage()}</p>
           </div>
-          <button onClick={() => setIsUploading(false)} className="text-blue-400 hover:text-blue-600">
+          <button onClick={() => {setIsUploading(false); setTranscriptionStatus('PENDING');}} className="text-blue-400 hover:text-blue-600">
             <X size={20} />
           </button>
         </div>
@@ -163,12 +282,26 @@ export default function TranscribePage() {
         {/* Left: Media Player & Controls */}
         <div className="w-1/3 flex flex-col gap-4">
           <div className="bg-slate-900 rounded-2xl p-8 flex flex-col items-center justify-center text-white aspect-video relative overflow-hidden group">
-            {selectedFile ? (
-              <FileAudio size={64} className="text-blue-500 mb-4" />
+            {mediaBlobUrl ? (
+              <audio 
+                controls 
+                ref={audioRef} 
+                onTimeUpdate={handleTimeUpdate} 
+                onLoadedMetadata={() => audioRef.current && setMediaDuration(audioRef.current.duration)}
+                src={mediaBlobUrl} 
+                className="w-full h-full object-contain"
+                onPlay={() => setIsPlaying(true)}
+                onPause={() => setIsPlaying(false)}
+                onEnded={() => setIsPlaying(false)}
+                playbackRate={playbackSpeed}
+              ></audio>
             ) : (
-              <Volume2 size={64} className="text-blue-500/20 mb-4" />
+              <>
+                <Volume2 size={64} className="text-blue-500/20 mb-4" />
+                <p className="font-bold">Upload audio/video to begin</p>
+              </>
             )}
-            <p className="font-bold truncate max-w-full px-4">{selectedFile ? selectedFile.name : 'Evidentiary_Hearing_022426.mp3'}</p>
+            <p className="font-bold truncate max-w-full px-4">{selectedFile ? selectedFile.name : 'No file selected'}</p>
             <p className="text-xs text-slate-500">Matter: Barden v. State Farm</p>
             
             {/* Minimalist Player UI Overlay */}
@@ -176,11 +309,11 @@ export default function TranscribePage() {
               <div className="w-full bg-white/20 h-1.5 rounded-full mb-4 cursor-pointer relative" onClick={(e) => {
                 const rect = e.currentTarget.getBoundingClientRect();
                 const x = e.clientX - rect.left;
-                seek((x / rect.width) * duration);
+                seek((x / rect.width) * mediaDuration);
               }}>
                 <div 
                   className="absolute inset-y-0 left-0 bg-blue-500 rounded-full" 
-                  style={{ width: `${(currentTime / duration) * 100}%` }}
+                  style={{ width: `${(currentTime / mediaDuration) * 100}%` }}
                 ></div>
               </div>
               <div className="flex items-center justify-between">
@@ -189,8 +322,14 @@ export default function TranscribePage() {
                   <SkipBack size={20} className="cursor-pointer hover:text-blue-400" onClick={() => seek(currentTime - 5)} />
                   <button 
                     onClick={() => {
-                      setIsPlaying(!isPlaying);
-                      // In real app: audioRef.current.play/pause
+                      if (audioRef.current) {
+                        if (isPlaying) {
+                          audioRef.current.pause();
+                        } else {
+                          audioRef.current.play();
+                        }
+                        setIsPlaying(!isPlaying);
+                      }
                     }}
                     className="w-10 h-10 bg-blue-600 rounded-full flex items-center justify-center hover:bg-blue-700 transition-all"
                   >
@@ -198,7 +337,7 @@ export default function TranscribePage() {
                   </button>
                   <SkipForward size={20} className="cursor-pointer hover:text-blue-400" onClick={() => seek(currentTime + 5)} />
                 </div>
-                <span className="text-[10px] font-mono">{formatTime(duration)}</span>
+                <span className="text-[10px] font-mono">{formatTime(mediaDuration)}</span>
               </div>
             </div>
           </div>
@@ -209,7 +348,10 @@ export default function TranscribePage() {
               <span className="text-sm font-medium">Playback Speed</span>
               <select 
                 value={playbackSpeed} 
-                onChange={(e) => setPlaybackSpeed(Number(e.target.value))}
+                onChange={(e) => {
+                  setPlaybackSpeed(Number(e.target.value));
+                  if(audioRef.current) audioRef.current.playbackRate = Number(e.target.value);
+                }}
                 className="bg-slate-50 dark:bg-slate-800 border-none rounded-lg text-sm font-bold p-2"
               >
                 <option value={0.5}>0.5x</option>
@@ -235,8 +377,8 @@ export default function TranscribePage() {
               <h4 className="font-bold text-sm">Transcript (Sync Active)</h4>
             </div>
             <div className="flex gap-4 text-[10px] font-bold text-slate-400 uppercase tracking-widest">
-              <span className="flex items-center gap-1"><User size={12} /> 3 Speakers Identified</span>
-              <span className="flex items-center gap-1"><Clock size={12} /> 00:40 Total Duration</span>
+              <span className="flex items-center gap-1"><User size={12} /> {new Set(transcription.map(t => t.speaker)).size} Speakers Identified</span>
+              <span className="flex items-center gap-1"><Clock size={12} /> {formatTime(mediaDuration)} Total Duration</span>
             </div>
           </header>
 
@@ -244,51 +386,58 @@ export default function TranscribePage() {
             ref={transcriptRef}
             className="flex-1 overflow-y-auto p-8 space-y-8 scroll-smooth"
           >
-            {mockTranscript.map((line) => {
-              const isActive = currentTime >= line.start && currentTime < line.end;
-              const isMatch = searchQuery && line.text.toLowerCase().includes(searchQuery.toLowerCase());
+            {transcription.length > 0 ? (
+              transcription.map((line) => {
+                const isActive = currentTime >= line.start && currentTime < line.end;
+                const isMatch = searchQuery && line.text.toLowerCase().includes(searchQuery.toLowerCase());
 
-              return (
-                <div 
-                  key={line.id} 
-                  ref={isActive ? activeLineRef : null}
-                  className={`flex gap-6 transition-all duration-300 rounded-xl p-4 ${
-                    isActive ? 'bg-blue-50 dark:bg-blue-900/20 ring-1 ring-blue-100 dark:ring-blue-800 shadow-sm' : ''
-                  } ${isMatch ? 'bg-yellow-50 dark:bg-yellow-900/20' : ''}`}
-                >
-                  <button 
-                    onClick={() => seek(line.start)}
-                    className={`text-[11px] font-mono font-bold w-20 flex-shrink-0 transition-colors ${
-                      isActive ? 'text-blue-600' : 'text-slate-400 hover:text-blue-500'
-                    }`}
+                return (
+                  <div 
+                    key={line.id} 
+                    ref={isActive ? activeLineRef : null}
+                    className={`flex gap-6 transition-all duration-300 rounded-xl p-4 ${
+                      isActive ? 'bg-blue-50 dark:bg-blue-900/20 ring-1 ring-blue-100 dark:ring-blue-800 shadow-sm' : ''
+                    } ${isMatch ? 'bg-yellow-50 dark:bg-yellow-900/20' : ''}`}
                   >
-                    [{formatTime(line.start)}]
-                  </button>
-                  <div className="space-y-1 flex-1">
-                    <p className={`text-[10px] font-bold uppercase tracking-wider ${
-                      isActive ? 'text-blue-600' : 'text-slate-400'
-                    }`}>
-                      {line.speaker}
-                    </p>
-                    <p className={`text-sm leading-relaxed transition-colors ${
-                      isActive ? 'text-slate-900 dark:text-white font-medium' : 'text-slate-600 dark:text-slate-400'
-                    }`}>
-                      {line.text}
-                    </p>
+                    <button 
+                      onClick={() => seek(line.start)}
+                      className={`text-[11px] font-mono font-bold w-20 flex-shrink-0 transition-colors ${
+                        isActive ? 'text-blue-600' : 'text-slate-400 hover:text-blue-500'
+                      }`}
+                    >
+                      [{formatTime(line.start)}]
+                    </button>
+                    <div className="space-y-1 flex-1">
+                      <p className={`text-[10px] font-bold uppercase tracking-wider ${
+                        isActive ? 'text-blue-600' : 'text-slate-400'
+                      }`}>
+                        {line.speaker}
+                      </p>
+                      <p className={`text-sm leading-relaxed transition-colors ${
+                        isActive ? 'text-slate-900 dark:text-white font-medium' : 'text-slate-600 dark:text-slate-400'
+                      }`}>
+                        {line.text}
+                      </p>
+                    </div>
                   </div>
-                </div>
-              );
-            })}
+                );
+              })
+            ) : (
+              <div className="text-center text-slate-500 mt-12">
+                <p>Upload an audio or video file to get started with transcription.</p>
+                {isUploading && <p className="mt-2 text-blue-500">{displayStatusMessage()}</p>}
+              </div>
+            )}
           </div>
 
           <footer className="p-4 bg-slate-50 dark:bg-slate-800/50 border-t border-slate-200 dark:border-slate-800">
             <div className="flex items-center justify-between text-[10px] font-bold text-slate-400 uppercase tracking-widest">
               <p>Sync Latency: &lt;100ms</p>
-              <p>Autosave Active: 12:45 PM</p>
+              <p>Autosave Active: {new Date().toLocaleTimeString('en-US', { hour: '2-digit', minute: '2-digit' })}</p>
             </div>
           </footer>
         </div>
       </div>
     </div>
   );
-}
+}
\ No newline at end of file