MSU-AI
diff --git a/‎firebase.json‎
Lines changed: 11 additions & 1 deletion b/‎firebase.json‎
Lines changed: 11 additions & 1 deletion
diff --git a/‎frontend/src/components/DocumentUploader.tsx‎
Lines changed: 17 additions & 4 deletions b/‎frontend/src/components/DocumentUploader.tsx‎
Lines changed: 17 additions & 4 deletions
diff --git a/‎functions-node/index.js‎
Lines changed: 134 additions & 0 deletions b/‎functions-node/index.js‎
Lines changed: 134 additions & 0 deletions
@@ -6,14 +6,24 @@
   "functions": [
     {
       "source": "functions",
-      "codebase": "default",
+      "codebase": "python",
       "ignore": [
         "venv",
         ".git",
         "firebase-debug.log",
         "firebase-debug.*.log",
         "*.local"
       ]
+    },
+    {
+      "source": "functions-node",
+      "codebase": "nodejs",
+      "ignore": [
+        "node_modules",
+        ".git",
+        "firebase-debug.log",
+        "firebase-debug.*.log"
+      ]
     }
   ],
   "hosting": {
 
@@ -104,11 +104,24 @@ const DocumentUploader: React.FC = () => {
           const data = result.data as any;
 
           if (data.success) {
-            setProcessingStatus('Document uploaded successfully. Processing...');
+            setProcessingStatus('Document uploaded successfully. Extracting text...');
 
-            // Poll for document status
-            const documentId = data.documentId;
-            checkDocumentStatus(documentId);
+            // Call the new Node.js text extraction function
+            const extractText = httpsCallable(functions, 'extractPdfText');
+            const extractResult = await extractText({
+              documentType: documentType
+            });
+            
+            const extractData = extractResult.data as any;
+            
+            if (extractData.success) {
+              setProcessingStatus(`Successfully extracted ${extractData.textLength} characters. Predicting grade...`);
+              predictGrade();
+            } else {
+              setError('Text extraction failed: ' + (extractData.message || 'Unknown error'));
+              setProcessingStatus('');
+              setIsUploading(false);
+            }
           } else {
             setError('Upload failed: ' + (data.message || 'Unknown error'));
             setProcessingStatus('');
 
@@ -0,0 +1,134 @@
+const functions = require('firebase-functions');
+const admin = require('firebase-admin');
+const pdfParse = require('pdf-parse');
+const tmp = require('tmp');
+const fs = require('fs');
+
+admin.initializeApp(); // Initialise the Admin SDK once at module load (no explicit options); the handlers below use admin.firestore() and admin.storage().
+
+exports.extractPdfText = functions.https.onCall(async (data, context) => {
+  // Ensure user is authenticated
+  if (!context.auth) {
+    throw new functions.https.HttpsError(
+      'unauthenticated',
+      'User must be authenticated'
+    );
+  }
+  
+  const userId = context.auth.uid;
+  const { documentType } = data;
+  
+  if (!documentType || !['syllabus', 'transcript'].includes(documentType)) {
+    throw new functions.https.HttpsError(
+      'invalid-argument',
+      'Valid document type (syllabus or transcript) is required'
+    );
+  }
+  
+  try {
+    console.log(`Starting text extraction for ${documentType} from user ${userId}`);
+    
+    // Get document info from Firestore
+    const db = admin.firestore();
+    const docRef = db.collection('users').doc(userId).collection('documents').doc(documentType);
+    const doc = await docRef.get();
+    
+    if (!doc.exists) {
+      throw new functions.https.HttpsError(
+        'not-found',
+        `${documentType} not found`
+      );
+    }
+    
+    const docData = doc.data();
+    const filePath = docData.filePath;
+    
+    if (!filePath) {
+      throw new functions.https.HttpsError(
+        'not-found',
+        `File path not found for ${documentType}`
+      );
+    }
+    
+    console.log(`Downloading PDF from Firebase Storage: ${filePath}`);
+    
+    // Download file from Firebase Storage
+    const bucket = admin.storage().bucket();
+    const tempFile = tmp.fileSync({ postfix: '.pdf' });
+    
+    await bucket.file(filePath).download({
+      destination: tempFile.name
+    });
+    
+    console.log(`PDF downloaded to temporary file: ${tempFile.name}`);
+    
+    // Extract text using pdf-parse
+    const dataBuffer = fs.readFileSync(tempFile.name);
+    const pdfData = await pdfParse(dataBuffer);
+    
+    console.log(`Successfully extracted ${pdfData.text.length} characters of text`);
+    
+    // Clean up the temp file
+    tempFile.removeCallback();
+    
+    // Update document in Firestore with extracted text
+    await docRef.update({
+      text: pdfData.text,
+      lastExtracted: admin.firestore.FieldValue.serverTimestamp(),
+      status: 'processed'
+    });
+    
+    return {
+      success: true,
+      documentType,
+      message: `Successfully extracted text from ${documentType}`,
+      textLength: pdfData.text.length
+    };
+  } catch (error) {
+    console.error(`Error extracting text from PDF: ${error}`);
+    throw new functions.https.HttpsError(
+      'internal',
+      `Error extracting text from ${documentType}: ${error.message}`
+    );
+  }
+});
+
+// Add a function that works with the PDF upload trigger
+exports.processPdfUpload = functions.storage.object().onFinalize(async (object) => {
+  const filePath = object.name;
+  
+  // Only process PDFs in the user's directory
+  if (!filePath || !filePath.startsWith('users/') || !filePath.endsWith('.pdf')) {
+    return null;
+  }
+  
+  // Extract user ID and document type from path
+  // Expected format: users/{userId}/{documentType}/{filename}.pdf
+  const pathParts = filePath.split('/');
+  if (pathParts.length < 4) {
+    return null;
+  }
+  
+  const userId = pathParts[1];
+  const documentType = pathParts[2]; // "syllabus" or "transcript"
+  
+  try {
+    console.log(`Processing uploaded PDF: ${filePath}`);
+    
+    // Store basic information in Firestore
+    const db = admin.firestore();
+    const docRef = db.collection('users').doc(userId).collection('documents').doc(documentType);
+    
+    await docRef.set({
+      filePath: filePath,
+      uploadedAt: admin.firestore.FieldValue.serverTimestamp(),
+      status: 'uploaded'
+    });
+    
+    console.log(`PDF upload metadata saved to Firestore for ${filePath}`);
+    return null;
+  } catch (error) {
+    console.error(`Error processing uploaded PDF: ${error}`);
+    return null;
+  }
+});