Removed Parakeet again, as it requires PyTorch, which is too large for this project

2026-06-15 09:51:51 +02:00 · 2026-01-18 19:13:18 +01:00
parent 8f2024df14
commit b6276b005e
2 changed files with 0 additions and 125 deletions
@@ -1,54 +0,0 @@
-// -----------------------------------------------------------
-//  Parakeet (Step 3A: spawn Python minimal integration)
-// -----------------------------------------------------------
-
-const fs = require("fs");
-const path = require("path");
-const { spawn } = require("child_process");
-
-module.exports = {
-    name: "parakeet",
-    type: "transcription",
-    displayname: "NVIDIA Parakeet",
-
-    async function(audioFilePath) {
-        console.log("🦜 [Parakeet] Starting test integration (spawn only)...");
-        console.log("🦜 Input audio:", audioFilePath);
-
-        // Check audio exists
-        if (!fs.existsSync(audioFilePath)) {
-            throw new Error("Audio file does not exist: " + audioFilePath);
-        }
-
-        // Output path in storage/transcripts
-        const sessionId = path.basename(audioFilePath).replace(/\.[^.]+$/, "");
-        const outputDir = path.join(__dirname, "../../../storage/transcripts");
-        fs.mkdirSync(outputDir, { recursive: true });
-
-        const outputPath = path.join(outputDir, `${sessionId}.json`);
-
-        // -------------------------------------------------------
-        // SPAWN PYTHON SCRIPT (step 3A — dummy script)
-        // -------------------------------------------------------
-        return new Promise((resolve, reject) => {
-            const python310 = "C:\\Users\\smith\\AppData\\Local\\Programs\\Python\\Python310\\python.exe";
-            const py = spawn(python310, [
-                path.join(__dirname, "parakeet_transcribe.py"),
-                audioFilePath,
-                outputPath
-            ]);
-
-            py.stdout.on("data", data => console.log("🦜 [Python]", data.toString().trim()));
-            py.stderr.on("data", data => console.error("🦜 [Python ERR]", data.toString().trim()));
-
-            py.on("close", code => {
-                if (code === 0) {
-                    console.log("🦜 [Parakeet] Done (spawn test). Output:", outputPath);
-                    resolve(outputPath);
-                } else {
-                    reject(new Error("Python script failed with exit code " + code));
-                }
-            });
-        });
-    }
-};
@@ -1,71 +0,0 @@
-# -----------------------------------------------------------
-#  Parakeet Real Transcriber (NVIDIA NeMo + PyTorch GPU)
-# -----------------------------------------------------------
-
-import sys
-import json
-import soundfile as sf
-import torch
-from nemo.collections.asr.models import ASRModel
-
-# Args:
-#   sys.argv[1] = input audio path
-#   sys.argv[2] = output JSON path
-
-audio_path = sys.argv[1]
-output_path = sys.argv[2]
-
-print("🔥 Starting Parakeet model...")
-device = "cuda" if torch.cuda.is_available() else "cpu"
-print("🔥 Using device:", device)
-
-# -----------------------------------------------------------
-# Load Parakeet model (NVIDIA pretrained ASR)
-# -----------------------------------------------------------
-model = ASRModel.from_pretrained(model_name="nvidia/parakeet-ctc-0.6b")
-model = model.to(device)
-model.eval()
-
-# -----------------------------------------------------------
-# Load audio
-# -----------------------------------------------------------
-print("🎧 Loading audio:", audio_path)
-audio, sr = sf.read(audio_path)
-
-# model expects mono float32
-if len(audio.shape) > 1:
-    audio = audio.mean(axis=1)
-
-audio = audio.astype("float32")
-
-# -----------------------------------------------------------
-# Run inference
-# -----------------------------------------------------------
-print("🧠 Running inference...")
-with torch.no_grad():
-    hyp = model.transcribe([audio])[0]
-
-# Extract only the text
-if hasattr(hyp, "text"):
-    transcript = hyp.text
-else:
-    # fallback: convert to string (rare)
-    transcript = str(hyp)
-
-print("📄 Transcript:", transcript)
-
-# -----------------------------------------------------------
-# Save JSON format compatible with V2D pipeline
-# -----------------------------------------------------------
-result = {
-    "id": output_path.split("/")[-1].replace(".json", ""),
-    "tool": "nemo_parakeet",
-    "status": "completed",
-    "text": transcript,
-    "words": []  # Parakeet XS doesn’t return word timestamps
-}
-
-with open(output_path, "w", encoding="utf-8") as f:
-    json.dump(result, f, indent=2, ensure_ascii=False)
-
-print("✔ JSON saved at:", output_path)