
🤖 Radxa Dragon Q6A: Offline "Jarvis" Assistant

Verified: February 2026
Hardware: Radxa Dragon Q6A (Qualcomm QCS6490)
OS: Ubuntu 24.04 (Noble)
Status: ✅ Production Ready

The "Hybrid" Architecture

Building a truly responsive voice assistant on embedded hardware requires balancing workloads. We use the NPU (Hexagon DSP) for the heavy lifting (the LLM) and the CPU (Kryo) for real-time sensory tasks; one full turn through the stack is sketched after the breakdown below.

Component Breakdown

  1. The Brain (NPU): Llama 3.2 1B running on the Hexagon DSP via Qualcomm's genie runtime.
    • Why NPU? It delivers ~15-20 tokens/sec at extremely low power, leaving the CPU free.
  2. The Ears (CPU): OpenAI Whisper (Tiny) running on CPU.
    • Why CPU? While NPU Whisper is possible, the CPU version handles the autoregressive decoder loop (turning speech into text) more robustly and is simpler to integrate. The 'Tiny' model is fast enough (~200ms latency).
  3. The Voice (CPU): Piper TTS (Neural Text-to-Speech).
    • Why Piper? It's highly optimized for ARM64 and generates human-like speech offline.
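
Putting the three together, one conversational turn looks like this. A minimal sketch that reuses the LlamaNPU class and the transformers ASR pipeline from the full listings further down; Piper playback is omitted here (see JarvisVoice below):

# One assistant turn: CPU ears -> NPU brain (TTS omitted; see JarvisVoice below).
import sounddevice as sd
import soundfile as sf
from transformers import pipeline
from llama_engine import LlamaNPU  # full listing below

ears = pipeline("automatic-speech-recognition", model="openai/whisper-tiny", device="cpu")
brain = LlamaNPU("~/llama-npu")

audio = sd.rec(5 * 16000, samplerate=16000, channels=1)  # record 5 seconds
sd.wait()
sf.write("turn.wav", audio, 16000)

text = ears("turn.wav", generate_kwargs={"language": "en"})["text"]  # speech -> text on CPU
print("USER:", text)
print("JARVIS:", brain.generate(text))  # text -> text on the Hexagon NPU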

🛠️ Prerequisites & Setup

1. System Dependencies

Install audio and NPU libraries.

sudo apt update
sudo apt install -y fastrpc fastrpc-dev libcdsprpc1 radxa-firmware-qcs6490 \
    python3-pip python3-venv libportaudio2 ffmpeg git alsa-utils
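
If you want to confirm the NPU userspace pieces actually landed, a quick check (package names taken from the apt line above):

# Confirm the fastrpc userspace packages installed (names from the apt line above).
import subprocess

for pkg in ["fastrpc", "libcdsprpc1", "radxa-firmware-qcs6490"]:
    out = subprocess.run(["dpkg", "-s", pkg], capture_output=True)
    print(pkg, "installed" if out.returncode == 0 else "MISSING")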

2. NPU Permissions

Allow users to access the Hexagon DSP without sudo.

sudo tee /etc/udev/rules.d/99-fastrpc.rules << 'EOF'
KERNEL=="fastrpc-*", MODE="0666"
SUBSYSTEM=="dma_heap", KERNEL=="system", MODE="0666"
EOF
sudo udevadm control --reload-rules && sudo udevadm trigger
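
To confirm the rules took effect, a quick Python check (this assumes the DSP nodes appear as /dev/fastrpc-*; adjust the glob if your kernel names them differently):

# Check that the Hexagon DSP nodes are world-accessible (assumes /dev/fastrpc-* naming).
import glob
import os
import stat

for node in glob.glob("/dev/fastrpc-*"):
    mode = stat.S_IMODE(os.stat(node).st_mode)
    print(node, oct(mode), "OK" if mode == 0o666 else "re-check the udev rule")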

3. Python Environment

Create a clean environment for the AI stack.

python3 -m venv ~/jarvis-venv
source ~/jarvis-venv/bin/activate

# Install Core & UI Libraries
pip install --upgrade pip
pip install rich sounddevice soundfile numpy modelscope

# Install Transformers (Pinned for stability)
pip install "transformers==4.48.1" torch

🚀 Installation

Step 1: Download the NPU Brain

We use the modelscope CLI (installed above) to fetch the pre-compiled Llama model.

mkdir -p ~/llama-npu && cd ~/llama-npu
modelscope download --model radxa/Llama3.2-1B-4096-qairt-v68 --local_dir .
chmod +x genie-t2t-run
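
Before wiring up the full assistant, you can smoke-test the NPU runtime directly. A sketch mirroring what llama_engine.py (below) does, using the config filename shipped with this model:

# One-shot NPU smoke test; mirrors llama_engine.py below.
import os
import subprocess

model_dir = os.path.expanduser("~/llama-npu")
result = subprocess.run(
    [os.path.join(model_dir, "genie-t2t-run"),
     "-c", os.path.join(model_dir, "htp-model-config-llama32-1b-gqa.json"),
     "-p", "Hello"],
    cwd=model_dir,  # genie expects tokenizer.json in the current directory
    capture_output=True, text=True,
)
print(result.stdout)  # the answer appears between [BEGIN]: and [END]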

Step 2: Download the Voice

We fetch Piper and a high-quality voice model.

mkdir -p ~/piper_tts && cd ~/piper_tts
# Download Piper binary
wget -O piper.tar.gz https://github.com/rhasspy/piper/releases/download/2023.11.14-2/piper_linux_aarch64.tar.gz
tar -xvf piper.tar.gz

# Download Voice (Ryan - Medium Quality)
wget -O en_US-ryan-medium.onnx https://huggingface.co/rhasspy/piper-voices/resolve/main/en/en_US/ryan/medium/en_US-ryan-medium.onnx
wget -O en_US-ryan-medium.onnx.json https://huggingface.co/rhasspy/piper-voices/resolve/main/en/en_US/ryan/medium/en_US-ryan-medium.onnx.json
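
A quick end-to-end voice test, mirroring the JarvisVoice class below (aplay comes from the alsa-utils package installed earlier):

# Speak a test sentence through Piper, then play it with aplay.
import os
import subprocess

piper_dir = os.path.expanduser("~/piper_tts")
subprocess.run(
    [os.path.join(piper_dir, "piper/piper"),
     "--model", os.path.join(piper_dir, "en_US-ryan-medium.onnx"),
     "--output_file", "test_speech.wav"],
    input=b"Systems online.", check=True,
)
subprocess.run(["aplay", "-q", "test_speech.wav"], check=True)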

Step 3: Run Jarvis

Place llama_engine.py and jarvis_ui.py (full listings below) in your home directory, and run Jarvis from that directory, since jarvis_ui.py imports llama_engine from the current working directory.

source ~/jarvis-venv/bin/activate
python3 ~/jarvis_ui.py

🧠 Lessons Learned (The "Gotchas")

  1. The "Current Working Directory" Bug: The Qualcomm genie binary looks for tokenizer.json in the folder where you run the command, not where the binary sits. We fixed this in llama_engine.py by forcing cwd=self.model_dir in the subprocess call.
  2. Audio Gibberish: Piping raw audio from Piper to aplay caused static noise due to header mismatches. The fix was to generate a temporary WAV file (temp_speech.wav) which ensures perfect playback.
  3. Log Pollution: The NPU binary prints verbose debug info (Using libGenie.so...). We strip it with a [BEGIN]/[END] extractor plus a line-by-line log filter, so the user only sees the AI's answer (see the toy demo after this list).
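
For illustration, here is the extraction step applied to a made-up raw dump (the log lines are fabricated examples of the noise, not genie's exact output):

# Toy demo of the output cleaner used in llama_engine.py (fake log lines).
import re

raw = (
    "Using libGenie.so\n"
    "[INFO] Allocated buffers via rpcmem\n"
    "[BEGIN]: The capital of France is Paris. [END]\n"
)
match = re.search(r'\[BEGIN\]:\s*(.*?)(?:\[END\]|$)', raw, re.DOTALL)
print(match.group(1).strip())  # -> The capital of France is Paris.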
jarvis_ui.py

#!/usr/bin/env python3
import os
import sys
import subprocess
import warnings
import logging

import sounddevice as sd
import soundfile as sf
from rich.console import Console
from rich.panel import Panel
from rich.align import Align
from transformers import pipeline

# --- SILENCE THE MACHINE ---
warnings.filterwarnings("ignore")
os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
logging.getLogger("transformers").setLevel(logging.ERROR)

# --- CONFIGURATION ---
LLAMA_PATH = os.path.expanduser("~/llama-npu")
PIPER_DIR = os.path.expanduser("~/piper_tts")
PIPER_BIN = os.path.join(PIPER_DIR, "piper/piper")
PIPER_MODEL = os.path.join(PIPER_DIR, "en_US-ryan-medium.onnx")
SAMPLE_RATE = 16000
RECORD_SECONDS = 5

# Add local path for importing the Llama engine
sys.path.append(os.getcwd())
try:
    from llama_engine import LlamaNPU
except ImportError:
    print("❌ Error: llama_engine.py not found in current folder.")
    sys.exit(1)

console = Console()


class JarvisVoice:
    """Handles Neural TTS via Piper."""

    def __init__(self):
        if not os.path.exists(PIPER_BIN):
            raise FileNotFoundError("Piper binary not found.")

    def speak(self, text):
        if not text or len(text.strip()) == 0:
            return
        try:
            clean_text = text.replace("\n", " ").replace('"', '').strip()
            # Generate audio to a temp file to prevent gibberish/static
            cmd = [PIPER_BIN, "--model", PIPER_MODEL, "--output_file", "temp_speech.wav"]
            # Run silently
            p = subprocess.Popen(cmd, stdin=subprocess.PIPE,
                                 stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
            p.communicate(input=clean_text.encode('utf-8'))
            # Play audio
            subprocess.run(["aplay", "-q", "temp_speech.wav"], stderr=subprocess.DEVNULL)
        except Exception:
            pass  # Fail silently in UI


def record_audio(duration):
    recording = sd.rec(int(duration * SAMPLE_RATE), samplerate=SAMPLE_RATE, channels=1)
    sd.wait()
    return recording


def main():
    console.clear()
    console.print(Panel(Align.center(
        "[bold cyan]RADXA DRAGON NPU[/bold cyan]\n"
        "[bold white]J.A.R.V.I.S. ONLINE[/bold white]",
        vertical="middle"), border_style="cyan", padding=(1, 2)))

    with console.status("[bold green]Booting Systems...", spinner="dots"):
        try:
            brain = LlamaNPU(LLAMA_PATH)
            ears = pipeline("automatic-speech-recognition", model="openai/whisper-tiny", device="cpu")
            voice = JarvisVoice()
        except Exception as e:
            console.print(f"[bold red]System Failure:[/bold red] {e}")
            return

    console.print("[bold green]✓ Ready[/bold green]\n")
    voice.speak("Systems online.")

    while True:
        try:
            console.rule("[bold cyan]STANDBY[/bold cyan]")
            console.print("[dim]Press [bold white]ENTER[/bold white] to speak[/dim]", justify="center")
            input()

            console.print(Panel("[bold red]● LISTENING...[/bold red]", border_style="red"))
            audio_data = record_audio(RECORD_SECONDS)
            sf.write("temp_input.wav", audio_data, SAMPLE_RATE)

            with console.status("[bold yellow]Processing...[/bold yellow]", spinner="aesthetic"):
                # Force English to avoid language detection latency
                result = ears("temp_input.wav", generate_kwargs={"language": "en"})
                user_text = result["text"].strip()

            if len(user_text) < 2:
                console.print("[dim italic]...no speech detected...[/dim italic]")
                continue

            console.print(f"\n[bold cyan]USER:[/bold cyan] {user_text}")

            with console.status("[bold magenta]Thinking...[/bold magenta]", spinner="earth"):
                response = brain.generate(user_text)

            console.print(f"[bold green]JARVIS:[/bold green] {response}\n")
            voice.speak(response)

        except KeyboardInterrupt:
            voice.speak("Goodbye.")
            break


if __name__ == "__main__":
    main()
llama_engine.py

import subprocess
import os
import re


class LlamaNPU:
    def __init__(self, model_dir="~/llama-npu"):
        self.model_dir = os.path.expanduser(model_dir)
        self.cmd_path = os.path.join(self.model_dir, "genie-t2t-run")
        self.config = os.path.join(self.model_dir, "htp-model-config-llama32-1b-gqa.json")

        # Validation
        required = ["genie-t2t-run", "tokenizer.json"]
        for f in required:
            if not os.path.exists(os.path.join(self.model_dir, f)):
                raise FileNotFoundError(f"Missing {f} in {self.model_dir}")

    def generate(self, user_prompt):
        """Runs Llama on the NPU and returns clean text."""
        # 1. Prompt engineering (keep it concise)
        full_prompt = (
            f"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\n"
            f"You are Jarvis. Answer concisely in one sentence.<|eot_id|>"
            f"<|start_header_id|>user<|end_header_id|>\n\n{user_prompt}<|eot_id|>"
            f"<|start_header_id|>assistant<|end_header_id|>\n\n"
        )

        # 2. Environment setup
        env = os.environ.copy()
        env["LD_LIBRARY_PATH"] = f"{self.model_dir}:{env.get('LD_LIBRARY_PATH', '')}"
        cmd = [self.cmd_path, "-c", self.config, "-p", full_prompt]

        try:
            # 3. Execution (fix: run inside the model dir)
            result = subprocess.run(
                cmd,
                cwd=self.model_dir,  # <--- CRITICAL FIX for tokenizer.json
                capture_output=True,
                text=True,
                env=env,
                encoding='utf-8',
                errors='replace'
            )
            raw_output = result.stdout + result.stderr

            # 4. Output cleaning
            # Try to extract content between [BEGIN] and [END] tags
            match = re.search(r'\[BEGIN\]:\s*(.*?)(?:\[END\]|$)', raw_output, re.DOTALL)
            if match:
                clean = match.group(1).strip()
                if clean:
                    return clean

            # Fallback: strip system logs line by line
            clean_lines = []
            for line in raw_output.split('\n'):
                if any(x in line for x in ["libGenie", "[INFO]", "Allocated",
                                           "rpcmem", "PROMPT:", "tokenizer"]):
                    continue
                if line.strip():
                    clean_lines.append(line)
            return "\n".join(clean_lines).strip() or "I heard you, but I have no response."
        except Exception as e:
            return f"System Error: {str(e)}"