akshitsinha
diff --git a/‎.github/workflows/ci.yml
Lines changed: 1 addition & 0 deletions b/‎.github/workflows/ci.yml
Lines changed: 1 addition & 0 deletions
diff --git a/‎pyproject.toml
Lines changed: 2 additions & 0 deletions b/‎pyproject.toml
Lines changed: 2 additions & 0 deletions
diff --git a/‎src/config.py
Lines changed: 0 additions & 6 deletions b/‎src/config.py
Lines changed: 0 additions & 6 deletions
diff --git a/‎src/devices/audio.py
Lines changed: 188 additions & 87 deletions b/‎src/devices/audio.py
Lines changed: 188 additions & 87 deletions
diff --git a/‎src/devices/preview.py
Lines changed: 0 additions & 5 deletions b/‎src/devices/preview.py
Lines changed: 0 additions & 5 deletions
diff --git a/‎src/devices/printer.py
Lines changed: 1 addition & 7 deletions b/‎src/devices/printer.py
Lines changed: 1 addition & 7 deletions
@@ -21,6 +21,7 @@ jobs:
           pip install uv
       - name: Install dependencies
         run: |
+          # libav-tools is no longer packaged on current Ubuntu runners; ffmpeg supersedes it.
+          sudo apt-get update && sudo apt-get install -y libasound-dev portaudio19-dev libportaudio2 libportaudiocpp0 ffmpeg
           uv tool install ruff
           uv sync
       - name: Lint with ruff
 
@@ -7,6 +7,8 @@ requires-python = ">=3.10"
 dependencies = [
     "fastmcp>=2.4.0",
     "mss>=10.0.0",
+    "numpy>=2.2.6",
+    "pyaudio>=0.2.14",
     "python-ffmpeg>=2.0.12",
     "screeninfo>=0.8.1",
 ]
@@ -11,15 +11,9 @@ class Settings(BaseSettings):
         default=True, description="Enable printer functionality"
     )
     enable_audio: bool = Field(default=True, description="Enable audio functionality")
-    enable_storage: bool = Field(
-        default=True, description="Enable storage device functionality"
-    )
     enable_screen: bool = Field(
         default=True, description="Enable screen capture functionality"
     )
-    enable_usb: bool = Field(
-        default=True, description="Enable USB device functionality"
-    )
 
     model_config = {
         "env_prefix": "MCP_",
 
@@ -1,97 +1,198 @@
-from typing import Dict, List, Optional, Any
 from fastmcp import FastMCP
-
-
-class AudioDevice:
-    def __init__(self, device_id: str, name: str, is_input: bool):
-        self.device_id = device_id
-        self.name = name
-        self.is_input = is_input
+import pyaudio
+import wave
+from typing import Any, Dict, List, Optional
+from pydantic import Field
+from typing import Annotated
+import tempfile
+import datetime
+import os
 
 
 def register_tools(app: FastMCP) -> None:
     @app.tool(
         name="list_audio_devices",
-        description="List all audio devices connected to the system",
+        description="List all available audio input and output devices",
+        tags=["audio"],
     )
-    async def list_audio_devices(
-        input_only: bool = False, output_only: bool = False
-    ) -> List[Dict[str, Any]]:
-        devices = []
-
-        if not output_only:
-            devices.extend(
-                [
-                    {
-                        "device_id": "mic0",
-                        "name": "Built-in Microphone",
-                        "type": "input",
-                    },
-                    {"device_id": "mic1", "name": "USB Microphone", "type": "input"},
-                ]
-            )
+    def list_audio_devices() -> Dict[str, List[Dict[str, Any]]]:
+        """Enumerate the audio devices PyAudio reports, split by direction.
+
+        Returns:
+            A dict with two lists, ``"input_devices"`` and ``"output_devices"``.
+            Each entry holds the device index, name, maximum input/output
+            channel counts, default sample rate and host API name. A device
+            with both input and output channels appears in both lists.
+        """
+        p = pyaudio.PyAudio()
+
+        try:
+            input_devices = []
+            output_devices = []
+
+            for i in range(p.get_device_count()):
+                device_info = p.get_device_info_by_index(i)
+                host_api = p.get_host_api_info_by_index(device_info["hostApi"])
+                device_data = {
+                    "index": i,
+                    "name": device_info["name"],
+                    "max_input_channels": device_info["maxInputChannels"],
+                    "max_output_channels": device_info["maxOutputChannels"],
+                    "default_sample_rate": device_info["defaultSampleRate"],
+                    "host_api": host_api["name"],
+                }
+
+                if device_info["maxInputChannels"] > 0:
+                    input_devices.append(device_data)
+
+                if device_info["maxOutputChannels"] > 0:
+                    output_devices.append(device_data)
+
+            return {"input_devices": input_devices, "output_devices": output_devices}
+        finally:
+            # Runs on every exit path, including when a device query raises.
+            p.terminate()
+
+    @app.tool(
+        name="record_audio",
+        description="Record audio from the microphone and save to a file",
+        tags=["audio"],
+    )
+    def record_audio(
+        duration: Annotated[
+            float, Field(default=5.0, description="Recording duration in seconds")
+        ] = 5.0,
+        sample_rate: Annotated[
+            Optional[int], Field(default=44100, description="Sample rate in Hz")
+        ] = 44100,
+        channels: Annotated[
+            Optional[int], Field(default=1, description="Number of audio channels")
+        ] = 1,
+        output_file: Annotated[
+            Optional[str], Field(description="Output file path for the recorded audio")
+        ] = None,
+        device_index: Annotated[
+            Optional[int],
+            Field(
+                default=None, description="Audio input device index (None for default)"
+            ),
+        ] = None,
+    ) -> Dict[str, Any]:
+        """Record audio from an input device and write it to a 16-bit WAV file.
+
+        Args:
+            duration: Length of the recording in seconds; must be positive.
+            sample_rate: Sample rate in Hz; ``None`` falls back to 44100.
+            channels: Number of channels; ``None`` falls back to 1.
+            output_file: Destination path. When ``None``, a timestamped
+                ``recording_*.wav`` is created in the system temp directory.
+            device_index: PyAudio input device index, or ``None`` for the
+                default input device.
+
+        Returns:
+            On success, a dict with ``"success": True`` plus the output path,
+            duration, sample rate, channel count and device name. On any
+            failure, ``{"success": False, "error": <message>}``.
+        """
+        chunk = 1024
+        sample_format = pyaudio.paInt16
+
+        # Both parameters are typed Optional, so treat an explicit None as
+        # "use the documented default" instead of failing in the arithmetic.
+        if sample_rate is None:
+            sample_rate = 44100
+        if channels is None:
+            channels = 1
+
+        if duration <= 0:
+            return {"success": False, "error": "Duration must be greater than 0"}
+
+        if output_file is None:
+            timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
+            filename = f"recording_{timestamp}.wav"
+            output_file = os.path.join(tempfile.gettempdir(), filename)
+
+        p = pyaudio.PyAudio()
+
+        try:
+            device_info = None
+            if device_index is not None:
+                device_info = p.get_device_info_by_index(device_index)
+                if device_info["maxInputChannels"] == 0:
+                    return {
+                        "success": False,
+                        "error": f"Device {device_index} is not an input device",
+                    }
 
-        if not input_only:
-            devices.extend(
-                [
-                    {
-                        "device_id": "spk0",
-                        "name": "Built-in Speakers",
-                        "type": "output",
-                    },
-                    {
-                        "device_id": "spk1",
-                        "name": "HDMI Audio Output",
-                        "type": "output",
-                    },
-                ]
+            stream = p.open(
+                format=sample_format,
+                channels=channels,
+                rate=sample_rate,
+                input=True,
+                frames_per_buffer=chunk,
+                input_device_index=device_index,
             )
 
-        return devices
-
-    @app.tool(name="record_audio", description="Record audio from an input device")
-    async def record_audio(
-        device_id: str,
-        duration: Optional[int] = None,
-        save_path: Optional[str] = None,
-        format: str = "mp3",
-        quality: str = "medium",
-    ) -> Dict[str, Any]:
-        return {
-            "success": True,
-            "recording_id": "audio123456",
-            "device_id": device_id,
-            "file_path": save_path or f"/tmp/mcp-peripherals/audio_recording.{format}",
-            "start_time": "2025-05-23T12:34:56",
-            "format": format,
-            "quality": quality,
-            "max_duration": duration or "unlimited",
-        }
-
-    @app.tool(name="stop_audio_recording", description="Stop recording audio")
-    async def stop_audio_recording(recording_id: str) -> Dict[str, Any]:
-        return {
-            "success": True,
-            "recording_id": recording_id,
-            "file_path": "/tmp/mcp-peripherals/audio_recording.mp3",
-            "duration": "00:02:34",
-            "file_size": "3.2 MB",
-        }
-
-    @app.tool(name="play_audio", description="Play audio through an output device")
-    async def play_audio(
-        device_id: str, file_path: str, volume: Optional[int] = 100, loop: bool = False
-    ) -> Dict[str, Any]:
-        return {
-            "success": True,
-            "playback_id": "play123456",
-            "device_id": device_id,
-            "file_path": file_path,
-            "duration": "00:03:45",
-            "volume": volume,
-            "loop": loop,
-        }
-
-    @app.tool(name="stop_audio_playback", description="Stop playing audio")
-    async def stop_audio_playback(playback_id: str) -> Dict[str, Any]:
-        return {"success": True, "playback_id": playback_id, "status": "stopped"}
+            frames = []
+            # Count sample frames rather than whole chunks so the trailing
+            # partial chunk is recorded instead of being truncated.
+            remaining = int(sample_rate * duration)
+
+            try:
+                while remaining > 0:
+                    count = min(chunk, remaining)
+                    frames.append(stream.read(count))
+                    remaining -= count
+            finally:
+                # Close the stream even when a read fails part-way through.
+                stream.stop_stream()
+                stream.close()
+
+            with wave.open(output_file, "wb") as wf:
+                wf.setnchannels(channels)
+                wf.setsampwidth(p.get_sample_size(sample_format))
+                wf.setframerate(sample_rate)
+                wf.writeframes(b"".join(frames))
+
+            return {
+                "success": True,
+                "output_file": output_file,
+                "duration": duration,
+                "sample_rate": sample_rate,
+                "channels": channels,
+                "device_used": device_info["name"] if device_info else "Default device",
+            }
+        except Exception as e:
+            # Tool boundary: report the failure to the caller instead of raising.
+            return {"success": False, "error": str(e)}
+        finally:
+            p.terminate()
+
+    @app.tool(
+        name="play_audio",
+        description="Play an audio file through the specified output device",
+        tags=["audio"],
+    )
+    def play_audio(
+        file_path: Annotated[str, Field(description="Path to the audio file to play")],
+        device_index: Annotated[
+            Optional[int],
+            Field(
+                default=None, description="Audio output device index (None for default)"
+            ),
+        ] = None,
+    ) -> Dict[str, Any]:
+        """Play a WAV file through an output device, returning after playback.
+
+        The file is read with the standard ``wave`` module, so only formats
+        that module can open are supported.
+
+        Args:
+            file_path: Path to the audio file to play.
+            device_index: PyAudio output device index, or ``None`` for the
+                default output device.
+
+        Returns:
+            On success, a dict with ``"success": True`` plus the file path,
+            duration in seconds, sample rate, channel count and device name.
+            On any failure, ``{"success": False, "error": <message>}``.
+        """
+        chunk = 1024
+
+        try:
+            with wave.open(file_path, "rb") as wf:
+                channels = wf.getnchannels()
+                sample_width = wf.getsampwidth()
+                sample_rate = wf.getframerate()
+                duration = wf.getnframes() / sample_rate
+
+                p = pyaudio.PyAudio()
+
+                try:
+                    device_info = None
+                    if device_index is not None:
+                        device_info = p.get_device_info_by_index(device_index)
+                        if device_info["maxOutputChannels"] == 0:
+                            return {
+                                "success": False,
+                                "error": f"Device {device_index} is not an output device",
+                            }
+
+                    stream = p.open(
+                        format=p.get_format_from_width(sample_width),
+                        channels=channels,
+                        rate=sample_rate,
+                        output=True,
+                        output_device_index=device_index,
+                    )
+
+                    try:
+                        # readframes() returns empty bytes at end of file.
+                        while data := wf.readframes(chunk):
+                            stream.write(data)
+                    finally:
+                        # Close the stream even when a write fails mid-playback.
+                        stream.stop_stream()
+                        stream.close()
+
+                    return {
+                        "success": True,
+                        "file_played": file_path,
+                        "duration": duration,
+                        "sample_rate": sample_rate,
+                        "channels": channels,
+                        "device_used": device_info["name"]
+                        if device_info
+                        else "Default device",
+                    }
+                finally:
+                    p.terminate()
+        except FileNotFoundError:
+            return {"success": False, "error": f"Audio file not found: {file_path}"}
+        except Exception as e:
+            # Tool boundary: report the failure to the caller instead of raising.
+            return {"success": False, "error": str(e)}
@@ -8,11 +8,6 @@
 import os
 
 
-class Printer:
-    def __init__(self, printer_name: str):
-        self.printer_name = printer_name
-
-
 def register_tools(app: FastMCP) -> None:
     @app.tool(
         description="List all printers available on the system",
@@ -31,8 +26,7 @@ async def list_printers() -> List[Dict[str, str]]:
                     match = re.match(r"printer (\S+)", line)
                     if match:
                         printer_name = match.group(1)
-                        printer = Printer(printer_name=printer_name)
-                        printers.append({"printer_name": printer.name})
+                        printers.append({"printer_name": printer_name})
         except subprocess.CalledProcessError:
             printers = []
         return printers
Original file line number	Diff line number	Diff line change
`@@ -7,6 +7,8 @@ requires-python = ">=3.10"`
`7`	`7`	`dependencies = [`
`8`	`8`	`"fastmcp>=2.4.0",`
`9`	`9`	`"mss>=10.0.0",`
	`10`	`+ "numpy>=2.2.6",`
	`11`	`+ "pyaudio>=0.2.14",`
`10`	`12`	`"python-ffmpeg>=2.0.12",`
`11`	`13`	`"screeninfo>=0.8.1",`
`12`	`14`	`]`