feat: add Java support and example usage to README and new Java files (#74)

arthasking123 · web-flow · commit ec9f9e83579f · 2025-11-15T15:13:53.000+08:00
* feat: add Java support and example usage to README and new Java files

- Updated README.md to include Java usage section and updated platform support for Java.
- Added TestTenVad.java as an example of using the TEN VAD library in Java.
- Introduced TenVad.java as a Java wrapper for the TEN VAD native library, enabling voice activity detection in Java applications.

* refactor: enhance TenVad library with improved error handling and debug information

- Updated TenVad.java to use Pointer for vadHandle and improved library loading error messages.
- Refactored getLibraryPath method for better platform detection and library path management.
- Added printDebugInfo method to assist in diagnosing library loading issues.
- Modified TestTenVad.java to print debug information instead of library version.

* refactor: streamline TenVad implementation and enhance error handling

- Simplified the initialization of the VAD instance in TenVad.java by using the CLib interface for native method calls.
- Removed unnecessary debug information printing from TestTenVad.java.
- Improved error messages for VAD creation and processing failures.
- Updated library path retrieval logic for better clarity and maintainability.
diff --git a/README.md b/README.md
@@ -46,6 +46,7 @@
     - [Linux](#1-linux--macos--windows)
   - [JS Usage](#js-usage)
     - [Web](#1-web)
+  - [Java Usage](#java-usage)
   - [C Usage](#c-usage)
     - [Linux](#1-linux)
     - [Windows](#2-windows)
@@ -254,22 +255,22 @@ The project supports five major platforms with dynamic library linking.
     <th align="center"> Linux </th>
     <td align="center"> libten_vad.so </td>
     <td align="center"> x64 </td>
-    <td align="center"> Python, C </td>
-    <td rowspan="6">ten_vad.h <br> ten_vad.py <br> ten_vad.js</td>
+    <td align="center"> Python, C, Java </td>
+    <td rowspan="6">ten_vad.h <br> ten_vad.py <br> ten_vad.js <br> TenVad.java</td>
     <td>  </td>
   </tr>
   <tr>
     <th align="center"> Windows </th>
     <td align="center"> ten_vad.dll </td>
     <td align="center"> x64, x86 </td>
-    <td align="center"> C </td>
+    <td align="center"> C, Java </td>
     <td>  </td>
   </tr>
   <tr>
     <th align="center"> macOS </th>
     <td align="center"> ten_vad.framework </td>
     <td align="center"> arm64, x86_64 </td>
-    <td align="center"> C </td>
+    <td align="center"> C, Java </td>
     <td>  </td>
   </tr>
   <tr>
@@ -283,7 +284,7 @@ The project supports five major platforms with dynamic library linking.
     <th align="center"> Android </th>
     <td align="center"> libten_vad.so </td>
     <td align="center"> arm64-v8a, armeabi-v7a </td>
-    <td align="center"> C </td>
+    <td align="center"> C, Java </td>
     <td>  </td>
   </tr>
   <tr>
@@ -392,6 +393,83 @@ from ten_vad import TenVad
 
 <br>
 
+### **Java Usage**
+
+TEN VAD provides comprehensive Java support with JNI (Java Native Interface) bindings for all major platforms.
+
+#### **Requirements**
+
+- Java 8 or higher
+- Native libraries in `lib/` directory
+- JNI headers
+
+#### **Compilation**
+
+```bash
+# Compile Java source
+javac -cp . -d . include/TenVad.java examples/TestTenVad.java
+
+# Run example
+java -cp . -Djava.library.path=lib TestTenVad s0724-s0730.wav out.txt
+```
+
+#### **Example Code**
+
+```java
+import com.ten.vad.TenVad;
+
+public class VADExample {
+    public static void main(String[] args) {
+        // Create VAD instance
+        TenVad vad = new TenVad(256, 0.5f);
+        
+        // Process audio frame
+        short[] audioFrame = new short[256]; // 16ms at 16kHz
+        // ... fill audioFrame with audio data ...
+        
+        TenVad.VadResult result = vad.process(audioFrame);
+        System.out.println("Probability: " + result.getProbability());
+        System.out.println("Voice detected: " + result.isVoiceDetected());
+        
+        // Clean up
+        vad.destroy();
+    }
+}
+```
+
+#### **Platform-Specific Notes**
+
+- **Linux**: Requires `libc++1` package
+- **Windows**: Ensure Visual C++ Redistributable is installed
+- **macOS**: No additional requirements
+- **Android**: Use Android NDK for native library integration
+
+#### **API Reference**
+
+```java
+public class TenVad {
+    // Constructor
+    public TenVad(int hopSize, float threshold)
+    
+    // Process audio frame
+    public VadResult process(short[] audioData)
+    
+    // Get library version
+    public static String getVersion()
+    
+    // Cleanup
+    public void destroy()
+
+    public static class VadResult {
+        public float getProbability()    // [0.0, 1.0]
+        public int getFlag()            // 0 or 1
+        public boolean isVoiceDetected() // true if voice detected
+    }
+}
+```
+
+<br>
+
 ### **C Usage**
 
 #### **Build Scripts**
diff --git a/examples/TestTenVad.java b/examples/TestTenVad.java
@@ -0,0 +1,229 @@
+//
+// Copyright © 2025 Agora
+// This file is part of TEN Framework, an open source project.
+// Licensed under the Apache License, Version 2.0, with certain conditions.
+// Refer to the "LICENSE" file in the root directory for more information.
+//
+
+
+// import com.ten.vad.TenVad; // Uncomment when using package structure
+import javax.sound.sampled.*;
+import java.io.*;
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+
+/**
+ * Example usage of TEN VAD Java interface.
+ *
+ * This example demonstrates how to use the TEN VAD library in Java
+ * for voice activity detection: {@link #main} runs the detector over a WAV
+ * file, and {@link #processMicrophoneInput} shows a live capture loop.
+ *
+ * Usage: java TestTenVad <input_wav_file> <output_txt_file>
+ *
+ * @author TEN Framework Team
+ * @version 1.0
+ */
+public class TestTenVad {
+
+    /** Samples per frame: 256 samples is 16 ms at 16 kHz. */
+    private static final int HOP_SIZE = 256;
+
+    /** Threshold value passed to the TenVad constructor. */
+    private static final float THRESHOLD = 0.5f;
+
+    /**
+     * Command-line entry point: runs the detector over a WAV file.
+     *
+     * @param args input WAV path followed by output text path
+     */
+    public static void main(String[] args) {
+        if (args.length != 2) {
+            System.err.println("Usage: java TestTenVad <input_wav_file> <output_txt_file>");
+            System.exit(1);
+        }
+
+        String inputFile = args[0];
+        String outputFile = args[1];
+
+        try {
+            // Create VAD instance
+            TenVad vad = new TenVad(HOP_SIZE, THRESHOLD);
+            try {
+                System.out.println("TEN VAD initialized with hop_size=" + vad.getHopSize() +
+                                 ", threshold=" + vad.getThreshold());
+
+                // Load and process audio file
+                processAudioFile(vad, inputFile, outputFile);
+            } finally {
+                // Clean up even when processing fails. This cannot live in a
+                // finally on the outer try: System.exit() in the catch below
+                // would terminate the JVM before it ran.
+                vad.destroy();
+            }
+            System.out.println("Processing completed successfully!");
+
+        } catch (Exception e) {
+            System.err.println("Error: " + e.getMessage());
+            e.printStackTrace();
+            System.exit(1);
+        }
+    }
+
+    /**
+     * Process audio file and write VAD results to output file.
+     *
+     * Only whole frames of HOP_SIZE samples are processed; samples left over
+     * at the end of the file are ignored. Each result line is printed to
+     * standard output and written to the output file.
+     *
+     * @param vad        detector to run on every frame; not destroyed here
+     * @param inputFile  path of the WAV file to read
+     * @param outputFile path of the text file to write
+     * @throws IOException if reading the audio or writing the results fails
+     * @throws UnsupportedAudioFileException if the input is not a supported audio file
+     * @throws IllegalArgumentException if the audio is not 16 kHz, 16-bit, mono
+     */
+    private static void processAudioFile(TenVad vad, String inputFile, String outputFile)
+            throws IOException, UnsupportedAudioFileException {
+
+        AudioFormat format;
+        byte[] audioBytes;
+
+        // Load WAV file; try-with-resources closes the stream even when the
+        // format checks below throw.
+        try (AudioInputStream audioStream =
+                 AudioSystem.getAudioInputStream(new File(inputFile))) {
+            format = audioStream.getFormat();
+
+            // Verify audio format
+            if (format.getSampleRate() != 16000) {
+                throw new IllegalArgumentException("Audio sample rate must be 16kHz, got: " +
+                    format.getSampleRate());
+            }
+
+            if (format.getSampleSizeInBits() != 16) {
+                throw new IllegalArgumentException("Audio sample size must be 16-bit, got: " +
+                    format.getSampleSizeInBits());
+            }
+
+            if (format.getChannels() != 1) {
+                throw new IllegalArgumentException("Audio must be mono, got: " +
+                    format.getChannels() + " channels");
+            }
+
+            System.out.println("Audio format: " + format);
+
+            // Read audio data
+            ByteArrayOutputStream buffer = new ByteArrayOutputStream();
+            byte[] data = new byte[4096];
+            int bytesRead;
+
+            while ((bytesRead = audioStream.read(data)) != -1) {
+                buffer.write(data, 0, bytesRead);
+            }
+
+            audioBytes = buffer.toByteArray();
+        }
+
+        // Convert to short array
+        short[] audioSamples = bytesToShorts(audioBytes, format.isBigEndian());
+        System.out.println("Loaded " + audioSamples.length + " audio samples");
+
+        // Process audio in frames
+        int numFrames = audioSamples.length / HOP_SIZE;
+        System.out.println("Processing " + numFrames + " frames...");
+
+        try (PrintWriter writer = new PrintWriter(new FileWriter(outputFile))) {
+            for (int i = 0; i < numFrames; i++) {
+                // Extract frame
+                short[] frame = new short[HOP_SIZE];
+                System.arraycopy(audioSamples, i * HOP_SIZE, frame, 0, HOP_SIZE);
+
+                // Process frame
+                TenVad.VadResult result = vad.process(frame);
+
+                // Write result
+                String line = String.format("[%d] %.6f, %d", i,
+                    result.getProbability(), result.getFlag());
+                System.out.println(line);
+                writer.println(line);
+            }
+        }
+    }
+
+    /**
+     * Convert byte array to short array.
+     *
+     * @param bytes     raw sample bytes, two per sample; a trailing odd byte is dropped
+     * @param bigEndian true if each sample is stored most-significant byte first
+     * @return array of bytes.length / 2 samples
+     */
+    private static short[] bytesToShorts(byte[] bytes, boolean bigEndian) {
+        short[] shorts = new short[bytes.length / 2];
+        ByteBuffer.wrap(bytes).order(bigEndian ? ByteOrder.BIG_ENDIAN : ByteOrder.LITTLE_ENDIAN)
+                 .asShortBuffer().get(shorts);
+        return shorts;
+    }
+
+    /**
+     * Example of real-time audio processing from microphone.
+     *
+     * Captures 16 kHz, 16-bit, mono, little-endian audio and prints one result
+     * per frame. The loop has no exit condition; it ends only when the process
+     * is stopped or an exception is thrown. Errors are reported on standard
+     * error rather than propagated.
+     */
+    public static void processMicrophoneInput() {
+        TenVad vad = null;
+        try {
+            vad = new TenVad(HOP_SIZE, THRESHOLD);
+
+            // Set up audio capture
+            AudioFormat format = new AudioFormat(16000, 16, 1, true, false);
+            DataLine.Info info = new DataLine.Info(TargetDataLine.class, format);
+
+            if (!AudioSystem.isLineSupported(info)) {
+                System.err.println("Microphone input not supported");
+                return;
+            }
+
+            // try-with-resources closes the capture line if the loop fails
+            try (TargetDataLine line = (TargetDataLine) AudioSystem.getLine(info)) {
+                line.open(format);
+                line.start();
+
+                System.out.println("Recording from microphone... Press Ctrl+C to stop");
+
+                byte[] buffer = new byte[HOP_SIZE * 2]; // 16-bit samples
+                short[] frame = new short[HOP_SIZE];
+
+                while (true) {
+                    int bytesRead = line.read(buffer, 0, buffer.length);
+                    if (bytesRead == buffer.length) {
+                        // Convert to short array
+                        ByteBuffer.wrap(buffer).order(ByteOrder.LITTLE_ENDIAN)
+                                 .asShortBuffer().get(frame);
+
+                        // Process frame
+                        TenVad.VadResult result = vad.process(frame);
+
+                        // Print result
+                        System.out.printf("VAD: %.3f, %s%n",
+                            result.getProbability(),
+                            result.isVoiceDetected() ? "VOICE" : "SILENCE");
+                    }
+                }
+            }
+
+        } catch (Exception e) {
+            System.err.println("Error in microphone processing: " + e.getMessage());
+            e.printStackTrace();
+        } finally {
+            // Release the detector on every exit path, including the early return
+            if (vad != null) {
+                vad.destroy();
+            }
+        }
+    }
+}
diff --git a/include/TenVad.java b/include/TenVad.java