-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathAudioProcessor.java
148 lines (122 loc) · 5.63 KB
/
AudioProcessor.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
import org.bytedeco.javacv.*;
import org.bytedeco.ffmpeg.avcodec.*;
import org.bytedeco.ffmpeg.avformat.*;
import org.bytedeco.ffmpeg.avutil.*;
import org.bytedeco.ffmpeg.swresample.*;
import java.util.ArrayList;
import java.util.List;
import java.util.stream.IntStream;
import java.util.stream.Collectors;
import static org.bytedeco.ffmpeg.global.avcodec.*;
import static org.bytedeco.ffmpeg.global.avformat.*;
import static org.bytedeco.ffmpeg.global.avutil.*;
import static org.bytedeco.ffmpeg.global.swresample.*;
public class AudioProcessor {
public static void main(String[] args) {
try {
String mp3File = "input.mp3";
List<Double> audioSamples = new ArrayList<>();
// Initialize FFmpeg
av_log_set_level(AV_LOG_QUIET);
AVFormatContext formatContext = new AVFormatContext(null);
if (avformat_open_input(formatContext, mp3File, null, null) < 0) {
throw new IllegalArgumentException("Could not open file: " + mp3File);
}
if (avformat_find_stream_info(formatContext, (AVDictionary) null) < 0) {
throw new RuntimeException("Could not find stream information");
}
// Find the audio stream
int audioStreamIndex = -1;
AVCodecContext codecContext = null;
for (int i = 0; i < formatContext.nb_streams(); i++) {
AVStream stream = formatContext.streams(i);
AVCodecParameters codecParams = stream.codecpar();
if (codecParams.codec_type() == AVMEDIA_TYPE_AUDIO) {
audioStreamIndex = i;
AVCodec codec = avcodec_find_decoder(codecParams.codec_id());
codecContext = avcodec_alloc_context3(codec);
avcodec_parameters_to_context(codecContext, codecParams);
avcodec_open2(codecContext, codec, (AVDictionary) null);
break;
}
}
if (audioStreamIndex == -1) {
throw new RuntimeException("No audio stream found");
}
// Read audio packets
AVPacket packet = av_packet_alloc();
AVFrame frame = av_frame_alloc();
while (av_read_frame(formatContext, packet) >= 0) {
if (packet.stream_index() == audioStreamIndex) {
int ret = avcodec_send_packet(codecContext, packet);
while (ret >= 0) {
ret = avcodec_receive_frame(codecContext, frame);
if (ret == AVERROR_EOF || ret == AVERROR_EAGAIN())
break;
// Convert samples to doubles
for (int i = 0; i < frame.nb_samples(); i++) {
// Assuming 16-bit audio, adjust if different
short sample = frame.data(0).getShort(i * 2);
audioSamples.add(sample / 32768.0);
}
}
}
av_packet_unref(packet);
}
// Process audio with moving average
int windowSize = 100;
List<Double> processedSamples = movingAverage(audioSamples, windowSize);
// Print statistics
System.out.println("Original samples: " + audioSamples.size());
System.out.println("Processed samples: " + processedSamples.size());
// Clean up
av_frame_free(frame);
av_packet_free(packet);
avcodec_free_context(codecContext);
avformat_close_input(formatContext);
} catch (Exception e) {
e.printStackTrace();
}
}
private static List<Double> movingAverage(List<Double> input, int windowSize) {
return IntStream.range(0, input.size() - windowSize + 1)
.mapToDouble(i -> input.subList(i, i + windowSize)
.stream()
.mapToDouble(Double::doubleValue)
.average()
.orElse(0.0))
.boxed()
.collect(Collectors.toList());
}
public static void recordFromMicrophone(String outputFile, int durationSeconds) {
try (FFmpegFrameGrabber grabber = new FFmpegFrameGrabber("default")) {
// Set up audio grabber
grabber.setFormat("avfoundation"); // Use avfoundation for macOS
grabber.setSampleRate(44100);
grabber.setAudioChannels(2);
grabber.start();
// Set up recorder
FFmpegFrameRecorder recorder = new FFmpegFrameRecorder(outputFile, 2);
recorder.setFormat("mp3");
recorder.setSampleRate(44100);
recorder.setAudioChannels(2);
recorder.setAudioQuality(0); // Highest quality
recorder.setAudioCodec(AV_CODEC_ID_MP3);
recorder.start();
// Record for specified duration
long startTime = System.currentTimeMillis();
while ((System.currentTimeMillis() - startTime) < (durationSeconds * 1000)) {
Frame frame = grabber.grab();
if (frame != null && frame.samples != null) {
recorder.record(frame);
}
}
// Clean up
recorder.stop();
recorder.release();
} catch (Exception e) {
System.err.println("Error recording audio: " + e.getMessage());
e.printStackTrace();
}
}
}