노현욱

feat: things

import pyaudio
import numpy as np

# Define constants
CHUNK_SIZE = 1024        # Number of audio frames per buffer
FORMAT = pyaudio.paInt16 # Audio format (16-bit int)
CHANNELS = 1             # Mono audio
RATE = 44100             # Sample rate (Hz)
RMS_REF = 1.0            # Reference RMS amplitude for dB calculation

# Initialize PyAudio stream
audio = pyaudio.PyAudio()
stream = audio.open(format=FORMAT, channels=CHANNELS, rate=RATE, input=True, frames_per_buffer=CHUNK_SIZE)

# Main loop
while True:
    # Read audio data from stream
    data = stream.read(CHUNK_SIZE)
    # Convert audio data to numpy array
    audio_array = np.frombuffer(data, dtype=np.int16)
    # Calculate RMS amplitude (in float to avoid int16 overflow when squaring)
    rms = np.sqrt(np.mean(np.square(audio_array.astype(np.float64))))
    # Calculate dB levels, guarding against log10(0)
    avg_db = 20 * np.log10(rms / RMS_REF) if rms > 0 else float("-inf")
    peak = np.max(np.abs(audio_array))
    max_db = 20 * np.log10(peak / RMS_REF) if peak > 0 else float("-inf")
    # Print dB level to console (NaN != NaN is always True, so np.isnan is required)
    if not np.isnan(avg_db) and not np.isnan(max_db) and max_db > 50:
        print("dB level:", int(avg_db), int(max_db))
"""PyAudio Example: Audio wire between input and output. Callback version."""
import time
import sys
import pyaudio
import numpy as np
DURATION = 5 # seconds
delay_buffer = np.zeros((44100, 2), dtype=np.float32)
def callback(in_data, frame_count, time_info, status):
global delay_buffer
audio_data = np.frombuffer(in_data, dtype=np.float32).reshape(frame_count, 2)
delayed_data = np.concatenate((delay_buffer, audio_data))
delay_buffer = delayed_data[frame_count:]
return (audio_data + 0.5 * delay_buffer).tobytes(), pyaudio.paContinue
p = pyaudio.PyAudio()
stream = p.open(format=p.get_format_from_width(2),
channels=1,
rate=44100,
input=True,
output=True,
frames_per_buffer=1024,
stream_callback=callback)
start = time.time()
while stream.is_active() and (time.time() - start) < DURATION:
time.sleep(0.1)
stream.close()
p.terminate()
import time

import pyaudio
import numpy as np
import scipy.signal as signal

# Parameters
RATE = 44100     # Sampling rate (Hz)
CHUNK = 1024     # Number of samples to read per buffer
THRESHOLD = 256  # Threshold for peak detection
WIN_SIZE = 1024  # Window size for the STFT
HOP_SIZE = 512   # Hop between STFT windows (overlap size)

# Create the PyAudio object
p = pyaudio.PyAudio()

# Callback definition
def process_audio(in_data, frame_count, time_info, status):
    # Convert the raw bytes to an int16 array
    data = np.frombuffer(in_data, dtype=np.int16)
    # Run the STFT
    f, t, Zxx = signal.stft(data, RATE, nperseg=WIN_SIZE, noverlap=HOP_SIZE)
    # Detect peaks in the time-averaged magnitude spectrum
    peaks, _ = signal.find_peaks(np.abs(np.mean(Zxx, axis=1)), height=THRESHOLD, distance=WIN_SIZE)
    # Estimate parameters from the first peak, if any
    if len(peaks) > 0:
        peak_idx = peaks[0]                      # Take the first peak
        height = np.abs(Zxx[peak_idx, 0])        # Estimated peak height
        freq = f[peak_idx]                       # Estimated peak frequency
        amp = np.max(np.abs(data))               # Estimated signal amplitude
        progress = (peak_idx + HOP_SIZE) / RATE  # Estimated duration of the impact sound
        # Print the results
        print("Height: {:.2f}, Frequency: {:.2f}, Amplitude: {:.2f}, Progress: {:.2f}".format(height, freq, amp, progress))
    # Pass the input through unchanged
    return (in_data, pyaudio.paContinue)

# Open the input stream
stream = p.open(format=p.get_format_from_width(2),
                channels=1,
                rate=RATE,
                input=True,
                output=True,
                frames_per_buffer=CHUNK,
                stream_callback=process_audio
                )

# Start the stream
stream.start_stream()

# Wait until the stream stops
while stream.is_active():
    time.sleep(0.1)

# Close the stream and the PyAudio object
stream.stop_stream()
stream.close()
p.terminate()
import sys
import time

import numpy as np
import pyaudio

RECORD_SECONDS = 5
CHUNK = 128
RATE = 44100
DELAY = 0.1  # Delay time in seconds
GAIN = 1     # Echo gain (0 to 1)

# Create buffer for delayed audio data
buffer_size = int(RATE * DELAY)
buffer = np.zeros(buffer_size, dtype=np.int16)

def add_echo(in_data, frame_count, time_info, status_flags):
    global buffer
    data = np.frombuffer(in_data, dtype=np.int16)
    # Mix the delayed samples into the current block in int32, then clip,
    # to avoid int16 wrap-around on loud input
    output = data.astype(np.int32) + (GAIN * buffer[:len(data)]).astype(np.int32)
    output = np.clip(output, -32768, 32767)
    # Shift the delay line and append the current block at the end
    buffer = np.roll(buffer, len(data))
    buffer[-len(data):] = data
    return (output.astype(np.int16).tobytes(), pyaudio.paContinue)

p = pyaudio.PyAudio()
stream = p.open(format=p.get_format_from_width(2),
                channels=1 if sys.platform == 'darwin' else 2,
                rate=RATE,
                input=True,
                output=True,
                frames_per_buffer=CHUNK,
                stream_callback=add_echo
                )

print('* recording')
stream.start_stream()

while stream.is_active():
    # Do other processing here if necessary
    time.sleep(0.1)

stream.stop_stream()
stream.close()
p.terminate()
task_list = []

def display_menu():
    print("Task Manager")
    print("1. Add task")
    print("2. View tasks")
    print("3. Mark task complete")
    print("4. Quit")

def add_task():
    title = input("Enter task title: ")
    description = input("Enter task description: ")
    status = "in progress"
    task = {"title": title, "description": description, "status": status}
    task_list.append(task)
    print("Task added.")

def view_tasks():
    if not task_list:
        print("The task list is empty.")
    else:
        print()
        print("Task list:")
        print("----------------")
        for task in task_list:
            print(f"Title: {task['title']}")
            print(f"Description: {task['description']}")
            print(f"Status: {task['status']}")
            print("----------------")

def mark_task_complete():
    if not task_list:
        print("The task list is empty.")
        return
    title = input("Enter the title of the task to mark complete: ")
    for task in task_list:
        if task['title'] == title:
            task['status'] = "complete"
            print("Task marked complete.")
            return
    print("No task found matching that title.")

while True:
    display_menu()
    choice = input("Choice: ")
    if choice == "1":
        add_task()
    elif choice == "2":
        view_tasks()
    elif choice == "3":
        mark_task_complete()
    elif choice == "4":
        print("Exiting the program.")
        break
    else:
        print("Please enter a valid option.")
    print()
import pyaudio
from pydub import AudioSegment
from pydub.effects import normalize

# set up PyAudio
pa = pyaudio.PyAudio()
stream = pa.open(format=pyaudio.paInt16,
                 channels=1,
                 rate=44100,
                 input=True,
                 frames_per_buffer=1024)

# record five seconds of audio from the microphone
audio_data = []
for i in range(0, int(44100 / 1024 * 5)):
    data = stream.read(1024)
    audio_data.append(data)

# convert the audio data to a PyDub audio segment
audio_segment = AudioSegment(
    data=b''.join(audio_data),
    sample_width=2,
    frame_rate=44100,
    channels=1
)

# normalize the audio segment
normalized_segment = normalize(audio_segment)

# save the output audio file (MP3 export requires ffmpeg to be installed)
normalized_segment.export("output.mp3", format="mp3")

# clean up
stream.stop_stream()
stream.close()
pa.terminate()
import sys
import time

import numpy as np
import pyaudio
import librosa

RECORD_SECONDS = 5
CHUNK = 1024
RATE = 44100
DELAY = 0.1      # Delay time in seconds
GAIN = 1         # Echo gain (0 to 1)
MAX_FREQ = 3000  # Upper bound used to normalize the dominant frequency

# Create buffer for delayed audio data
buffer_size = int(RATE * DELAY)
buffer = np.zeros(buffer_size, dtype=np.int16)

def add_echo(in_data, frame_count, time_info, status_flags):
    global buffer
    data = np.frombuffer(in_data, dtype=np.int16)

    def get_max_average_db(data):
        data_float = data.astype(np.float32)
        # Compute the power spectrogram of the data
        S = librosa.stft(data_float, n_fft=2048, hop_length=512)
        S_power = np.abs(S)**2
        # Convert power spectrogram to dB scale
        S_dB = librosa.amplitude_to_db(S_power, ref=np.max)
        # Calculate the average and maximum dB levels
        avg_dB = np.mean(S_dB)
        max_dB = np.max(S_dB)
        return avg_dB, max_dB

    def get_dominant_freq(data):
        data = data.astype(np.float32) / 32768.0
        # Compute the power spectrogram on the mel scale
        S = librosa.feature.melspectrogram(y=data, sr=RATE, n_fft=2048, hop_length=1024)
        # Center frequency (Hz) of each mel bin
        mel_freqs = librosa.mel_frequencies(n_mels=S.shape[0], fmax=RATE / 2)
        # Find the mel bin with the maximum energy in each frame
        max_bin = np.argmax(S, axis=0)
        # Map each frame's strongest bin to its frequency
        dominant_freqs = mel_freqs[max_bin]
        # Take the median across frames as the overall dominant frequency
        dominant_freq = np.median(dominant_freqs)
        return dominant_freq

    freq = get_dominant_freq(data)
    avg_db, max_db = get_max_average_db(data)
    print(int(freq), int(avg_db), int(max_db))
    # Scale the echo gain with the dominant frequency
    output = data + freq / MAX_FREQ * buffer[:len(data)]
    buffer = np.roll(buffer, len(data))
    buffer[-len(data):] = data
    return (output.astype(np.int16).tobytes(), pyaudio.paContinue)

p = pyaudio.PyAudio()
stream = p.open(format=p.get_format_from_width(2),
                channels=1 if sys.platform == 'darwin' else 2,
                rate=RATE,
                input=True,
                output=True,
                frames_per_buffer=CHUNK,
                stream_callback=add_echo
                )

print('* recording')
stream.start_stream()

while stream.is_active():
    # Do other processing here if necessary
    time.sleep(0.1)

stream.stop_stream()
stream.close()
p.terminate()
import numpy as np
import pyaudio
import time

pa = pyaudio.PyAudio()

# One second of mono float32 samples used as the delay line
delay_buffer = np.zeros((44100, 1), dtype=np.float32)

def callback(in_data, frame_count, time_info, status):
    global delay_buffer
    audio_data = np.frombuffer(in_data, dtype=np.float32).reshape(frame_count, 1)
    delayed_data = np.concatenate((delay_buffer, audio_data))
    delay_buffer = delayed_data[frame_count:]
    # Slice the delay line to the block size so the shapes broadcast
    return (audio_data + 0.5 * delay_buffer[:frame_count]).tobytes(), pyaudio.paContinue

stream = pa.open(format=pyaudio.paFloat32,
                 channels=1,
                 rate=44100,             # sample rate (Hz); was swapped with frames_per_buffer
                 input=True,
                 output=True,
                 frames_per_buffer=1024,
                 stream_callback=callback)

start = time.time()
DURATION = 30
# keep the stream running for a few seconds
while stream.is_active() and (time.time() - start) < DURATION:
    time.sleep(0.1)

stream.stop_stream()
stream.close()
pa.terminate()
import sys
import threading

import numpy as np
import pyaudio
import librosa

# Write directly to stdout so each message from a worker thread goes out as a single write
print = sys.stdout.write

# Define constants for audio parameters
FORMAT = pyaudio.paFloat32
CHANNELS = 1
RATE = 44100
FRAMES_PER_BUFFER = 1024
DELAY = 0.1
GAIN = 0.5

# Open an audio stream
stream = pyaudio.PyAudio().open(format=FORMAT, channels=CHANNELS, rate=RATE, input=True, frames_per_buffer=FRAMES_PER_BUFFER)

sound = []

def get_stream_data():
    global sound
    # Read five buffers at once, without raising on input overflow
    sound.append(stream.read(FRAMES_PER_BUFFER * 5, False))

get_stream_data()

# Create buffer for delayed audio data (note: add_echo is never registered as a callback here)
buffer_size = int(RATE * DELAY)
buffer = np.zeros(buffer_size, dtype=np.int16)

def add_echo(in_data, frame_count, time_info, status_flags):
    global buffer
    data = np.frombuffer(in_data, dtype=np.int16)
    output = data + GAIN * buffer[:len(data)]
    buffer = np.roll(buffer, len(data))
    buffer[-len(data):] = data
    return (output.astype(np.int16).tobytes(), pyaudio.paContinue)

def get_max_average_db():
    global sound
    data = sound[-1]
    # Convert data to numpy array
    data_float = np.frombuffer(data, dtype=np.float32)
    # Compute the power spectrogram of the data
    S = librosa.stft(data_float, n_fft=2048, hop_length=512)
    S_power = np.abs(S)**2
    # Convert power spectrogram to dB scale
    S_dB = librosa.amplitude_to_db(S_power, ref=np.max)
    # Calculate the average dB level
    avg_dB = np.mean(S_dB)
    print("Average dB: {:.2f}".format(avg_dB) + " " + "Max dB: {:.2f}".format(np.max(S_dB)) + "\n")

def print_dominant_freq():
    global sound
    data = sound[-1]
    # Convert data to numpy array
    data = np.frombuffer(data, dtype=np.float32)
    # Compute the power spectrogram on the mel scale
    S = librosa.feature.melspectrogram(y=data, sr=RATE, n_fft=2048, hop_length=1024, n_mels=512)
    # Center frequency (Hz) of each mel bin
    freqs = librosa.mel_frequencies(n_mels=S.shape[0], fmax=RATE / 2)
    # Find the frequency bin with the maximum energy in each frame
    max_bin = np.argmax(S, axis=0)
    # Find the dominant frequency in each frame
    dominant_freqs = freqs[max_bin]
    # Compute the median of the dominant frequencies to get the overall dominant frequency
    dominant_freq = np.median(dominant_freqs)
    print("Dominant frequency: {:.2f} Hz\n".format(dominant_freq))

threading.Thread(target=get_stream_data).start()
while True:
    get_data = threading.Thread(target=get_stream_data)
    calc_data = threading.Thread(target=print_dominant_freq)
    #get_decibel = threading.Thread(target=get_max_average_db)
    get_data.start()
    calc_data.start()
    #get_decibel.start()
    get_data.join()
    sys.stdout.flush()
Try writing the scenario first. -> Make the output follow the striking sound.
Based on the scenario, work out more ways to reduce the delay (see the sketch below).
For the sound-distortion method, pick whatever looks fun.
Also try attaching a directional microphone.
1. Build something with real-time sound transformation
- decide whether the original sound should remain audible or not
2. Do identification only, and optionally play back a different sound.
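
A minimal sketch of one way to cut the perceived delay, assuming the PyAudio callback setup used in the files above: shrink frames_per_buffer so each block spends less time queued between input and output. The 256-frame value below is illustrative, not measured.

import pyaudio

# Smaller buffers lower the round-trip latency at the cost of more callbacks
# per second and a higher risk of glitches; 256 frames at 44100 Hz is ~5.8 ms.
CHUNK = 256   # illustrative value; tune per machine
RATE = 44100

def passthrough(in_data, frame_count, time_info, status):
    # Send the input straight back to the output with no processing
    return in_data, pyaudio.paContinue

p = pyaudio.PyAudio()
stream = p.open(format=pyaudio.paInt16,
                channels=1,
                rate=RATE,
                input=True,
                output=True,
                frames_per_buffer=CHUNK,  # the knob that controls buffering delay
                stream_callback=passthrough)

stream.start_stream()
input("Press Enter to stop...")
stream.stop_stream()
stream.close()
p.terminate()

The buffering the driver actually reports can be checked with stream.get_input_latency() and stream.get_output_latency().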
import sys
import numpy as np
import pyaudio
import matplotlib.pyplot as plt
RECORD_SECONDS = 5
CHUNK = 1024
@@ -16,15 +17,54 @@ stream = p.open(format=p.get_format_from_width(2),
print('* recording')

# Initialize plot
fig, ax = plt.subplots()
x = np.arange(0, RECORD_SECONDS, CHUNK / RATE)
line, = ax.plot(x, np.zeros(len(x)))

def add_echo(data, output_stream):
    # Despite the name, this simply writes the input back to the output stream
    output_stream.write(data)

# Initialize data arrays
db_data = np.zeros(len(x))

for i in range(0, int(RATE / CHUNK * RECORD_SECONDS)):
    # Read one chunk, play it back, and analyze the same samples
    byte_stream = stream.read(CHUNK)
    add_echo(byte_stream, stream)
    data = np.frombuffer(byte_stream, dtype=np.int16)
    fft_data = np.fft.fft(data)
    # Frequency band of interest
    freq_range = (200, 2000)  # 200 Hz ~ 2 kHz
    # Extract that band from the frequency spectrum
    bin_width = RATE // len(data)
    lo, hi = freq_range[0] // bin_width, freq_range[1] // bin_width
    freq_spectrum = fft_data[lo:hi]
    # Compute the energy in the band
    energy = np.sum(np.abs(freq_spectrum)**2)
    # Convert the energy to a dB level
    db = 10 * np.log10(energy)
    # Find the dominant frequency in the band (offset by the band's start bin)
    max_freq = ((np.argmax(np.abs(freq_spectrum)) + lo) * RATE) / len(data)
    print("freq : ", max_freq)
    print("db : ", db)
    # Add data to arrays
    db_data = np.roll(db_data, -1)
    db_data[-1] = db
    # Update plot
    line.set_ydata(db_data)
    ax.relim()
    ax.autoscale_view()
    plt.draw()
    plt.pause(0.001)

print('* done')

stream.stop_stream()
stream.close()
p.terminate()

# Show plot
plt.show()