backup

khu
Commit b567b00ea7261408e453f969d642b53b8b5415f4 b567b00e 0 parents
Showing 23 changed files with 674 additions and 0 deletions
2018-08-13_Untitled.mp4
CapsNet
FFT연습/FFT.ipynb
FFT연습/FFT_for_analyize_data.ipynb
FFT연습/FFT_readfrom_WAV.ipynb
FFT연습/FFT_wavefile_temp1.ipynb
FFT연습/Kaggle_sound_tutorial.ipynb
FFT연습/Realtime_saveWAV.ipynb
FFT연습/fft연습.ipynb
FFT연습/realtime FFT.ipynb
FFT연습/trash.ipynb
SUBSTRACT_MEAN_VERSION+Make_spectogram+save_to_csv.ipynb
Untitled.ipynb
VANILA+Training_model.ipynb
VANILA_+Make_spectogram+save_to_csv.ipynb
VANILA_EVALUATE.ipynb
VANILA_TEST.ipynb
VANILA_VERSION+Make_spectogram+save_to_csv.ipynb
Various_Spectograms.ipynb
badch_testset_blankresults.csv
--- a/2018-08-13_Untitled.mp4 0 → 100644
View file @b567b00
+++ b/2018-08-13_Untitled.mp4 0 → 100644
View file @b567b00
--- a/CapsNet @ 7d884474
+++ b/CapsNet @ 7d884474
+Subproject commit 7d8844740c119ae66576be9510474a791240a745
--- a/FFT연습/FFT.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/FFT.ipynb 0 → 100644
View file @b567b00
--- a/FFT연습/FFT_for_analyize_data.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/FFT_for_analyize_data.ipynb 0 → 100644
View file @b567b00
--- a/FFT연습/FFT_readfrom_WAV.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/FFT_readfrom_WAV.ipynb 0 → 100644
View file @b567b00
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import matplotlib.pyplot as plt\n",
+    "from scipy.fftpack import fft\n",
+    "from scipy.io import wavfile # get the api"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [
+    {
+     "ename": "TypeError",
+     "evalue": "'numpy.int16' object is not iterable",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mTypeError\u001b[0m                                 Traceback (most recent call last)",
+      "\u001b[0;32m<ipython-input-4-c176e6e452f3>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[1;32m      1\u001b[0m \u001b[0mfs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdata\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mwavfile\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'1.wav'\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m# load the data\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      2\u001b[0m \u001b[0ma\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mT\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;31m# this is a two channel soundtrack, I get the first track\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 3\u001b[0;31m \u001b[0mb\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mele\u001b[0m\u001b[0;34m/\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m**\u001b[0m\u001b[0;36m8.\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m-\u001b[0m\u001b[0;36m1\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mele\u001b[0m \u001b[0;32min\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;31m# this is 8-bit track, b is now normalized on [-1,1)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      4\u001b[0m \u001b[0mc\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mfft\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mb\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m# calculate fourier transform (complex numbers list)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      5\u001b[0m \u001b[0md\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mc\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m/\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m)\u001b[0m  \u001b[0;31m# you only need half of the fft list (real signal symmetry)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
+      "\u001b[0;31mTypeError\u001b[0m: 'numpy.int16' object is not iterable"
+     ]
+    }
+   ],
+   "source": [
+    "# Load a WAV file, take its first channel, and plot the magnitude spectrum.\n",
+    "fs, data = wavfile.read('1.wav') # load the data (fs: sample rate, data: samples)\n",
+    "# wavfile.read returns a 1-D array for mono files and an (n_samples, n_channels)\n",
+    "# array otherwise. Indexing data.T[0] on a mono file yields a single scalar sample,\n",
+    "# which is what made the list comprehension fail with 'object is not iterable'.\n",
+    "a = data if data.ndim == 1 else data[:, 0] # first (or only) channel\n",
+    "# Normalize to [-1, 1) according to the sample type instead of assuming 8-bit data.\n",
+    "bits = 8 * a.dtype.itemsize\n",
+    "if a.dtype.kind == 'u': # unsigned PCM (8-bit WAV): [0, 2**bits) -> [-1, 1)\n",
+    "    b = (a / 2.0**bits) * 2 - 1\n",
+    "elif a.dtype.kind == 'i': # signed PCM: [-2**(bits-1), 2**(bits-1)) -> [-1, 1)\n",
+    "    b = a / 2.0**(bits - 1)\n",
+    "else: # floating-point samples are used as stored\n",
+    "    b = a\n",
+    "c = fft(b) # calculate fourier transform (complex numbers array)\n",
+    "d = len(c) // 2  # you only need half of the fft list (real signal symmetry)\n",
+    "plt.plot(abs(c[:(d-1)]),'r')\n",
+    "plt.show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# TODO: learn how to print/inspect the contents of a WAV file\n",
+    "# (channels: 1 if mono, 2 if stereo)\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
--- a/FFT연습/FFT_wavefile_temp1.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/FFT_wavefile_temp1.ipynb 0 → 100644
View file @b567b00
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import math\n",
+    "import struct\n",
+    "import sys\n",
+    "import wave\n",
+    "\n",
+    "import numpy as np\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "ename": "ValueError",
+     "evalue": "invalid literal for int() with base 10: '/run/user/1000/jupyter/kernel-6454a929-4509-4b51-949d-f1c910f7ce09.json'",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
+      "\u001b[0;32m<ipython-input-3-cc8beb2556b6>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[1;32m      3\u001b[0m \u001b[0msample_rate\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mfp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgetframerate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m \u001b[0mtotal_num_samps\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mfp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgetnframes\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 5\u001b[0;31m \u001b[0mfft_length\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msys\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0margv\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      6\u001b[0m \u001b[0mnum_fft\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mtotal_num_samps\u001b[0m \u001b[0;34m/\u001b[0m \u001b[0mfft_length\u001b[0m \u001b[0;34m)\u001b[0m \u001b[0;34m-\u001b[0m \u001b[0;36m2\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
+      "\u001b[0;31mValueError\u001b[0m: invalid literal for int() with base 10: '/run/user/1000/jupyter/kernel-6454a929-4509-4b51-949d-f1c910f7ce09.json'"
+     ]
+    }
+   ],
+   "source": [
+    "# Open the WAV file and read its basic parameters.\n",
+    "fp = wave.open('birdsound.wav',\"rb\")\n",
+    "sample_rate = fp.getframerate()\n",
+    "total_num_samps = fp.getnframes()\n",
+    "# The FFT length was taken from the command line (sys.argv[2]). Inside a Jupyter\n",
+    "# kernel that slot holds the kernel connection-file path, so int() raised\n",
+    "# ValueError. Fall back to a default when the argument is missing or not an integer.\n",
+    "DEFAULT_FFT_LENGTH = 256  # NOTE(review): fallback chosen here; adjust as needed\n",
+    "try:\n",
+    "    fft_length = int(sys.argv[2])\n",
+    "except (IndexError, ValueError):\n",
+    "    fft_length = DEFAULT_FFT_LENGTH\n",
+    "# Integer division: num_fft is used below as a loop bound and an array dimension,\n",
+    "# and '/' would produce a float under Python 3.\n",
+    "num_fft = (total_num_samps // fft_length) - 2"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Create the temporary work array: one row of fft_length samples per FFT frame.\n",
+    "# zeros/Float were not defined in this notebook (presumably names from the legacy\n",
+    "# Numeric package - confirm); the NumPy equivalents are used instead.\n",
+    "temp = np.zeros((num_fft, fft_length), float)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Read the data from the file, one FFT frame per row of temp.\n",
+    "for i in range(num_fft):\n",
+    "    tempb = fp.readframes(fft_length)\n",
+    "    # The 'B' format unpacks fft_length unsigned bytes; subtracting 128 centres them on zero.\n",
+    "    # NOTE(review): this assumes one byte per frame (8-bit mono) - confirm for the input file.\n",
+    "    temp[i,:] = np.array(struct.unpack(\"%dB\"%(fft_length), tempb), float) - 128.0\n",
+    "fp.close()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Window the data: multiply every frame (row) by a Hamming window.\n",
+    "temp = temp * np.hamming(fft_length)\n",
+    "\n",
+    "# Transform with a real-input FFT and convert the magnitude to a log scale.\n",
+    "# The 1e-20 offset keeps log10 away from zero. The original line was missing a\n",
+    "# closing parenthesis and used hamming/log10/real_fft, which were never imported.\n",
+    "freq_pwr  = 10*np.log10(1e-20+np.abs(np.fft.rfft(temp,fft_length)))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# 결과를 도표하라\n",
+    "n_out_pts = (fft_length / 2) + 1\n",
+    "y_axis = 0.5*float(sample_rate) / n_out_pts * \\\n",
+    "         arange(n_out_pts)\n",
+    "x_axis = (total_num_samps / float(sample_rate)) / \\\n",
+    "         num_fft * arange(num_fft)\n",
+    "setvar(\"X\",\"Time (sec)\")\n",
+    "setvar(\"Y\",\"Frequency (Hertz)\")\n",
+    "conshade(freq_pwr,x_axis,y_axis)\n",
+    "disfin()"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
--- a/FFT연습/Kaggle_sound_tutorial.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/Kaggle_sound_tutorial.ipynb 0 → 100644
View file @b567b00
--- a/FFT연습/Realtime_saveWAV.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/Realtime_saveWAV.ipynb 0 → 100644
View file @b567b00
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import wave\n",
+    "import pyaudio"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def play_file(fname):\n",
+    "    \"\"\"Play the WAV file at fname on a PyAudio output stream.\n",
+    "\n",
+    "    The file is read and written to the stream in chunks of 1024 frames until\n",
+    "    the end of the file is reached. The stream, the PyAudio session and the\n",
+    "    file are released even if playback fails.\n",
+    "    \"\"\"\n",
+    "    chunk = 1024  # frames read from the file per write to the stream\n",
+    "\n",
+    "    # Open the file that was asked for (the name was previously hard-coded to\n",
+    "    # 'output.wav', so the fname argument was ignored).\n",
+    "    wf = wave.open(fname, 'rb')\n",
+    "    p = pyaudio.PyAudio()\n",
+    "    try:\n",
+    "        # Open an output stream whose format matches the WAV file.\n",
+    "        stream = p.open(format=p.get_format_from_width(wf.getsampwidth()),\n",
+    "                        channels=wf.getnchannels(),\n",
+    "                        rate=wf.getframerate(),\n",
+    "                        output=True)\n",
+    "        try:\n",
+    "            # readframes() returns bytes and b'' at end of file. The old test\n",
+    "            # `data != ''` compared bytes with str, which is always true in\n",
+    "            # Python 3, so the loop never terminated.\n",
+    "            data = wf.readframes(chunk)\n",
+    "            while data:\n",
+    "                stream.write(data)\n",
+    "                data = wf.readframes(chunk)\n",
+    "        finally:\n",
+    "            stream.stop_stream()\n",
+    "            stream.close()\n",
+    "    finally:\n",
+    "        p.terminate()\n",
+    "        wf.close()\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "play_file('output.wav')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
--- a/FFT연습/fft연습.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/fft연습.ipynb 0 → 100644
View file @b567b00
--- a/FFT연습/realtime FFT.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/realtime FFT.ipynb 0 → 100644
View file @b567b00
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "    import numpy as np\n",
+    "    import pylab\n",
+    "    import matplotlib.pyplot as plt\n",
+    "    from scipy.io import wavfile\n",
+    "    import time\n",
+    "    import sys\n",
+    "    import seaborn as sns\n",
+    "    import pyaudio"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "\n",
+    "# Two stacked axes: raw audio on top, its spectrum below.\n",
+    "f,ax = plt.subplots(2)\n",
+    "\n",
+    "# Prepare the Plotting Environment with random starting values\n",
+    "x = np.arange(10000)\n",
+    "y = np.random.randn(10000)\n",
+    "\n",
+    "# Plot 0 is for raw audio data\n",
+    "li, = ax[0].plot(x, y)\n",
+    "ax[0].set_xlim(0,1000)\n",
+    "ax[0].set_ylim(-5000,5000)\n",
+    "ax[0].set_title(\"Raw Audio Signal\")\n",
+    "# Plot 1 is for the FFT of the audio\n",
+    "li2, = ax[1].plot(x, y)\n",
+    "ax[1].set_xlim(0,5000)\n",
+    "ax[1].set_ylim(-100,100)\n",
+    "ax[1].set_title(\"Fast Fourier Transform\")\n",
+    "# Apply the layout before the first draw (it used to run after the figure was\n",
+    "# already shown), then show the plot without blocking updates.\n",
+    "plt.tight_layout()\n",
+    "plt.pause(0.01)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "\n",
+    "# --- Capture settings ---\n",
+    "FORMAT = pyaudio.paInt16            # 16-bit samples\n",
+    "CHANNELS = 1\n",
+    "RATE = 44100\n",
+    "CHUNK = 1024                        # size passed to stream.read() on every read\n",
+    "RECORD_SECONDS = 0.1\n",
+    "WAVE_OUTPUT_FILENAME = \"file.wav\"\n",
+    "\n",
+    "audio = pyaudio.PyAudio()\n",
+    "\n",
+    "# Open the input stream. frames_per_buffer is not passed, so the library\n",
+    "# default applies (the CHUNK override was left disabled).\n",
+    "stream = audio.open(format=FORMAT, channels=CHANNELS, rate=RATE, input=True)\n",
+    "\n",
+    "# Flag polled by the capture loop; it is already a module-level name here,\n",
+    "# so no global statement is needed.\n",
+    "keep_going = True\n",
+    "\n",
+    "def plot_data(in_data):\n",
+    "    \"\"\"Update both line plots from one chunk of raw audio bytes.\n",
+    "\n",
+    "    in_data is interpreted as int16 samples. The first line (li) is set to\n",
+    "    the raw samples; the second line (li2) is set to 10*log10 of the\n",
+    "    magnitude of their real FFT. Returns True while the module-level\n",
+    "    keep_going flag is set, False otherwise.\n",
+    "    \"\"\"\n",
+    "    # np.frombuffer replaces np.fromstring, whose binary mode is deprecated.\n",
+    "    audio_data = np.frombuffer(in_data, np.int16)\n",
+    "    # Fast Fourier Transform, 10*log10(abs) is to scale it to dB\n",
+    "    # and make sure it's not imaginary. The tiny offset keeps log10 finite\n",
+    "    # for bins that are exactly zero (e.g. digital silence).\n",
+    "    dfft = 10.*np.log10(np.abs(np.fft.rfft(audio_data)) + 1e-20)\n",
+    "\n",
+    "    # Force the new data into the plot, but without redrawing axes.\n",
+    "    # If uses plt.draw(), axes are re-drawn every time\n",
+    "    li.set_xdata(np.arange(len(audio_data)))\n",
+    "    li.set_ydata(audio_data)\n",
+    "    # NOTE(review): x positions are bin index * 10, not frequencies in Hz - confirm intent.\n",
+    "    li2.set_xdata(np.arange(len(dfft))*10.)\n",
+    "    li2.set_ydata(dfft)\n",
+    "\n",
+    "    # Show the updated plot, but without blocking\n",
+    "    plt.pause(0.01)\n",
+    "    return bool(keep_going)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "\n",
+    "# Open the connection and start streaming the data\n",
+    "stream.start_stream()\n",
+    "print (\"\\n+---------------------------------+\")\n",
+    "print (\"| Press Ctrl+C to Break Recording |\")\n",
+    "print (\"+---------------------------------+\\n\")\n",
+    "\n",
+    "# Read and plot chunks until interrupted. Cleanup lives in finally so the\n",
+    "# stream and the PyAudio session are released however the loop ends.\n",
+    "try:\n",
+    "    while keep_going:\n",
+    "        try:\n",
+    "            plot_data(stream.read(CHUNK))\n",
+    "        except KeyboardInterrupt:\n",
+    "            keep_going=False\n",
+    "        except OSError:\n",
+    "            # Best effort: skip a chunk the device could not deliver (for example\n",
+    "            # an input overflow). Other errors now propagate instead of being\n",
+    "            # hidden by a bare except.\n",
+    "            continue\n",
+    "finally:\n",
+    "    stream.stop_stream()\n",
+    "    stream.close()\n",
+    "    audio.terminate()\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
--- a/FFT연습/trash.ipynb 0 → 100644
View file @b567b00
+++ b/FFT연습/trash.ipynb 0 → 100644
View file @b567b00
--- a/SUBSTRACT_MEAN_VERSION+Make_spectogram+save_to_csv.ipynb 0 → 100644
View file @b567b00
+++ b/SUBSTRACT_MEAN_VERSION+Make_spectogram+save_to_csv.ipynb 0 → 100644
View file @b567b00
--- a/Untitled.ipynb 0 → 100644
View file @b567b00
+++ b/Untitled.ipynb 0 → 100644
View file @b567b00
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "TEST할것\n",
+    "<입력값>\n",
+    "1. 일정 데시벨파워 이하는 다 지운 멜스펙토그램 <-아... 원래 데이터셋 새소리 어느정도 작은 소리까지 잡는겨\n",
+    "2. mel filter 80 & axis=1평균을 뺀 멜스펙토그램\n",
+    "3. 새소리 주파수 이하는 주파수대는 짜름\n",
+    "5. 커널씩 보면서 차이나는것만 뽑아내기 (그주변만 비교하는게 있을거같은데)\n",
+    "6. 멜필터 안씌운거 보고 새소리 주파수 이하 짤라버릴때등.. 안씌운거 보기\n",
+    "\n",
+    "<모델>\n",
+    "1. 일반 뛰어난 CNN모델. 첫번째 모델이 왜 더 좋은지 보자\n",
+    "3. C+RNN <- RNN 부분 잘 된건가?\n",
+    "4. Capsule network\n",
+    "\n",
+    "<추가적>\n",
+    "1.  라벨링 : 확실히 귀에 잘 들리고 눈에 잘 보이는 애들만 1로 라벨링, 희미한건 0으로 라벨링 \n",
+    "    -> 필드테스트 한 애들만 맞춘거 비율이 높도록 보이기. 머신이 새라고 한거중에 0인애들만 또 보여주기\n",
+    "2. 필드테스트랑 원래하던거랑 왜안될까? -> 짹짹이가 데이터셋에 별로없거나 모델이 안좋거나.. (먼저 컴한테 분류시켜보고 판단?)\n",
+    "3. 그경우, 찌르레기 소리에 초점을 맞춰서 저 패턴을 학습시키고 아예 그걸 찾도록 하는것도 나쁘지 않을듯\n",
+    "4. 아이폰녹음이랑 뭐가다른지, 실제로 차이가 난건지도 봐야함. "
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "1. CRNN - RNN 코드 다시 보고 돌리기\n",
+    "2. CNN - 논문1네 모델 돌리기\n",
+    "3. 캡슐 네트워크 돌리기\n",
+    "\n",
+    "#### scipy / librosa 둘다로 mel spectrogram 짜봤는데 librosa가 더 좋았음."
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
--- a/VANILA+Training_model.ipynb 0 → 100644
View file @b567b00
+++ b/VANILA+Training_model.ipynb 0 → 100644
View file @b567b00
--- a/VANILA_+Make_spectogram+save_to_csv.ipynb 0 → 100644
View file @b567b00
+++ b/VANILA_+Make_spectogram+save_to_csv.ipynb 0 → 100644
View file @b567b00
--- a/VANILA_EVALUATE.ipynb 0 → 100644
View file @b567b00
+++ b/VANILA_EVALUATE.ipynb 0 → 100644
View file @b567b00
--- a/VANILA_TEST.ipynb 0 → 100644
View file @b567b00
+++ b/VANILA_TEST.ipynb 0 → 100644
View file @b567b00
--- a/VANILA_VERSION+Make_spectogram+save_to_csv.ipynb 0 → 100644
View file @b567b00
+++ b/VANILA_VERSION+Make_spectogram+save_to_csv.ipynb 0 → 100644
View file @b567b00
--- a/Various_Spectograms.ipynb 0 → 100644
View file @b567b00
+++ b/Various_Spectograms.ipynb 0 → 100644
View file @b567b00
--- a/badch_testset_blankresults.csv 0 → 100644
View file @b567b00
+++ b/badch_testset_blankresults.csv 0 → 100644
View file @b567b00
--- a/model/bird_sound-17-0.3943.hdf5 0 → 100644
View file @b567b00
+++ b/model/bird_sound-17-0.3943.hdf5 0 → 100644
View file @b567b00
--- a/pyaudio 실시간듣기.ipynb 0 → 100644
View file @b567b00
+++ b/pyaudio 실시간듣기.ipynb 0 → 100644
View file @b567b00
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import pyaudio\n",
+    "import wave"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "* recording\n",
+      "* done recording\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Record RECORD_SECONDS of audio from an input stream and save it as a WAV file.\n",
+    "CHUNK = 1024              # size passed to stream.read() on every read\n",
+    "FORMAT = pyaudio.paInt16\n",
+    "CHANNELS = 1\n",
+    "RATE = 25600\n",
+    "RECORD_SECONDS = 10\n",
+    "WAVE_OUTPUT_FILENAME = \"test.wav\"\n",
+    "\n",
+    "p = pyaudio.PyAudio()\n",
+    "frames = []\n",
+    "try:\n",
+    "    # Query the sample width while the PyAudio session is still open\n",
+    "    # (it was previously requested after p.terminate()).\n",
+    "    sample_width = p.get_sample_size(FORMAT)\n",
+    "    stream = p.open(format=FORMAT,\n",
+    "                    channels=CHANNELS,\n",
+    "                    rate=RATE,\n",
+    "                    input=True,\n",
+    "                    frames_per_buffer=CHUNK)\n",
+    "    try:\n",
+    "        print(\"* recording\")\n",
+    "        # Number of CHUNK-sized reads that make up RECORD_SECONDS of audio.\n",
+    "        for i in range(0, int(RATE / CHUNK * RECORD_SECONDS)):\n",
+    "            data = stream.read(CHUNK)\n",
+    "            frames.append(data)\n",
+    "        print(\"* done recording\")\n",
+    "    finally:\n",
+    "        stream.stop_stream()\n",
+    "        stream.close()\n",
+    "finally:\n",
+    "    # Release the audio session even if opening or reading the stream fails.\n",
+    "    p.terminate()\n",
+    "\n",
+    "# Write the captured chunks to the WAV file; the with-block closes it on any exit.\n",
+    "with wave.open(WAVE_OUTPUT_FILENAME, 'wb') as wf:\n",
+    "    wf.setnchannels(CHANNELS)\n",
+    "    wf.setsampwidth(sample_width)\n",
+    "    wf.setframerate(RATE)\n",
+    "    wf.writeframes(b''.join(frames))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
--- a/오디오10초씩자르기.ipynb 0 → 100644
View file @b567b00
+++ b/오디오10초씩자르기.ipynb 0 → 100644
View file @b567b00
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import pydub"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "done\n"
+     ]
+    }
+   ],
+   "source": [
+    "from pydub import AudioSegment\n",
+    "\n",
+    "SEGMENT_MS = 10000  # length of each clip; pydub slicing works in milliseconds\n",
+    "N_SEGMENTS = 45     # number of consecutive clips to export\n",
+    "\n",
+    "# Decode the source recording once. It was previously re-read from disk on\n",
+    "# every loop iteration even though the file does not change.\n",
+    "source_audio = AudioSegment.from_wav(\"./New/IMG_3867.wav\")\n",
+    "\n",
+    "for i in range(N_SEGMENTS):\n",
+    "    t1 = i * SEGMENT_MS\n",
+    "    t2 = (i+1) * SEGMENT_MS\n",
+    "    newAudio = source_audio[t1:t2]\n",
+    "    newAudio.export('./field/IMG_3867%d.wav'%(i), format=\"wav\")\n",
+    "\n",
+    "print('done')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}