Tony607
diff --git a/‎.gitignore
Lines changed: 87 additions & 0 deletions b/‎.gitignore
Lines changed: 87 additions & 0 deletions
diff --git a/‎README.md
Lines changed: 39 additions & 0 deletions b/‎README.md
Lines changed: 39 additions & 0 deletions
diff --git a/‎Trigger word detection - v1.ipynb
Lines changed: 1797 additions & 0 deletions b/‎Trigger word detection - v1.ipynb
Lines changed: 1797 additions & 0 deletions
diff --git a/‎audio_examples/chime.wav
162 KB b/‎audio_examples/chime.wav
162 KB
diff --git a/‎audio_examples/example_train.wav
1.68 MB b/‎audio_examples/example_train.wav
1.68 MB
diff --git a/‎audio_examples/insert_reference.wav
1.68 MB b/‎audio_examples/insert_reference.wav
1.68 MB
diff --git a/‎audio_examples/my_audio.wav
1.68 MB b/‎audio_examples/my_audio.wav
1.68 MB
diff --git a/‎audio_examples/train_reference.wav
1.68 MB b/‎audio_examples/train_reference.wav
1.68 MB
diff --git a/‎chime_output.wav
1.68 MB b/‎chime_output.wav
1.68 MB
diff --git a/‎images/date_attention.png
131 KB b/‎images/date_attention.png
131 KB
diff --git a/‎images/date_attention2.png
130 KB b/‎images/date_attention2.png
130 KB
diff --git a/‎images/label_diagram.png
81.4 KB b/‎images/label_diagram.png
81.4 KB
diff --git a/‎images/model_trigger.png
227 KB b/‎images/model_trigger.png
227 KB
diff --git a/‎images/music_gen.png
185 KB b/‎images/music_gen.png
185 KB
diff --git a/‎images/ones_reference.png
36.7 KB b/‎images/ones_reference.png
36.7 KB
diff --git a/‎images/poorly_trained_model.png
10.1 KB b/‎images/poorly_trained_model.png
10.1 KB
diff --git a/‎images/sound.png
197 KB b/‎images/sound.png
197 KB
diff --git a/‎images/spectrogram.png
41.7 KB b/‎images/spectrogram.png
41.7 KB
diff --git a/‎images/train_label.png
40.7 KB b/‎images/train_label.png
40.7 KB
diff --git a/‎images/train_reference.png
342 KB b/‎images/train_reference.png
342 KB
diff --git a/‎images/woebot.png
410 KB b/‎images/woebot.png
410 KB
diff --git a/‎insert_test.wav
1.68 MB b/‎insert_test.wav
1.68 MB
diff --git a/‎models/tr_model.h5
7.33 MB b/‎models/tr_model.h5
7.33 MB
diff --git a/‎raw_data/activates/1.wav
124 KB b/‎raw_data/activates/1.wav
124 KB
diff --git a/‎raw_data/activates/1_act2.wav
63 KB b/‎raw_data/activates/1_act2.wav
63 KB
diff --git a/‎raw_data/activates/1_act3.wav
300 KB b/‎raw_data/activates/1_act3.wav
300 KB
diff --git a/‎raw_data/activates/2.wav
157 KB b/‎raw_data/activates/2.wav
157 KB
diff --git a/‎raw_data/activates/2_act2.wav
62.5 KB b/‎raw_data/activates/2_act2.wav
62.5 KB
diff --git a/‎raw_data/activates/3.wav
115 KB b/‎raw_data/activates/3.wav
115 KB
diff --git a/‎raw_data/activates/3_act2.wav
78.9 KB b/‎raw_data/activates/3_act2.wav
78.9 KB
diff --git a/‎raw_data/activates/3_act3.wav
412 KB b/‎raw_data/activates/3_act3.wav
412 KB
diff --git a/‎raw_data/activates/4_act2.wav
56.4 KB b/‎raw_data/activates/4_act2.wav
56.4 KB
diff --git a/‎raw_data/backgrounds/1.wav
1.68 MB b/‎raw_data/backgrounds/1.wav
1.68 MB
diff --git a/‎raw_data/backgrounds/2.wav
1.68 MB b/‎raw_data/backgrounds/2.wav
1.68 MB
diff --git a/‎raw_data/dev/1.wav
1.68 MB b/‎raw_data/dev/1.wav
1.68 MB
diff --git a/‎raw_data/dev/2.wav
1.68 MB b/‎raw_data/dev/2.wav
1.68 MB
diff --git a/‎raw_data/negatives/1.wav
62.1 KB b/‎raw_data/negatives/1.wav
62.1 KB
diff --git a/‎raw_data/negatives/1_0.wav
99.8 KB b/‎raw_data/negatives/1_0.wav
99.8 KB
diff --git a/‎raw_data/negatives/2.wav
70.2 KB b/‎raw_data/negatives/2.wav
70.2 KB
diff --git a/‎raw_data/negatives/2_1.wav
93.2 KB b/‎raw_data/negatives/2_1.wav
93.2 KB
diff --git a/‎raw_data/negatives/3.wav
113 KB b/‎raw_data/negatives/3.wav
113 KB
diff --git a/‎raw_data/negatives/3_2.wav
61.7 KB b/‎raw_data/negatives/3_2.wav
61.7 KB
diff --git a/‎raw_data/negatives/4.wav
95.1 KB b/‎raw_data/negatives/4.wav
95.1 KB
diff --git a/‎raw_data/negatives/4_0.wav
230 KB b/‎raw_data/negatives/4_0.wav
230 KB
diff --git a/‎raw_data/negatives/5.wav
61.2 KB b/‎raw_data/negatives/5.wav
61.2 KB
diff --git a/‎raw_data/negatives/5_1.wav
103 KB b/‎raw_data/negatives/5_1.wav
103 KB
diff --git a/‎requirements.txt
Lines changed: 6 additions & 0 deletions b/‎requirements.txt
Lines changed: 6 additions & 0 deletions
diff --git a/‎td_utils.py
Lines changed: 46 additions & 0 deletions b/‎td_utils.py
Lines changed: 46 additions & 0 deletions
diff --git a/‎train.wav
1.68 MB b/‎train.wav
1.68 MB
@@ -0,0 +1,87 @@
+### https://raw.github.com/github/gitignore/f57304e9762876ae4c9b02867ed0cb887316387e/Python.gitignore
+
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+env/
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*,cover
+.hypothesis/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# pyenv
+.python-version
+
+# celery beat schedule file
+celerybeat-schedule
+
+# SageMath parsed files
+*.sage.py
+
+# dotenv
+.env
+
+# virtualenv
+.venv
+venv/
+ENV/
+
+# Spyder project settings
+.spyderproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+/.idea/
+
+/checkpoints/
+.DS_Store
+
+XY_dev/
+XY_train/
+*.npy
@@ -0,0 +1,6 @@
+numpy
+keras
+h5py
+pydub
+scipy
+matplotlib
@@ -0,0 +1,46 @@
+import matplotlib.pyplot as plt
+from scipy.io import wavfile
+import os
+from pydub import AudioSegment
+
+# Calculate and plot spectrogram for a wav audio file
+def graph_spectrogram(wav_file):
+    rate, data = get_wav_info(wav_file)
+    nfft = 200 # Length of each window segment
+    fs = 8000 # Sampling frequencies
+    noverlap = 120 # Overlap between windows
+    nchannels = data.ndim
+    if nchannels == 1:
+        pxx, freqs, bins, im = plt.specgram(data, nfft, fs, noverlap = noverlap)
+    elif nchannels == 2:
+        pxx, freqs, bins, im = plt.specgram(data[:,0], nfft, fs, noverlap = noverlap)
+    return pxx
+
+# Load a wav file
+def get_wav_info(wav_file):
+    rate, data = wavfile.read(wav_file)
+    return rate, data
+
+# Used to standardize volume of audio clip
+def match_target_amplitude(sound, target_dBFS):
+    change_in_dBFS = target_dBFS - sound.dBFS
+    return sound.apply_gain(change_in_dBFS)
+
+# Load raw audio files for speech synthesis
+def load_raw_audio():
+    activates = []
+    backgrounds = []
+    negatives = []
+    for filename in os.listdir("./raw_data/activates"):
+        if filename.endswith("wav"):
+            activate = AudioSegment.from_wav("./raw_data/activates/"+filename)
+            activates.append(activate)
+    for filename in os.listdir("./raw_data/backgrounds"):
+        if filename.endswith("wav"):
+            background = AudioSegment.from_wav("./raw_data/backgrounds/"+filename)
+            backgrounds.append(background)
+    for filename in os.listdir("./raw_data/negatives"):
+        if filename.endswith("wav"):
+            negative = AudioSegment.from_wav("./raw_data/negatives/"+filename)
+            negatives.append(negative)
+    return activates, negatives, backgrounds
-Original file line number
+Diff line change
@@ @@ -0,0 +1,6 @@ @@
 +numpy
 +keras
 +h5py
 +pydub
 +scipy
 +matplotlib