ding, logger

2026-06-27 16:43:35 +08:00 · 2019-01-12 11:12:11 +08:00
parent 21b06db316
commit a67bc9531d
5 changed files with 88 additions and 73 deletions
@@ -1,17 +1,20 @@
 ####  RUNNING THE MODEL
-# Michels-MacBook-Pro:~ ShebMichel$ cd documents/pmlg/wake/decoder
+# cd documents/pmlg/wake/decoder
-# Michels-MacBook-Pro:decoder ShebMichel$ python demo.py resources/HiBitLit.pmdl
+# python demo.py resources/HiBitLit.pmdl
 from __future__ import print_function
 import os
 import sys
 import snowboydecoder
 from snowboydecoder import play_ding, play_dong
 import signal
 import numpy as np
 import time
 import numpy as np
 import BitLit_main
 t0 = time.time()  ## Time counter
 interrupted = False
@@ -36,10 +39,9 @@ model = sys.argv[1]
 # capture SIGINT signal, e.g., Ctrl+C
 signal.signal(signal.SIGINT, signal_handler)
-
+play_ding()
-detector = snowboydecoder.HotwordDetector(model, sensitivity=0.75)
+detector = snowboydecoder.HotwordDetector(model, sensitivity=0.5)
-print("Listening for hotword (Hi BitLit)... Press Ctrl+C to exit")
+print("Listening... Press Ctrl+C to exit")
 snowboydecoder.play_audio_file()
 detector.start(
@@ -23,7 +23,7 @@ import hashlib
 import tempfile
 from logger import logger
-from snowboydecoder import play_audio_file
+from snowboydecoder import play_ding, play_dong
 import speech_recognition as sr  ## Packages for voice recognizer
 for index, name in enumerate(sr.Microphone.list_microphone_names()):
@@ -42,11 +42,11 @@ except:
 def play_mp3(mp3_file):
    """Play mp3 file with pyglet."""
    # FIXME (wassname) It currently plays in background but we want to wait untill it's finished
    source = pyglet.media.load(filename=mp3_file, streaming=False)
    source.play()
-    time.sleep(source.duration*2 + 2)  # TODO must be a better way to wait untill the media has played
+    print(mp3_file, source.duration)
-
+    time.sleep(source.duration + 4)  # must be a better way to wait untill the media has played
    print(mp3_file, source.duration)
 def cache_gtts(text, lang="en-nz", cache_file=None):
    """
@@ -71,7 +71,7 @@ def cache_gtts(text, lang="en-nz", cache_file=None):
        en: English
    """
-    print('say:', text)
+    logger.debug('say: %s', text)
    if not cache_file:
        hash_filename = hashlib.md5(text.encode()).hexdigest() + '.mp3'
        cache_file = os.path.join(tempfile.gettempdir(), hash_filename)
@@ -85,49 +85,61 @@ def generate_poem():
    ############ AUDIO CONVERSION TO TEST
-    play_audio_file()
+    play_dong()
    t0 = time.time()
    r = sr.Recognizer()
    with sr.Microphone() as source:
-        outfile1 = cache_gtts(text="Hi! My Name is BIT-LIT. PLEASE SPEAK SOME IDEAS FOR A POEM between the beeps.")
+
        # print(r.energy_threshold)
        # r.adjust_for_ambient_noise(source) 
        # print('energy_threshold', r.energy_threshold)
        r.energy_threshold=50
        print('mic', source)
        outfile1 = cache_gtts(text="Hi! My Name is BIT-LIT. PLEASE SPEAK SOME IDEAS FOR A POEM AFTER THE BEEP.")
        play_mp3(outfile1)
        play_ding()
-        play_audio_file()
+        print('speak now', time.time())
        audio = r.listen(source)
        logger.debug('done recording %s', time.time())
        logger.info('recorded %s s', len(audio.frame_data)/audio.sample_rate)
-        audio = r.listen(source, phrase_time_limit=20)
+        play_dong()
-        play_audio_file()
+        outfile2 = cache_gtts(text="BEEP. THANK YOU! GIVE ME A MINUTE TO GENERATE AND READ YOUR POEM")
        outfile2 = cache_gtts(text="BEEP. THANK YOU! GIVE ME A MINUTE TO GENERATE AND READ YOUR POEM. BEEP")
        play_mp3(outfile2)
    t1 = time.time()
-    print('listen took', t1 - t0)
+    logger.debug('listen took %s', t1 - t0)
    try:
-        print("using google speech to text...")
+        logger.debug("using google speech to text...")
        USER_INPUT = r.recognize_google_cloud(audio, credentials_json=GOOGLE_CLOUD_SPEECH_CREDENTIALS)
-        print("Google thinks you said: " + USER_INPUT)
+        logger.info("Google thinks you said: " + USER_INPUT)
    except sr.UnknownValueError as e:
-        print("Could not understand audio. {}".format(e))
+        logger.error("Could not understand audio. {}".format(e))
        return 
    except sr.RequestError as e:
-        print("Could not request results; {0}".format(e))
+        logger.error("Could not request results; {0}".format(e))
        return
    t1b = time.time()
-    print('transcribe took', t1b - t1)
+    logger.debug('transcribe took %s', t1b - t1)
    return
    # Generate poem from user seed
    text_generated = poem(USER_INPUT)
    t2 = time.time()
    logger.info("ML POEM is: %s", text_generated)
-    logger.info('poem and rhyme generation took %s', t2 - t1)
+    logger.debug('poem and rhyme generation took %s', t2 - t1)
    # TEXT CONVERSION IN AUDIO
    # FEED POEM TO TRANSCRIBER
    tts = gTTS(text=text_generated)
-    # ts = datetime.datetime.utcnow().strftime('%Y%m%d_%H-%M-%S')
+    ts = datetime.datetime.utcnow().strftime('%Y%m%d_%H-%M-%S')
-    poem_mp3 = "outputs/BitLit_poem.mp3"#.format(ts)
+    poem_mp3 = "outputs/BitLit_{}.mp3".format(ts)
    tts.save(poem_mp3)
    play_mp3(poem_mp3)
@@ -136,8 +148,8 @@ def generate_poem():
    ######
    t3 = time.time()
-    logger.info('Poem to speech took %s', t3 - t2)
+    logger.debug('Poem to speech took %s', t3 - t2)
-    logger.info("Time spent is about: %s seconds")
+    logger.debug("Total time spent is about: %s seconds", np.round(t3 - t0))
 if __name__ == "__main__":
@@ -1,5 +1,5 @@
-
+Forked from https://github.com/ShebMichel/BitLit_test1
 # Run
 To run the program once installed 
@@ -42,43 +42,35 @@ API Keys:
 When setup the layout should look something like
-```
+  ├── BitLit_decoder.py
-    ├── BitLit_decoder.py
+  ├── BitLit_main.py
-    ├── BitLit_main.py
+  ├── BitLit_main.pyc
-    ├── BitLit_main.pyc
+  ├── BitLit_model_param.py
-    ├── BitLit_model_param.py
+  ├── BitLit_model_param.pyc
-    ├── BitLit_model_param.pyc
+  ├── HiBitLit.pmdl
-    ├── HiBitLit.pmdl
+  ├── README.md
-    ├── README.md
+  ├── logger.py
-    ├── logger.py
+  ├── logger.pyc
-    ├── logger.pyc
+  ├── outputs
-    ├── outputs
+  ├── poem_generator.py
-    ├── poem_generator.py
+  ├── poem_generator.pyc
-    ├── poem_generator.pyc
+  ├── requirements.txt
-    ├── requirements.txt
+  ├── secrets
-    ├── secrets
+  │   ├── google_cloud_credentials.json
-    │   ├── google_cloud_credentials.json
+  │   └── google_cloud_credentials.template.json
-    │   └── google_cloud_credentials.template.json
+  ├── snowboy
-    ├── snowboy
+  │   ├── _snowboydetect.so
-    │   ├── _snowboydetect.so
+  │   ├── resources
-    │   ├── resources
+  │   │   ├── alexa.umdl
-    │   │   ├── alexa.umdl
+  │   │   ├── alexa_02092017.umdl
-    │   │   ├── alexa_02092017.umdl
+  │   │   ├── common.res
-    │   │   ├── common.res
+  │   │   ├── ding.wav
-    │   │   ├── ding.wav
+  │   │   ├── dong.wav
-    │   │   ├── dong.wav
+  │   │   └── snowboy.umdl
-    │   │   └── snowboy.umdl
+  │   ├── snowboydetect.py
-    │   ├── snowboydetect.py
+  │   └── snowboydetect.pyc
-    │   └── snowboydetect.pyc
+  ├── snowboydecoder.py
-    ├── snowboydecoder.py
+  ├── snowboydecoder.pyc
-    ├── snowboydecoder.pyc
+  └── weights
-    └── weights
+    ├── model_poems.npy
-      ├── model_poems.npy
+    └── model_rhymes.npy
      └── model_rhymes.npy
 ```
 # TODO
 - [ ] make sure text logging works
 - [ ] improve before and after text
 - [ ] it start recording while prompt is playing?
@@ -2,9 +2,11 @@
 Voice to text to poem to speech
 Credits: Michel, Lauren, Thomas
 """
 from __future__ import print_function
 import os
 import numpy as np
 from logger import logger
 import re
 from textblob import TextBlob
 import random
@@ -120,7 +122,7 @@ def poem(USER_INPUT):
        start_string = [first_rhyme]
    else:
        start_string = [random.choice(list(word2idx_rhymes.keys()))]
-        print("The word {} is not in our corpus of rhymes yet.".format(first_rhyme))
+        logger.error("The word {} is not in our corpus of rhymes yet.".format(first_rhyme))
    input_eval = [
        word2idx_rhymes[s] for s in start_string
    ]  # converts start_string to numbers the model understands
@@ -143,7 +145,7 @@ def poem(USER_INPUT):
        input_eval = tf.expand_dims([predicted_id], 0)
        rhymes += [idx2word_rhymes[predicted_id]]
-    print("rhymes:", rhymes)
+    logger.info("rhymes:", rhymes)
    ####################
    #  POEM GENERATION #
@@ -60,6 +60,13 @@ def play_audio_file(fname=DETECT_DING):
    audio.terminate()
 def play_ding():
    play_audio_file(fname=DETECT_DING)
 def play_dong():
    play_audio_file(fname=DETECT_DONG)
 class HotwordDetector(object):
    """
    Snowboy decoder to detect whether a keyword specified by `decoder_model`