mirror of
https://github.com/wassname/BitLit_test1.git
synced 2026-06-27 18:02:39 +08:00
254 lines
9.6 KiB
Python
254 lines
9.6 KiB
Python
'''
|
|
Voice to text to poem to speech
|
|
Credits: Michel, Lauren, Thomas
|
|
'''
|
|
|
|
import sys
|
|
from gtts import gTTS ## Packages for Text to voice
|
|
import os
|
|
import numpy as np
|
|
import speech_recognition as sr ## Packages for voice recognizer
|
|
import tensorflow as tf
|
|
tf.enable_eager_execution()
|
|
from tensorflow.keras.layers import Embedding, GRU, Dense
|
|
import re
|
|
from textblob import TextBlob
|
|
import random
|
|
from BitLit_param import*
|
|
#BitLit_param()
|
|
#parameters_poems = np.load('model_poems.npy')[()]
|
|
#embedding_weights_poems = parameters_poems['embedding_weights']
|
|
#gru_weights_poems = parameters_poems['gru_weights']
|
|
#fc_weights_poems = parameters_poems['fc_weights']
|
|
#char2idx_poems = parameters_poems['char2idx']
|
|
#idx2char_poems = parameters_poems['idx2char']
|
|
#max_length_poems = parameters_poems['max_length']
|
|
#embedding_dim_poems = parameters_poems['embedding_dim']
|
|
#units_poems = parameters_poems['units']
|
|
#BATCH_SIZE_poems = parameters_poems['BATCH_SIZE']
|
|
#BUFFER_SIZE_poems = parameters_poems['BUFFER_SIZE']
|
|
#
|
|
#vocab_size_poems = len(dict(idx2char_poems))
|
|
#
|
|
## Load hyperparameters and layers' weights previously saved
|
|
#parameters_rhymes = np.load('model_rhymes.npy')[()]
|
|
#embedding_weights_rhymes = parameters_rhymes['embedding_weights']
|
|
#gru_weights_rhymes = parameters_rhymes['gru_weights']
|
|
#fc_weights_rhymes = parameters_rhymes['fc_weights']
|
|
#word2idx_rhymes = parameters_rhymes['word2idx']
|
|
#idx2word_rhymes = parameters_rhymes['idx2word']
|
|
#max_length_rhymes = parameters_rhymes['max_length']
|
|
#embedding_dim_rhymes = parameters_rhymes['embedding_dim']
|
|
#units_rhymes = parameters_rhymes['units']
|
|
#BATCH_SIZE_rhymes = parameters_rhymes['BATCH_SIZE']
|
|
#BUFFER_SIZE_rhymes = parameters_rhymes['BUFFER_SIZE']
|
|
#
|
|
#vocab_size_rhymes = len(dict(idx2word_rhymes))
|
|
|
|
|
|
# Architechture of the GRU
|
|
|
|
class Model(tf.keras.Model):
|
|
def __init__(self, vocab_size, embedding_dim, units, batch_size):
|
|
super(Model, self).__init__()
|
|
self.units = units
|
|
self.batch_sz = batch_size
|
|
self.embedding = Embedding(vocab_size, embedding_dim)
|
|
self.gru = GRU(self.units, return_sequences=True, return_state=True, recurrent_activation='sigmoid', recurrent_initializer='glorot_uniform')
|
|
self.fc = Dense(vocab_size)
|
|
|
|
def call(self, x, hidden):
|
|
x = self.embedding(x)
|
|
output, states = self.gru(x, initial_state=hidden)
|
|
output = tf.reshape(output, (-1, output.shape[2]))
|
|
x = self.fc(output)
|
|
return x, states
|
|
|
|
# Creation of the poem models and rhymes model
|
|
model_poems = Model(vocab_size_poems, embedding_dim_poems, units_poems, BATCH_SIZE_poems)
|
|
model_rhymes = Model(vocab_size_rhymes, embedding_dim_rhymes, units_rhymes, BATCH_SIZE_rhymes)
|
|
|
|
|
|
# Set the weights for the poems model
|
|
num_generate = 1
|
|
start_string = 'child'[::-1]
|
|
input_eval = [char2idx_poems[s] for s in start_string]
|
|
input_eval = tf.expand_dims(input_eval, 0)
|
|
hidden = [tf.zeros((1, units_poems))]
|
|
predictions, hidden = model_poems(input_eval, hidden)
|
|
|
|
model_poems.embedding.set_weights(np.asarray(embedding_weights_poems))
|
|
model_poems.gru.set_weights(gru_weights_poems)
|
|
model_poems.fc.set_weights(fc_weights_poems)
|
|
|
|
|
|
# Set the weights for the rhymes model
|
|
num_generate = 1 # number of characters to generate
|
|
start_string = ['fell'] # beginning of the generated text. TODO: try start_string = ' '
|
|
input_eval = [word2idx_rhymes[s] for s in start_string] # converts start_string to numbers the model understands
|
|
input_eval = tf.expand_dims(input_eval, 0)
|
|
hidden = [tf.zeros((1, units_rhymes))]
|
|
predictions, hidden = model_rhymes(input_eval, hidden)
|
|
|
|
model_rhymes.embedding.set_weights(np.asarray(embedding_weights_rhymes))
|
|
model_rhymes.gru.set_weights(gru_weights_rhymes)
|
|
model_rhymes.fc.set_weights(fc_weights_rhymes)
|
|
|
|
def poem(USER_INPUT):
|
|
###https://pythonprogramminglanguage.com/text-to-speech/
|
|
#### cmd 1:::: sudo pip install gTTS
|
|
#### cmd 2:::: sudo pip install pyttsx
|
|
|
|
|
|
#######################################################
|
|
##sys.path
|
|
##sys.path.append('/System/Library/Frameworks/Python.framework/Versions/2.7/Extras/lib/python')
|
|
##sys.path.append('/Users/ShebMichel/Library/Python/2.7/lib/python/site-packages'
|
|
################################################################################
|
|
############ AUDIO CONVERSION TO TEST
|
|
#r = sr.Recognizer()
|
|
#with sr.Microphone() as source:
|
|
## tts = gTTS(text='HELLO! My Name is BIT-LIT. PLEASE SPEAK IN ABOUT 3 SECONDS.', lang='en')
|
|
## tts.save("hello.mp3")
|
|
## os.system("start hello.mp3")
|
|
## ######
|
|
#
|
|
# print("SPEAK NOW-SPEAK NOW-SPEAK NOW:")
|
|
# audio = r.listen(source)
|
|
# tts = gTTS(text='THANK YOU! GIVE ME A SECOND TO READ OUT YOUR POEM', lang='en')
|
|
# tts.save("thanks.mp3")
|
|
# os.system("start thanks.mp3")
|
|
#try:
|
|
# # for testing purposes, we're just using the default API key
|
|
# # to use another API key, use `r.recognize_google(audio, key="GOOGLE_SPEECH_RECOGNITION_API_KEY")`
|
|
# # instead of `r.recognize_google(audio)
|
|
# AA0=r.recognize_google(audio)
|
|
# USER_INPUT=AA0
|
|
# print("You said: " + r.recognize_google(audio))
|
|
#except sr.UnknownValueError:
|
|
# print("Could not understand audio")
|
|
#except sr.RequestError as e:
|
|
# print("Could not request results; {0}".format(e))
|
|
#################################################################################
|
|
### ML POEM PREDICTOR
|
|
|
|
#####################
|
|
# BACKGROUND STUFF #
|
|
#####################
|
|
|
|
'''
|
|
|
|
Each time we run the script, we load the parameters and set the weights.
|
|
This is inefficient. Is there a way to run the background stuff only once ? (lines 60 to 140)
|
|
|
|
'''
|
|
# Load the poems model parameters (hyperparameters and weights)
|
|
#parameters_poems = np.load('model_poems.npy')[()]
|
|
|
|
|
|
|
|
|
|
'''
|
|
|
|
End of the background thingy
|
|
|
|
'''
|
|
|
|
|
|
###########################
|
|
# USER INPUT a line #
|
|
###########################
|
|
|
|
USER_INPUT = USER_INPUT.lower()
|
|
USER_INPUT = re.sub('[^a-z\n]', ' ', USER_INPUT)
|
|
text_generated = USER_INPUT[::-1]
|
|
first_rhyme = USER_INPUT.split(' ')[-1] # Michel's magic
|
|
|
|
|
|
|
|
######################
|
|
# RHYMES GENERATION #
|
|
######################
|
|
|
|
|
|
temperature = 0.09
|
|
|
|
num_generate = 5 # number of characters to generate
|
|
if first_rhyme in idx2word_rhymes.values():
|
|
start_string = [first_rhyme]
|
|
else:
|
|
start_string = [random.choice(list(word2idx_rhymes.keys()))]
|
|
print('The word {} is not in our corpus of rhymes yet.'.format(first_rhyme))
|
|
input_eval = [word2idx_rhymes[s] for s in start_string] # converts start_string to numbers the model understands
|
|
input_eval = tf.expand_dims(input_eval, 0)
|
|
|
|
rhymes = []
|
|
|
|
|
|
hidden = [tf.zeros((1, units_rhymes))]
|
|
for i in range(num_generate):
|
|
predictions, hidden = model_rhymes(input_eval, hidden) # predictions holds the probabily for each character to be most adequate continuation
|
|
|
|
predictions = predictions / temperature # alters characters' probabilities to be picked (but keeps the order)
|
|
predicted_id = tf.multinomial(tf.exp(predictions), num_samples=1)[0][0].numpy() # picks the next character for the generated text
|
|
input_eval = tf.expand_dims([predicted_id], 0)
|
|
rhymes += [idx2word_rhymes[predicted_id]]
|
|
|
|
print('rhymes:', rhymes)
|
|
|
|
|
|
####################
|
|
# POEM GENERATION #
|
|
####################
|
|
|
|
|
|
temperature = 0.8
|
|
text_generated = USER_INPUT
|
|
text_generated = text_generated[::-1] + '\n'
|
|
num_generate = 150
|
|
for rhyme in rhymes:
|
|
start_string = text_generated + rhyme[::-1]
|
|
input_eval = [char2idx_poems[s] for s in start_string]
|
|
input_eval = tf.expand_dims(input_eval, 0)
|
|
hidden = [tf.zeros((1, units_poems))]
|
|
|
|
b = True
|
|
c = 1
|
|
added_text = ' '
|
|
while b == True:
|
|
|
|
predictions, hidden = model_poems(input_eval, hidden)
|
|
predictions = predictions / temperature
|
|
predicted_id = tf.multinomial(tf.exp(predictions), num_samples=1)[0][0].numpy()
|
|
input_eval = tf.expand_dims([predicted_id], 0)
|
|
added_text += idx2char_poems[predicted_id]
|
|
c += 1
|
|
if idx2char_poems[predicted_id] == '\n' or c > num_generate:
|
|
text_generated = rhyme[::-1] + added_text + text_generated
|
|
b = False
|
|
|
|
text_generated = text_generated[::-1] # That's the poem to return to the user in voice format
|
|
|
|
text_generated = re.sub(' +',' ',text_generated)
|
|
text_generated = str(TextBlob(text_generated).correct())
|
|
return text_generated
|
|
|
|
#### END CODE
|
|
#########################################################
|
|
################# TEXT CONVERSION IN AUDIO
|
|
################# FEED POEM TO TRANSCRIBER
|
|
# print('ML POEM is:', text_generated)
|
|
# tts = gTTS(text=text_generated, lang='en')
|
|
# tts.save("poem.mp3")
|
|
# os.system("start poem.mp3")
|
|
# #########################################################
|
|
# ####
|
|
# print("BIT-LIT ENDING STATEMENT:")
|
|
# tts = gTTS(text='THANK YOU! CHECK ME OUT IN THE NEWS SOON.', lang='en')
|
|
# tts.save("goodbye.mp3")
|
|
# #os.system("start goodbye.mp3")
|
|
# ### USING JUPITER
|
|
# # import IPython.display as ipd
|
|
# # ipd.Audio(filename='path/to/file.mp3')
|
|
# #tk.mainloop()
|