# I use these libraries for working with the APIs and downloading files
!pip install ibm_watson wget

from ibm_watson import SpeechToTextV1 
import json
from ibm_cloud_sdk_core.authenticators import IAMAuthenticator

# Configure the Watson Speech to Text client.
#
# The legacy "*.watsonplatform.net" hosts have been retired by IBM; the service
# is now reached through "api.<region>.speech-to-text.watson.cloud.ibm.com".
# The URL below is the Dallas (us-south) endpoint. If your service instance
# lives in another region, use the URL listed next to the API key on the
# credentials page of that instance instead.
speech_to_text_url = "https://api.us-south.speech-to-text.watson.cloud.ibm.com"

my_s2t_api_key = "YOUR_API_KEY_HERE"  # Replace with your actual API key

# Authenticate with the API key through IBM Cloud IAM, build the client and
# point it at the endpoint chosen above.
my_authenticator = IAMAuthenticator(my_s2t_api_key)
my_s2t_service = SpeechToTextV1(authenticator=my_authenticator)
my_s2t_service.set_service_url(speech_to_text_url)
my_s2t_service  # Notebook cell output: show the configured client

# Downloading the sample audio file for testing
!wget -O my_sample_audio.mp3 https://s3-api.us-geo.objectstorage.softlayer.net/cf-courses-data/CognitiveClass/PY0101EN/labs/PolynomialRegressionandPipelines.mp3

audio_file_path = 'my_sample_audio.mp3'

with open(audio_file_path, mode="rb") as audio_file:
    my_response = my_s2t_service.recognize(audio=audio_file, content_type='audio/mp3')

my_response.result

# `pandas.io.json.json_normalize` has been deprecated since pandas 1.0 in
# favour of the top-level `pandas.json_normalize`. Fall back to the old
# location only for pandas releases that predate the move.
try:
    from pandas import json_normalize
except ImportError:
    from pandas.io.json import json_normalize

# Flatten the "alternatives" records of the recognition results into a table
json_normalize(my_response.result['results'], "alternatives")

my_response

# Keep the transcript of the first alternative of the first result.
# NOTE(review): only results[0] is read; if the service splits the audio into
# several results, the remaining transcripts are ignored -- confirm this is
# intended.
recognized_text = my_response.result['results'][0]["alternatives"][0]["transcript"]
type(recognized_text)

from ibm_watson import LanguageTranslatorV3  # For translating text

# Configure the Watson Language Translator client.
#
# The legacy "*.watsonplatform.net" hosts have been retired by IBM; the service
# is now reached through
# "api.<region>.language-translator.watson.cloud.ibm.com". The URL below is the
# Dallas (us-south) endpoint. If your service instance lives in another region,
# use the URL listed next to the API key on the credentials page instead.
# NOTE(review): IBM has announced the withdrawal of the Language Translator
# service -- confirm that your instance is still available.
translator_url = 'https://api.us-south.language-translator.watson.cloud.ibm.com'

my_translator_api_key = 'YOUR_TRANSLATOR_API_KEY'  # Replace with your actual API key

# API version date passed to the client constructor
translator_version = '2018-05-01'

# Authenticate with the API key through IBM Cloud IAM, build the client and
# point it at the endpoint chosen above.
translator_authenticator = IAMAuthenticator(my_translator_api_key)
language_translator = LanguageTranslatorV3(
    version=translator_version,
    authenticator=translator_authenticator,
)
language_translator.set_service_url(translator_url)
language_translator  # Notebook cell output: show the configured client

# `pandas.io.json.json_normalize` has been deprecated since pandas 1.0 in
# favour of the top-level `pandas.json_normalize`. Fall back to the old
# location only for pandas releases that predate the move.
try:
    from pandas import json_normalize
except ImportError:
    from pandas.io.json import json_normalize

# Ask the service which languages it can identify, then tabulate the
# "languages" records of the reply
languages_data = language_translator.list_identifiable_languages().get_result()
normalized_languages = json_normalize(languages_data, "languages")

normalized_languages

# English -> Spanish: run the transcript through the 'en-es' model
translation_response = language_translator.translate(
    text=recognized_text,
    model_id="en-es",
)
translation_response

# Unwrap the result carried by the response object
translation = translation_response.get_result()
translation

# The first entry under 'translations' holds the translated text
spanish_translation = translation["translations"][0]["translation"]
spanish_translation  # Notebook cell output: the Spanish text

# Spanish -> English: translate the Spanish text back with the 'es-en' model
translation_back = language_translator.translate(
    text=spanish_translation,
    model_id="es-en",
).get_result()

english_translation = translation_back["translations"][0]["translation"]
english_translation  # Notebook cell output: the round-tripped English text

# English -> French: translate the round-tripped English text with 'en-fr'.
# Despite its name, this variable holds the unwrapped result, not the
# response object.
french_translation_response = language_translator.translate(
    text=english_translation,
    model_id="en-fr",
).get_result()

french_translation_response["translations"][0]["translation"]

Exploring Speech Recognition and Translation APIs

What's Inside

Speech to Text: My Approach

Language Translation: My Experience

Reflections on Language Translation

My Takeaways and Next Steps