|
@@ -0,0 +1,256 @@
|
|
|
|
+<?php
|
|
|
|
+
|
|
|
|
+
|
|
|
|
+ /**
|
|
|
|
+ * transcribe_azure class
|
|
|
|
+ *
|
|
|
|
+ * @method null download
|
|
|
|
+ */
|
|
|
|
+if (!class_exists('transcribe_azure')) {
|
|
|
|
+ class transcribe_azure implements transcribe_interface {
|
|
|
|
+
|
|
|
|
+ /**
|
|
|
|
+ * declare private variables
|
|
|
|
+ */
|
|
|
|
+ private $api_key;
|
|
|
|
+ private $api_url;
|
|
|
|
+ private $language;
|
|
|
|
+ private $path;
|
|
|
|
+ private $filename;
|
|
|
|
+ private $format;
|
|
|
|
+ private $voice;
|
|
|
|
+ private $message;
|
|
|
|
+ private $model;
|
|
|
|
+
|
|
|
|
+ /**
|
|
|
|
+ * called when the object is created
|
|
|
|
+ */
|
|
|
|
+ public function __construct($settings) {
|
|
|
|
+
|
|
|
|
+ //build the setting object and get the recording path
|
|
|
|
+ $this->api_key = $settings->get('transcribe', 'api_key');
|
|
|
|
+ $this->api_url = $settings->get('transcribe', 'api_url');
|
|
|
|
+ $this->language = $settings->get('transcribe', 'language');
|
|
|
|
+
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function set_path(string $audio_path) {
|
|
|
|
+ $this->path = $audio_path;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function set_filename(string $audio_filename) {
|
|
|
|
+ $this->filename = $audio_filename;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function set_format(string $audio_format) {
|
|
|
|
+ $this->format = $audio_format;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function set_voice(string $audio_voice) {
|
|
|
|
+ $this->voice = $audio_voice;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function set_language(string $audio_language) {
|
|
|
|
+ $this->language = $audio_language;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function set_translate(string $audio_translate) {
|
|
|
|
+ $this->translate = $audio_translate;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function set_message(string $audio_message) {
|
|
|
|
+ $this->message = $audio_message;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function is_language_enabled() : bool {
|
|
|
|
+ //return the whether engine is handles languages
|
|
|
|
+ return false;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function is_translate_enabled() : bool {
|
|
|
|
+ //return the whether engine is able to translate
|
|
|
|
+ return false;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ public function get_languages() : array {
|
|
|
|
+ //create the languages array
|
|
|
|
+ $languages = array(
|
|
|
|
+ "af" => "Afrikaans",
|
|
|
|
+ "ar" => "Arabic",
|
|
|
|
+ "hy" => "Armenian",
|
|
|
|
+ "az" => "Azerbaijani",
|
|
|
|
+ "be" => "Belarusian",
|
|
|
|
+ "bs" => "Bosnian",
|
|
|
|
+ "bg" => "Bulgarian",
|
|
|
|
+ "ca" => "Catalan",
|
|
|
|
+ "zh" => "Chinese",
|
|
|
|
+ "hr" => "Croatian",
|
|
|
|
+ "cs" => "Czech",
|
|
|
|
+ "da" => "Danish",
|
|
|
|
+ "nl" => "Dutch",
|
|
|
|
+ "en" => "English",
|
|
|
|
+ "et" => "Estonian",
|
|
|
|
+ "fi" => "Finnish",
|
|
|
|
+ "fr" => "French",
|
|
|
|
+ "gl" => "Galician",
|
|
|
|
+ "de" => "German",
|
|
|
|
+ "el" => "Greek",
|
|
|
|
+ "he" => "Hebrew",
|
|
|
|
+ "hi" => "Hindi",
|
|
|
|
+ "hu" => "Hungarian",
|
|
|
|
+ "is" => "Icelandic",
|
|
|
|
+ "id" => "Indonesian",
|
|
|
|
+ "it" => "Italian",
|
|
|
|
+ "ja" => "Japanese",
|
|
|
|
+ "kn" => "Kannada",
|
|
|
|
+ "kk" => "Kazakh",
|
|
|
|
+ "ko" => "Korean",
|
|
|
|
+ "lv" => "Latvian",
|
|
|
|
+ "lt" => "Lithuanian",
|
|
|
|
+ "mk" => "Macedonian",
|
|
|
|
+ "ms" => "Malay",
|
|
|
|
+ "mr" => "Marathi",
|
|
|
|
+ "mi" => "Maori",
|
|
|
|
+ "ne" => "Nepali",
|
|
|
|
+ "no" => "Norwegian",
|
|
|
|
+ "fa" => "Persian",
|
|
|
|
+ "pl" => "Polish",
|
|
|
|
+ "pt" => "Portuguese",
|
|
|
|
+ "ro" => "Romanian",
|
|
|
|
+ "ru" => "Russian",
|
|
|
|
+ "sr" => "Serbian",
|
|
|
|
+ "sk" => "Slovak",
|
|
|
|
+ "sl" => "Slovenian",
|
|
|
|
+ "es" => "Spanish",
|
|
|
|
+ "sw" => "Swahili",
|
|
|
|
+ "sv" => "Swedish",
|
|
|
|
+ "tl" => "Tagalog",
|
|
|
|
+ "ta" => "Tamil",
|
|
|
|
+ "th" => "Thai",
|
|
|
|
+ "tr" => "Turkish",
|
|
|
|
+ "uk" => "Ukrainian",
|
|
|
|
+ "ur" => "Urdu",
|
|
|
|
+ "vi" => "Vietnamese",
|
|
|
|
+ "cy" => "Welsh"
|
|
|
|
+ );
|
|
|
|
+
|
|
|
|
+ //return the languages array
|
|
|
|
+ return $languages;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ /**
|
|
|
|
+ * transcribe - speech to text
|
|
|
|
+ */
|
|
|
|
+ public function transcribe() : string {
|
|
|
|
+
|
|
|
|
+ //get the content type
|
|
|
|
+ $path_array = pathinfo($this->path.'/'.$this->filename);
|
|
|
|
+ if ($path_array['extension'] == "mp3") {
|
|
|
|
+ $content_type = 'audio/mp3';
|
|
|
|
+ }
|
|
|
|
+ if ($path_array['extension'] == "wav") {
|
|
|
|
+ $content_type = 'audio/wav';
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ //start output buffer
|
|
|
|
+ ob_start();
|
|
|
|
+ $out = fopen('php://output', 'w');
|
|
|
|
+
|
|
|
|
+ if (isset($api_key) && $api_key != '') {
|
|
|
|
+
|
|
|
|
+ $url = "https://" . $this->api_url . ".api.cognitive.microsoft.com/sts/v1.0/issueToken";
|
|
|
|
+ $headers = [
|
|
|
|
+ "Content-type: application/x-www-form-urlencoded",
|
|
|
|
+ "Content-Length: 0",
|
|
|
|
+ "Ocp-Apim-Subscription-Key: " . $this->api_key
|
|
|
|
+ ];
|
|
|
|
+
|
|
|
|
+ // initialize a curl handle
|
|
|
|
+ $ch = curl_init($url);
|
|
|
|
+
|
|
|
|
+ //set the request method to POST
|
|
|
|
+ curl_setopt($ch, CURLOPT_POST, true);
|
|
|
|
+
|
|
|
|
+ //send the http headers
|
|
|
|
+ curl_setopt($ch, CURLOPT_HTTPHEADER, $headers);
|
|
|
|
+
|
|
|
|
+ //return the response as a string instead of outputting it directly
|
|
|
|
+ curl_setopt($ch, CURLOPT_RETURNTRANSFER, true);
|
|
|
|
+
|
|
|
|
+ //run the curl request to get the access token
|
|
|
|
+ $access_token = curl_exec($ch);
|
|
|
|
+
|
|
|
|
+ //close the handle
|
|
|
|
+ curl_close($ch);
|
|
|
|
+
|
|
|
|
+ //if a token was returned then use it to make the transcribe request
|
|
|
|
+ if (empty($access_token)) {
|
|
|
|
+ return false;
|
|
|
|
+ }
|
|
|
|
+ else {
|
|
|
|
+ $url = "https://" . $this->api_url . ".stt.speech.microsoft.com/speech/recognition/conversation/cognitiveservices/v1?language=" . $this->language . "&format=detailed";
|
|
|
|
+ $file_path = $file_path . '/' . $file_name;
|
|
|
|
+ $headers = [
|
|
|
|
+ "Authorization: Bearer " . $access_token,
|
|
|
|
+ "Content-type: audio/wav; codec=\"audio/pcm\"; samplerate=8000; trustsourcerate=false"
|
|
|
|
+ ];
|
|
|
|
+
|
|
|
|
+ //initialize a curl handle
|
|
|
|
+ $ch = curl_init($url);
|
|
|
|
+
|
|
|
|
+ //set the request method to POST
|
|
|
|
+ curl_setopt($ch, CURLOPT_POST, true);
|
|
|
|
+
|
|
|
|
+ //send the http headers
|
|
|
|
+ curl_setopt($ch, CURLOPT_HTTPHEADER, $headers);
|
|
|
|
+
|
|
|
|
+ //send the file using
|
|
|
|
+ curl_setopt($ch, CURLOPT_POSTFIELDS, file_get_contents($file_path));
|
|
|
|
+
|
|
|
|
+ //return the response as a string instead of outputting it directly
|
|
|
|
+ curl_setopt($ch, CURLOPT_RETURNTRANSFER, true);
|
|
|
|
+
|
|
|
|
+ //add verbose for debugging
|
|
|
|
+ curl_setopt($ch, CURLOPT_VERBOSE, true);
|
|
|
|
+ curl_setopt($ch, CURLOPT_STDERR, $out);
|
|
|
|
+
|
|
|
|
+ //run the curl request to transcribe the message
|
|
|
|
+ $json_response = curl_exec($ch);
|
|
|
|
+
|
|
|
|
+ //check for errors
|
|
|
|
+ if (curl_errno($ch)) {
|
|
|
|
+ echo 'Error: ' . curl_error($ch);
|
|
|
|
+ exit;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ //close the handle
|
|
|
|
+ curl_close($ch);
|
|
|
|
+
|
|
|
|
+ //convert the json to an a
|
|
|
|
+ $array = json_decode($json_response, true);
|
|
|
|
+
|
|
|
|
+ //validate the json
|
|
|
|
+ if ($array === null) {
|
|
|
|
+ return 'invalid json';
|
|
|
|
+ }
|
|
|
|
+ else {
|
|
|
|
+ $this->message = $array['NBest'][0]['Display'];
|
|
|
|
+ }
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ //return the transcription
|
|
|
|
+ if (empty($this->message)) {
|
|
|
|
+ return '';
|
|
|
|
+ }
|
|
|
|
+ else {
|
|
|
|
+ return $this->message;
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+ }
|
|
|
|
+}
|
|
|
|
+
|
|
|
|
+?>
|