Pass gs:// audio URIs directly in AudioRequest.uri instead of downloading via Cloud Storage

puneithk · puneithk · commit c1f92acf9937 · 2016-05-29T01:07:11.000-07:00
diff --git a/speech/grpc/src/main/java/com/google/cloud/speech/grpc/demos/AudioRequestFactory.java b/speech/grpc/src/main/java/com/google/cloud/speech/grpc/demos/AudioRequestFactory.java
@@ -18,14 +18,9 @@
 package com.google.cloud.speech.grpc.demos;
 
 import com.google.cloud.speech.v1.AudioRequest;
-import com.google.cloud.storage.Blob;
-import com.google.cloud.storage.BlobId;
-import com.google.cloud.storage.Storage;
-import com.google.cloud.storage.StorageOptions;
 import com.google.protobuf.ByteString;
 
 import java.io.IOException;
-
 import java.net.URI;
 import java.nio.file.Files;
 import java.nio.file.Path;
@@ -37,8 +32,8 @@
  */
 public class AudioRequestFactory {
 
-  private static final String FILE = "file";
-  private static final String GS = "gs";
+  private static final String FILE_SCHEME = "file";
+  private static final String GS_SCHEME   = "gs";
 
   /**
    * Takes an input URI of form $scheme:// and converts to audio request.
@@ -48,15 +43,11 @@ public class AudioRequestFactory {
    */
   public static AudioRequest createRequest(URI uri)
       throws IOException {
-    if (uri.getScheme() == null || uri.getScheme().equals(FILE)) {
+    if (uri.getScheme() == null || uri.getScheme().equals(FILE_SCHEME)) {
       Path path = Paths.get(uri);
       return audioFromBytes(Files.readAllBytes(path));
-    } else if (uri.getScheme().equals(GS)) {
-      Storage storage = StorageOptions.defaultInstance().service();
-      String path = uri.getPath();
-      BlobId blobId = BlobId.of(uri.getHost(), path.substring(1, path.length()));
-      Blob blob = storage.get(blobId);
-      return audioFromBytes(blob.content());
+    } else if (uri.getScheme().equals(GS_SCHEME)) {
+      return AudioRequest.newBuilder().setUri(uri.toString()).build();
     }
     throw new RuntimeException("scheme not supported " + uri.getScheme());
   }
diff --git a/speech/grpc/src/main/proto/google/speech/v1/cloud-speech.proto b/speech/grpc/src/main/proto/google/speech/v1/cloud-speech.proto
@@ -23,14 +23,15 @@ option java_multiple_files = true;
 option java_outer_classname = "SpeechProto";
 option java_package = "com.google.cloud.speech.v1";
 
+
 // Service that implements Google Cloud Speech API.
 service Speech {
   // Perform bidirectional streaming speech recognition on audio using gRPC.
   rpc Recognize(stream RecognizeRequest) returns (stream RecognizeResponse);
 
   // Perform non-streaming speech recognition on audio using HTTPS.
   rpc NonStreamingRecognize(RecognizeRequest) returns (NonStreamingRecognizeResponse) {
-    option (.google.api.http) = { post: "/v1/speech:recognize" body: "*" };
+    option (google.api.http) = { post: "/v1/speech:recognize" body: "*" };
   }
 }
 
@@ -54,7 +55,7 @@ message RecognizeRequest {
 
   // The audio data to be recognized. For `NonStreamingRecognize`, all the
   // audio data must be contained in the first (and only) `RecognizeRequest`
-  //  message. For streaming `Recognize`, sequential chunks of audio data are
+  // message. For streaming `Recognize`, sequential chunks of audio data are
   // sent in sequential `RecognizeRequest` messages.
   AudioRequest audio_request = 2;
 }
@@ -64,7 +65,7 @@ message RecognizeRequest {
 message InitialRecognizeRequest {
   // Audio encoding of the data sent in the audio message.
   enum AudioEncoding {
-    // Not specified. Will return result `INVALID_ARGUMENT`.
+    // Not specified. Will return result [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT].
     ENCODING_UNSPECIFIED = 0;
 
     // Uncompressed 16-bit signed little-endian samples.
@@ -118,8 +119,6 @@ message InitialRecognizeRequest {
   // profanities, replacing all but the initial character in each filtered word
   // with asterisks, e.g. "f***". If set to `false` or omitted, profanities
   // won't be filtered out.
-  // Note that profanity filtering is not implemented for all languages.
-  // If the language is not supported, this setting has no effect.
   bool profanity_filter = 5;
 
   // [Optional] If `false` or omitted, the recognizer will detect a single
@@ -146,13 +145,38 @@ message InitialRecognizeRequest {
   // as they become available.
   // If `false` or omitted, no `EndpointerEvents` are returned.
   bool enable_endpointer_events = 8;
+
+  // [Optional] URI that points to a file where the recognition result should
+  // be stored in JSON format. If omitted or empty string, the recognition
+  // result is returned in the response. Should be specified only for
+  // `NonStreamingRecognize`. If specified in a `Recognize` request,
+  // `Recognize` returns [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT].
+  // If specified in a `NonStreamingRecognize` request,
+  // `NonStreamingRecognize` returns immediately, and the output file
+  // is created asynchronously once the audio processing completes.
+  // Currently, only Google Cloud Storage URIs are supported, which must be
+  // specified in the following format: `gs://bucket_name/object_name`
+  // (other URI formats return [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT]). For
+  // more information, see [Request URIs](/storage/docs/reference-uris).
+  string output_uri = 9;
 }
 
 // Contains audio data in the format specified in the `InitialRecognizeRequest`.
+// Either `content` or `uri` must be supplied. Supplying both or neither
+// returns [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT].
 message AudioRequest {
-  // [Required] The audio data bytes encoded as specified in
-  // `InitialRecognizeRequest`.
+  // The audio data bytes encoded as specified in
+  // `InitialRecognizeRequest`. Note: as with all bytes fields, protocol buffers
+  // use a pure binary representation, whereas JSON representations use base64.
   bytes content = 1;
+
+  // URI that points to a file that contains audio data bytes as specified in
+  // `InitialRecognizeRequest`. Currently, only Google Cloud Storage URIs are
+  // supported, which must be specified in the following format:
+  // `gs://bucket_name/object_name` (other URI formats return
+  // [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT]). For more information, see
+  // [Request URIs](/storage/docs/reference-uris).
+  string uri = 2;
 }
 
 // `NonStreamingRecognizeResponse` is the only message returned to the client by
@@ -191,10 +215,14 @@ message RecognizeResponse {
 
   // [Output-only] If set, returns a [google.rpc.Status][] message that
   // specifies the error for the operation.
-  .google.rpc.Status error = 1;
-
-  // [Output-only] May contain zero or one `is_final=true` result (the newly
-  // settled portion). May also contain zero or more `is_final=false` results.
+  google.rpc.Status error = 1;
+
+  // [Output-only] For `continuous=false`, this repeated list contains zero or
+  // one result that corresponds to all of the audio processed so far. For
+  // `continuous=true`, this repeated list contains zero or more results that
+  // correspond to consecutive portions of the audio being processed.
+  // In both cases, contains zero or one `is_final=true` result (the newly
+  // settled portion), followed by zero or more `is_final=false` results.
   repeated SpeechRecognitionResult results = 2;
 
   // [Output-only] Indicates the lowest index in the `results` array that has
@@ -206,7 +234,10 @@ message RecognizeResponse {
   EndpointerEvent endpoint = 4;
 }
 
+// A speech recognition result corresponding to a portion of the audio.
 message SpeechRecognitionResult {
+  // [Output-only] May contain one or more recognition hypotheses (up to the
+  // maximum specified in `max_alternatives`).
   repeated SpeechRecognitionAlternative alternatives = 1;
 
   // [Output-only] Set `true` if this is the final time the speech service will