summaryrefslogtreecommitdiffstats
path: root/java/com/android/voicemail/impl/transcribe/TranscriptionTaskAsync.java
blob: 3c41aef890cd46908d536fd50e4d7051056eec8a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
/*
 * Copyright (C) 2017 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License
 */
package com.android.voicemail.impl.transcribe;

import android.app.job.JobWorkItem;
import android.content.Context;
import android.util.Pair;
import com.android.dialer.common.Assert;
import com.android.dialer.logging.DialerImpression;
import com.android.voicemail.impl.VvmLog;
import com.android.voicemail.impl.transcribe.TranscriptionService.JobCallback;
import com.android.voicemail.impl.transcribe.grpc.GetTranscriptResponseAsync;
import com.android.voicemail.impl.transcribe.grpc.TranscriptionClientFactory;
import com.android.voicemail.impl.transcribe.grpc.TranscriptionResponseAsync;
import com.google.internal.communications.voicemailtranscription.v1.GetTranscriptRequest;
import com.google.internal.communications.voicemailtranscription.v1.TranscribeVoicemailAsyncRequest;
import com.google.internal.communications.voicemailtranscription.v1.TranscriptionStatus;

/**
 * Background task to get a voicemail transcription using the asynchronous API. The async API works
 * as follows:
 *
 * <ol>
 *   <li>client uploads voicemail data to the server
 *   <li>server responds with a transcription-id and an estimated transcription wait time
 *   <li>client waits appropriate amount of time then begins polling for the result
 * </ol>
 *
 * This implementation blocks until the response or an error is received, even though it is using
 * the asynchronous server API.
 */
public class TranscriptionTaskAsync extends TranscriptionTask {
  private static final String TAG = "TranscriptionTaskAsync";

  public TranscriptionTaskAsync(
      Context context,
      JobCallback callback,
      JobWorkItem workItem,
      TranscriptionClientFactory clientFactory,
      TranscriptionConfigProvider configProvider) {
    super(context, callback, workItem, clientFactory, configProvider);
  }

  @Override
  protected Pair<String, TranscriptionStatus> getTranscription() {
    VvmLog.i(TAG, "getTranscription");

    TranscriptionResponseAsync uploadResponse =
        (TranscriptionResponseAsync)
            sendRequest((client) -> client.sendUploadRequest(getUploadRequest()));

    if (uploadResponse == null) {
      VvmLog.i(TAG, "getTranscription, failed to upload voicemail.");
      return new Pair<>(null, TranscriptionStatus.FAILED_NO_RETRY);
    } else {
      waitForTranscription(uploadResponse);
      return pollForTranscription(uploadResponse);
    }
  }

  @Override
  protected DialerImpression.Type getRequestSentImpression() {
    return DialerImpression.Type.VVM_TRANSCRIPTION_REQUEST_SENT_ASYNC;
  }

  private static void waitForTranscription(TranscriptionResponseAsync uploadResponse) {
    long millis = uploadResponse.getEstimatedWaitMillis();
    VvmLog.i(TAG, "waitForTranscription, " + millis + " millis");
    sleep(millis);
  }

  private Pair<String, TranscriptionStatus> pollForTranscription(
      TranscriptionResponseAsync uploadResponse) {
    VvmLog.i(TAG, "pollForTranscription");
    GetTranscriptRequest request = getGetTranscriptRequest(uploadResponse);
    for (int i = 0; i < configProvider.getMaxGetTranscriptPolls(); i++) {
      GetTranscriptResponseAsync response =
          (GetTranscriptResponseAsync)
              sendRequest((client) -> client.sendGetTranscriptRequest(request));
      if (response == null) {
        VvmLog.i(TAG, "pollForTranscription, no transcription result.");
      } else if (response.isTranscribing()) {
        VvmLog.i(TAG, "pollForTranscription, poll count: " + (i + 1));
      } else if (response.hasFatalError()) {
        VvmLog.i(TAG, "pollForTranscription, fail. " + response.getErrorDescription());
        return new Pair<>(null, response.getTranscriptionStatus());
      } else {
        VvmLog.i(TAG, "pollForTranscription, got transcription");
        return new Pair<>(response.getTranscript(), TranscriptionStatus.SUCCESS);
      }
      sleep(configProvider.getGetTranscriptPollIntervalMillis());
    }
    VvmLog.i(TAG, "pollForTranscription, timed out.");
    return new Pair<>(null, TranscriptionStatus.FAILED_NO_RETRY);
  }

  private TranscribeVoicemailAsyncRequest getUploadRequest() {
    return TranscribeVoicemailAsyncRequest.newBuilder()
        .setVoicemailData(audioData)
        .setAudioFormat(encoding)
        .build();
  }

  private GetTranscriptRequest getGetTranscriptRequest(TranscriptionResponseAsync uploadResponse) {
    Assert.checkArgument(uploadResponse.getTranscriptionId() != null);
    return GetTranscriptRequest.newBuilder()
        .setTranscriptionId(uploadResponse.getTranscriptionId())
        .build();
  }
}