Class: Google::Cloud::Speech::V1p1beta1::RecognitionMetadata

Inherits:
Object
  • Object
show all
Defined in:
lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb

Overview

Description of audio data to be recognized.

Defined Under Namespace

Modules: InteractionType, MicrophoneDistance, OriginalMediaType, RecordingDeviceType

Instance Attribute Summary collapse

Instance Attribute Details

#audio_topic ⇒ String

Returns Description of the content. Eg. "Recordings of federal supreme court hearings from 2012".

Returns:

  • (String)

    Description of the content. Eg. "Recordings of federal supreme court hearings from 2012".



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#industry_naics_code_of_audio ⇒ Integer

Returns The industry vertical to which this speech recognition request most closely applies. This is most indicative of the topics contained in the audio. Use the 6-digit NAICS code to identify the industry vertical - see https://www.naics.com/search/.

Returns:

  • (Integer)

    The industry vertical to which this speech recognition request most closely applies. This is most indicative of the topics contained in the audio. Use the 6-digit NAICS code to identify the industry vertical - see https://www.naics.com/search/.



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#interaction_type ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::InteractionType

Returns The use case most closely describing the audio content to be recognized.

Returns:



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#microphone_distance ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::MicrophoneDistance

Returns The audio type that most closely describes the audio being recognized.

Returns:



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#obfuscated_id ⇒ Integer

Returns Obfuscated (privacy-protected) ID of the user, to identify number of unique users using the service.

Returns:

  • (Integer)

    Obfuscated (privacy-protected) ID of the user, to identify number of unique users using the service.



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#original_media_type ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::OriginalMediaType

Returns The original media the speech was recorded on.

Returns:



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#original_mime_type ⇒ String

Returns Mime type of the original audio file. For example +audio/m4a+, +audio/x-alaw-basic+, +audio/mp3+, +audio/3gpp+. A list of possible audio mime types is maintained at http://www.iana.org/assignments/media-types/media-types.xhtml#audio

Returns:



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#recording_device_name ⇒ String

Returns The device used to make the recording. Examples 'Nexus 5X' or 'Polycom SoundStation IP 6000' or 'POTS' or 'VoIP' or 'Cardioid Microphone'.

Returns:

  • (String)

    The device used to make the recording. Examples 'Nexus 5X' or 'Polycom SoundStation IP 6000' or 'POTS' or 'VoIP' or 'Cardioid Microphone'.



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#recording_device_type ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::RecordingDeviceType

Returns The type of device the speech was recorded with.

Returns:



310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 310

# Description of audio data to be recognized.
#
# The nested modules are enum-style namespaces: each one only defines
# integer constants.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. phone,
    # dictaphone, or handheld microphone. Generally if the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end