Class: Google::Cloud::Speech::V1p1beta1::RecognitionMetadata

Inherits:
Object
  • Object
show all
Defined in:
lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb

Overview

Description of audio data to be recognized.

Defined Under Namespace

Modules: InteractionType, MicrophoneDistance, OriginalMediaType, RecordingDeviceType

Instance Attribute Summary collapse

Instance Attribute Details

#audio_topic ⇒ String

Returns Description of the content. Eg. "Recordings of federal supreme court hearings from 2012".

Returns:

  • (String)

    Description of the content. Eg. "Recordings of federal supreme court hearings from 2012".



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#industry_naics_code_of_audio ⇒ Integer

Returns The industry vertical to which this speech recognition request most closely applies. This is most indicative of the topics contained in the audio. Use the 6-digit NAICS code to identify the industry vertical - see https://www.naics.com/search/.

Returns:

  • (Integer)

    The industry vertical to which this speech recognition request most closely applies. This is most indicative of the topics contained in the audio. Use the 6-digit NAICS code to identify the industry vertical - see https://www.naics.com/search/.



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#interaction_type ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::InteractionType

Returns The use case most closely describing the audio content to be recognized.

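Returns:

  • (Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::InteractionType)

    The use case most closely describing the audio content to be recognized.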



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#microphone_distance ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::MicrophoneDistance

Returns The audio type that most closely describes the audio being recognized.

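Returns:

  • (Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::MicrophoneDistance)

    The audio type that most closely describes the audio being recognized.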



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#obfuscated_id ⇒ Integer

Returns Obfuscated (privacy-protected) ID of the user, to identify number of unique users using the service.

Returns:

  • (Integer)

    Obfuscated (privacy-protected) ID of the user, to identify number of unique users using the service.



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#original_media_type ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::OriginalMediaType

Returns The original media the speech was recorded on.

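Returns:

  • (Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::OriginalMediaType)

    The original media the speech was recorded on.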



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#original_mime_type ⇒ String

Returns Mime type of the original audio file. For example +audio/m4a+, +audio/x-alaw-basic+, +audio/mp3+, +audio/3gpp+. A list of possible audio mime types is maintained at http://www.iana.org/assignments/media-types/media-types.xhtml#audio

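Returns:

  • (String)

    Mime type of the original audio file. For example +audio/m4a+, +audio/x-alaw-basic+, +audio/mp3+, +audio/3gpp+. A list of possible audio mime types is maintained at http://www.iana.org/assignments/media-types/media-types.xhtml#audio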



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#recording_device_name ⇒ String

Returns The device used to make the recording. Examples 'Nexus 5X' or 'Polycom SoundStation IP 6000' or 'POTS' or 'VoIP' or 'Cardioid Microphone'.

Returns:

  • (String)

    The device used to make the recording. Examples 'Nexus 5X' or 'Polycom SoundStation IP 6000' or 'POTS' or 'VoIP' or 'Cardioid Microphone'.



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end

#recording_device_type ⇒ Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::RecordingDeviceType

Returns The type of device the speech was recorded with.

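Returns:

  • (Google::Cloud::Speech::V1p1beta1::RecognitionMetadata::RecordingDeviceType)

    The type of device the speech was recorded with.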



353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
# File 'lib/google/cloud/speech/v1p1beta1/doc/google/cloud/speech/v1p1beta1/cloud_speech.rb', line 353

# Description of audio data to be recognized. The nested modules below
# define the integer enum values for the corresponding attributes.
class RecognitionMetadata
  # Use case categories that the audio recognition request can be described
  # by.
  module InteractionType
    # Use case is either unknown or is something other than one of the other
    # values below.
    INTERACTION_TYPE_UNSPECIFIED = 0

    # Multiple people in a conversation or discussion, for example a
    # meeting with two or more people actively participating. Typically
    # all the primary people speaking would be in the same room (if not,
    # see PHONE_CALL).
    DISCUSSION = 1

    # One or more persons lecturing or presenting to others, mostly
    # uninterrupted.
    PRESENTATION = 2

    # A phone call or video conference in which two or more people, who are
    # not in the same room, are actively participating.
    PHONE_CALL = 3

    # A recorded message intended for another person to listen to.
    VOICEMAIL = 4

    # Professionally produced audio (e.g. TV show, podcast).
    PROFESSIONALLY_PRODUCED = 5

    # Transcribe spoken questions and queries into text.
    VOICE_SEARCH = 6

    # Transcribe voice commands, such as for controlling a device.
    VOICE_COMMAND = 7

    # Transcribe speech to text to create a written document, such as a
    # text message, email or report.
    DICTATION = 8
  end

  # Enumerates the types of capture settings describing an audio file.
  module MicrophoneDistance
    # Audio type is not known.
    MICROPHONE_DISTANCE_UNSPECIFIED = 0

    # The audio was captured from a closely placed microphone, e.g. a phone,
    # dictaphone, or handheld microphone. Generally, the speaker is within
    # 1 meter of the microphone.
    NEARFIELD = 1

    # The speaker is within 3 meters of the microphone.
    MIDFIELD = 2

    # The speaker is more than 3 meters away from the microphone.
    FARFIELD = 3
  end

  # The original media the speech was recorded on.
  module OriginalMediaType
    # Unknown original media type.
    ORIGINAL_MEDIA_TYPE_UNSPECIFIED = 0

    # The speech data is an audio recording.
    AUDIO = 1

    # The speech data was originally recorded on a video.
    VIDEO = 2
  end

  # The type of device the speech was recorded with.
  module RecordingDeviceType
    # The recording device is unknown.
    RECORDING_DEVICE_TYPE_UNSPECIFIED = 0

    # Speech was recorded on a smartphone.
    SMARTPHONE = 1

    # Speech was recorded using a personal computer or tablet.
    PC = 2

    # Speech was recorded over a phone line.
    PHONE_LINE = 3

    # Speech was recorded in a vehicle.
    VEHICLE = 4

    # Speech was recorded outdoors.
    OTHER_OUTDOOR_DEVICE = 5

    # Speech was recorded indoors.
    OTHER_INDOOR_DEVICE = 6
  end
end