Add support for 'remove_atmospherics' and 'speakers_count' (#101)

hrist0stoichev · web-flow · commit 89e56f6120ad · 2023-08-21T10:32:31.000-07:00
diff --git a/src/rev_ai/apiclient.py b/src/rev_ai/apiclient.py
@@ -64,7 +64,9 @@ def submit_job_url(
             speaker_names=None,
             source_config=None,
             notification_config=None,
-            skip_postprocessing=False):
+            skip_postprocessing=False,
+            remove_atmospherics=False,
+            speakers_count=None):
         """Submit media given a URL for transcription.
         The audio data is downloaded from the URL
         :param media_url: web location of the media file
@@ -111,6 +113,9 @@ def submit_job_url(
             invoke on job completion as a webhook and optional authentication headers to use when
             calling the callback url
         :param skip_postprocessing: skip all text postprocessing (punctuation, capitalization, ITN)
+        :param remove_atmospherics: if True, atmospherics such as <laugh>, <affirmative>, etc.
+            will not appear in the transcript
+        :param speakers_count: the total number of unique speakers in the audio
         :returns: raw response data
         :raises: HTTPError
         """
@@ -154,7 +159,9 @@ def submit_job_local_file(
             segments_to_transcribe=None,
             speaker_names=None,
             notification_config=None,
-            skip_postprocessing=False):
+            skip_postprocessing=False,
+            remove_atmospherics=False,
+            speakers_count=None):
         """Submit a local file for transcription.
         Note that the content type is inferred if not provided.
 
@@ -198,6 +205,9 @@ def submit_job_local_file(
             invoke on job completion as a webhook and optional authentication headers to use when
             calling the callback url
         :param skip_postprocessing: skip all text postprocessing (punctuation, capitalization, ITN)
+        :param remove_atmospherics: if True, atmospherics such as <laugh>, <affirmative>, etc.
+            will not appear in the transcript
+        :param speakers_count: the total number of unique speakers in the audio
         :returns: raw response data
         :raises: HTTPError, ValueError
         """
@@ -463,7 +473,9 @@ def _create_job_options_payload(
             speaker_names=None,
             source_config=None,
             notification_config=None,
-            skip_postprocessing=False):
+            skip_postprocessing=False,
+            remove_atmospherics=None,
+            speakers_count=None):
         payload = {}
         if media_url:
             payload['media_url'] = media_url
@@ -508,6 +520,10 @@ def _create_job_options_payload(
             payload['notification_config'] = notification_config.to_dict()
         if skip_postprocessing:
             payload['skip_postprocessing'] = skip_postprocessing
+        if remove_atmospherics:
+            payload['remove_atmospherics'] = remove_atmospherics
+        if speakers_count:
+            payload['speakers_count'] = speakers_count
         return payload
 
     def _create_captions_query(self, speaker_channel):
diff --git a/src/rev_ai/models/asynchronous/job.py b/src/rev_ai/models/asynchronous/job.py
@@ -26,7 +26,9 @@ def __init__(
             transcriber=None,
             verbatim=None,
             rush=None,
-            segments_to_transcribe=None):
+            segments_to_transcribe=None,
+            remove_atmospherics=None,
+            speakers_count=None):
         """
         :param id_: unique id of job
         :param created_on: date and time at which this job was started
@@ -54,6 +56,9 @@ def __init__(
         :param verbatim: whether to transcribe verbatim if provided for human transcription
         :param rush: whether to transcribe with rush if provided for human transcription
         :param segments_to_transcribe: segments to transcribe if provided for human transcription
+        :param remove_atmospherics: whether atmospherics such as <laugh>, <affirmative>, etc.
+            are omitted from the transcript
+        :param speakers_count: the total number of unique speakers in the audio
         """
         self.id = id_
         self.created_on = created_on
@@ -78,6 +83,8 @@ def __init__(
         self.verbatim = verbatim
         self.rush = rush
         self.segments_to_transcribe = segments_to_transcribe
+        self.remove_atmospherics = remove_atmospherics
+        self.speakers_count = speakers_count
 
     def __eq__(self, other):
         """Override default equality operator"""
@@ -111,5 +118,7 @@ def from_json(cls, json):
             transcriber=json.get('transcriber'),
             verbatim=json.get('verbatim'),
             rush=json.get('rush'),
-            segments_to_transcribe=json.get('segments_to_transcribe')
+            segments_to_transcribe=json.get('segments_to_transcribe'),
+            remove_atmospherics=json.get('remove_atmospherics'),
+            speakers_count=json.get('speakers_count')
         )