feat: add auto_highlights functionality

dmccrystal · s0h3yl · commit b675bf6f85f7 · 2023-06-13T21:34:21.000+02:00
GitOrigin-RevId: 3a68cd7986efea85c30a712dda45b8de245019f7
diff --git a/README.md b/README.md
@@ -412,6 +412,29 @@ for entity in transcript.entities:
 
 [Read more about entity detection here.](https://www.assemblyai.com/docs/Models/entity_detection)
 
+</details>
+<details>
+  <summary>Identify Important Words and Phrases in a Transcript</summary>
+
+```python
+import assemblyai as aai
+
+transcriber = aai.Transcriber()
+transcript = transcriber.transcribe(
+  "https://example.org/audio.mp3",
+  config=aai.TranscriptionConfig(auto_highlights=True)
+)
+
+for result in transcript.auto_highlights_result.results:
+  print(result.text)  # the important phrase
+  print(result.rank)  # relevancy of the phrase
+  print(result.count)  # number of instances of the phrase
+  for timestamp in result.timestamps:
+    print(f"Timestamp: {timestamp.start} - {timestamp.end}")
+```
+
+[Read more about auto highlights here.](https://www.assemblyai.com/docs/Models/key_phrases)
+
 </details>
 
 ---
diff --git a/assemblyai/transcriber.py b/assemblyai/transcriber.py
@@ -226,6 +226,10 @@ def sentiment_analysis_results(self) -> Optional[List[types.Sentiment]]:
     def entities(self) -> Optional[List[types.Entity]]:
         return self._impl.transcript.entities
 
+    @property
+    def auto_highlights_result(self) -> Optional[types.AutohighlightResponse]:
+        return self._impl.transcript.auto_highlights_result
+
     @property
     def status(self) -> types.TranscriptStatus:
         "The current status of the transcript"
diff --git a/assemblyai/types.py b/assemblyai/types.py
@@ -370,8 +370,8 @@ class RawTranscriptionConfig(BaseModel):
     summary_type: Optional[SummarizationType]
     "The summarization type to use in case `summarization` is enabled"
 
-    # auto_highlights: bool = False
-    # "Detect important phrases and words in your transcription text."
+    auto_highlights: Optional[bool]
+    "Detect important phrases and words in your transcription text."
 
     language_detection: Optional[bool]
     """
@@ -424,7 +424,7 @@ def __init__(
         summarization: Optional[bool] = None,
         summary_model: Optional[SummarizationModel] = None,
         summary_type: Optional[SummarizationType] = None,
-        # auto_highlights: bool = False,
+        auto_highlights: Optional[bool] = None,
         language_detection: Optional[bool] = None,
         raw_transcription_config: Optional[RawTranscriptionConfig] = None,
     ) -> None:
@@ -502,7 +502,7 @@ def __init__(
             summary_model,
             summary_type,
         )
-        # self.auto_highlights = auto_highlights
+        self.auto_highlights = auto_highlights
         self.language_detection = language_detection
 
     @property
@@ -793,17 +793,17 @@ def summary_type(self) -> Optional[SummarizationType]:
 
         return self._raw_transcription_config.summary_type
 
-    # @property
-    # def auto_highlights(self) -> bool:
-    #     "Returns whether the Auto Highlights feature is enabled or not."
+    @property
+    def auto_highlights(self) -> Optional[bool]:
+        "Returns whether the Auto Highlights feature is enabled or not."
 
-    #     return self._raw_transcription_config.auto_highlights
+        return self._raw_transcription_config.auto_highlights
 
-    # @auto_highlights.setter
-    # def auto_highlights(self, enable: bool) -> None:
-    #     "Detect important phrases and words in your transcription text."
+    @auto_highlights.setter
+    def auto_highlights(self, enable: Optional[bool]) -> None:
+        "Detect important phrases and words in your transcription text."
 
-    #     self._raw_transcription_config.auto_highlights = enable
+        self._raw_transcription_config.auto_highlights = enable
 
     @property
     def language_detection(self) -> Optional[bool]:
@@ -1380,8 +1380,8 @@ class BaseTranscript(BaseModel):
     summary_type: Optional[SummarizationType]
     "The summarization type to use in case `summarization` is enabled"
 
-    # auto_highlights: bool = False
-    # "Detect important phrases and words in your transcription text."
+    auto_highlights: Optional[bool]
+    "Detect important phrases and words in your transcription text."
 
     language_detection: Optional[bool]
     """
@@ -1442,8 +1442,8 @@ class TranscriptResponse(BaseTranscript):
     summary: Optional[str]
     "The summarization of the transcript"
 
-    # auto_highlights_result: Optional[AutohighlightResponse] = None
-    # "The list of results when enabling Automatic Transcript Highlights"
+    auto_highlights_result: Optional[AutohighlightResponse]
+    "The list of results when enabling Automatic Transcript Highlights"
 
     content_safety_labels: Optional[ContentSafetyResponse]
     "The list of results when Content Safety is enabled"
diff --git a/tests/unit/BUILD.bazel b/tests/unit/BUILD.bazel
@@ -23,6 +23,7 @@ py_test(
     name = "unit_test",
     srcs = [
         "test_auto_chapters.py",
+        "test_auto_highlights.py",
         "test_client.py",
         "test_config.py",
         "test_content_safety.py",
diff --git a/tests/unit/test_auto_highlights.py b/tests/unit/test_auto_highlights.py
@@ -0,0 +1,149 @@
+import json
+from typing import Any, Dict, Tuple
+
+import factory
+import httpx
+from pytest_httpx import HTTPXMock
+
+import assemblyai as aai
+from tests.unit import factories
+
+aai.settings.api_key = "test"
+
+
+class AutohighlightResultFactory(factory.Factory):  # builds one fake highlighted phrase
+    class Meta:
+        model = aai.types.AutohighlightResult
+
+    count = factory.Faker("pyint")  # number of instances of the phrase
+    rank = factory.Faker("pyfloat")  # relevancy of the phrase
+    text = factory.Faker("sentence")  # the important phrase itself
+    timestamps = factory.List([factory.SubFactory(factories.TimestampFactory)])  # single-element list
+
+
+class AutohighlightResponseFactory(factory.Factory):  # builds the `auto_highlights_result` payload
+    class Meta:
+        model = aai.types.AutohighlightResponse
+
+    status = aai.types.StatusResult.success  # always a successful result
+    results = factory.List([factory.SubFactory(AutohighlightResultFactory)])  # exactly one result
+
+
+class AutohighlightTranscriptResponseFactory(
+    factories.TranscriptCompletedResponseFactory
+):
+    auto_highlights_result = factory.SubFactory(AutohighlightResponseFactory)  # adds the highlights payload
+
+
+def __submit_mock_request(
+    httpx_mock: HTTPXMock,
+    mock_response: Dict[str, Any],
+    config: aai.TranscriptionConfig,
+) -> Tuple[Dict[str, Any], aai.Transcript]:
+    """
+    Helper function to abstract mock transcriber calls with given `TranscriptionConfig`,
+    and perform some common assertions.
+    """
+
+    mock_transcript_id = mock_response.get("id", "mock_id")  # fixed fallback if the mock has no ID
+
+    # Mock initial submission response (transcript is processing)
+    mock_processing_response = factories.generate_dict_factory(
+        factories.TranscriptProcessingResponseFactory
+    )()
+
+    httpx_mock.add_response(
+        url=f"{aai.settings.base_url}/transcript",
+        status_code=httpx.codes.OK,
+        method="POST",
+        json={
+            **mock_processing_response,
+            "id": mock_transcript_id,  # inject ID from main mock response
+        },
+    )
+
+    # Mock the polling-for-completion response, which returns the completed transcript
+    httpx_mock.add_response(
+        url=f"{aai.settings.base_url}/transcript/{mock_transcript_id}",
+        status_code=httpx.codes.OK,
+        method="GET",
+        json=mock_response,
+    )
+
+    # == Make API request via SDK ==
+    transcript = aai.Transcriber().transcribe(
+        data="https://example.org/audio.wav",
+        config=config,
+    )
+
+    # Check that exactly one submission (POST) and one polling (GET) request were made
+    assert len(httpx_mock.get_requests()) == 2
+
+    # Extract body of initial submission request
+    request = httpx_mock.get_requests()[0]
+    request_body = json.loads(request.content.decode())
+
+    return request_body, transcript
+
+
+def test_auto_highlights_disabled_by_default(httpx_mock: HTTPXMock):
+    """
+    Tests that excluding `auto_highlights` from the `TranscriptionConfig` will
+    result in the default behavior of it being excluded from the request body
+    """
+    request_body, transcript = __submit_mock_request(
+        httpx_mock,
+        mock_response=factories.generate_dict_factory(
+            factories.TranscriptCompletedResponseFactory
+        )(),
+        config=aai.TranscriptionConfig(),
+    )
+    assert request_body.get("auto_highlights") is None  # passes if the key is absent or null
+    assert transcript.auto_highlights_result is None
+
+
+def test_auto_highlights_enabled(httpx_mock: HTTPXMock):
+    """
+    Tests that including `auto_highlights=True` in the `TranscriptionConfig`
+    will result in `auto_highlights=True` in the request body, and that the
+    response is properly parsed into a `Transcript` object
+    """
+    mock_response = factories.generate_dict_factory(
+        AutohighlightTranscriptResponseFactory
+    )()
+    request_body, transcript = __submit_mock_request(
+        httpx_mock,
+        mock_response=mock_response,
+        config=aai.TranscriptionConfig(auto_highlights=True),
+    )
+
+    # JSON `true` decodes to the `True` singleton; identity rejects look-alikes such as `1`
+    assert request_body.get("auto_highlights") is True
+
+    # Check that transcript was properly parsed from JSON response
+    assert transcript.error is None
+    assert transcript.auto_highlights_result is not None
+    assert (
+        transcript.auto_highlights_result.status
+        == mock_response["auto_highlights_result"]["status"]
+    )
+
+    assert transcript.auto_highlights_result.results is not None
+    assert len(transcript.auto_highlights_result.results) > 0
+    assert len(transcript.auto_highlights_result.results) == len(
+        mock_response["auto_highlights_result"]["results"]
+    )
+
+    for response_result, transcript_result in zip(  # lengths were asserted equal above
+        mock_response["auto_highlights_result"]["results"],
+        transcript.auto_highlights_result.results,
+    ):
+        assert transcript_result.count == response_result["count"]
+        assert transcript_result.rank == response_result["rank"]
+        assert transcript_result.text == response_result["text"]
+
+        for response_timestamp, transcript_timestamp in zip(
+            response_result["timestamps"], transcript_result.timestamps
+        ):
+            assert transcript_timestamp.start == response_timestamp["start"]
+            assert transcript_timestamp.end == response_timestamp["end"]