Skip to content

Commit ce591e2

Browse files
authored
Fix missing sensitive fields for embedders (#3263)
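A few embedder config types were missing the sensitive-field annotation on their `api_key` field; this commit marks those fields with `enhanced_field(sensitive=True)`.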
1 parent 88b08a7 commit ce591e2

File tree

5 files changed

+10
-4
lines changed

5 files changed

+10
-4
lines changed

Diff for: CHANGELOG.md

+2
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,8 @@
1010

1111
* **`partition()` now forwards `strategy` arg to `partition_docx()`, `partition_ppt()`, and `partition_pptx()`.** A `strategy` argument passed to `partition()` (or the default value "auto" assigned by `partition()`) is now forwarded to `partition_docx()`, `partition_ppt()`, and `partition_pptx()` when those filetypes are detected.
1212

13+
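* **Fix missing sensitive field markers for embedders.** The `api_key` field of `OctoAiEmbeddingConfig`, `OpenAIEmbeddingConfig`, `VertexAIEmbeddingConfig`, and `VoyageAIEmbeddingConfig` is now declared with `enhanced_field(sensitive=True)`.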
14+
1315
## 0.14.7
1416

1517
### Enhancements

Diff for: unstructured/embed/octoai.py

+2-1
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@
77
Element,
88
)
99
from unstructured.embed.interfaces import BaseEmbeddingEncoder, EmbeddingConfig
10+
from unstructured.ingest.enhanced_dataclass import enhanced_field
1011
from unstructured.ingest.error import EmbeddingEncoderConnectionError
1112
from unstructured.utils import requires_dependencies
1213

@@ -18,7 +19,7 @@
1819

1920
@dataclass
2021
class OctoAiEmbeddingConfig(EmbeddingConfig):
21-
api_key: str
22+
api_key: str = enhanced_field(sensitive=True)
2223
model_name: str = "thenlper/gte-large"
2324

2425

Diff for: unstructured/embed/openai.py

+2-1
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@
77
Element,
88
)
99
from unstructured.embed.interfaces import BaseEmbeddingEncoder, EmbeddingConfig
10+
from unstructured.ingest.enhanced_dataclass import enhanced_field
1011
from unstructured.ingest.error import EmbeddingEncoderConnectionError
1112
from unstructured.utils import requires_dependencies
1213

@@ -16,7 +17,7 @@
1617

1718
@dataclass
1819
class OpenAIEmbeddingConfig(EmbeddingConfig):
19-
api_key: str
20+
api_key: str = enhanced_field(sensitive=True)
2021
model_name: str = "text-embedding-ada-002"
2122

2223

Diff for: unstructured/embed/vertexai.py

+2-1
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@
1010
Element,
1111
)
1212
from unstructured.embed.interfaces import BaseEmbeddingEncoder, EmbeddingConfig
13+
from unstructured.ingest.enhanced_dataclass import enhanced_field
1314
from unstructured.ingest.error import EmbeddingEncoderConnectionError
1415
from unstructured.utils import FileHandler, requires_dependencies
1516

@@ -19,7 +20,7 @@
1920

2021
@dataclass
2122
class VertexAIEmbeddingConfig(EmbeddingConfig):
22-
api_key: str
23+
api_key: str = enhanced_field(sensitive=True)
2324
model_name: Optional[str] = "textembedding-gecko@001"
2425

2526

Diff for: unstructured/embed/voyageai.py

+2-1
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55

66
from unstructured.documents.elements import Element
77
from unstructured.embed.interfaces import BaseEmbeddingEncoder, EmbeddingConfig
8+
from unstructured.ingest.enhanced_dataclass import enhanced_field
89
from unstructured.ingest.error import EmbeddingEncoderConnectionError
910
from unstructured.utils import requires_dependencies
1011

@@ -14,7 +15,7 @@
1415

1516
@dataclass
1617
class VoyageAIEmbeddingConfig(EmbeddingConfig):
17-
api_key: str
18+
api_key: str = enhanced_field(sensitive=True)
1819
model_name: str
1920
batch_size: Optional[int] = None
2021
truncation: Optional[bool] = None

0 commit comments

Comments
 (0)