Add default source-location identity and opt-in content-digest identity for file move/rename reconciliation, plus PDF/DOCX-style placeholder ingestion

This commit is contained in:
2026-05-06 13:04:36 +02:00
parent 48dffedc09
commit a4a4759ac4
13 changed files with 724 additions and 39 deletions

View File

@@ -9,6 +9,7 @@ from .ingestion import (
ExtractionResult,
ExtractorCapability,
IngestionFailure,
IngestionIdentityPolicy,
IngestionJob,
IngestionJobStatus,
NormalizedDocument,
@@ -58,6 +59,7 @@ __all__ = [
"IdempotencyRecord",
"IdempotencyStatus",
"IngestionFailure",
"IngestionIdentityPolicy",
"IngestionJob",
"IngestionJobStatus",
"KnowledgeAsset",

View File

@@ -21,6 +21,11 @@ class IngestionJobStatus(str, Enum):
CANCELED = "canceled"
class IngestionIdentityPolicy(str, Enum):
    """Closed set of identity policies for ingestion.

    Members also subclass ``str``, so each member compares equal to its raw
    string value and can be looked up from that value, e.g.
    ``IngestionIdentityPolicy("content_digest")``.
    """

    # Identity keyed on the source location.
    # NOTE(review): the change description calls this the default policy —
    # confirm where that default is actually applied.
    SOURCE_LOCATION = "source_location"

    # Identity keyed on a digest of the content.
    # NOTE(review): described as opt-in, intended for reconciling file
    # moves/renames — confirm against the consuming code.
    CONTENT_DIGEST = "content_digest"
@dataclass(frozen=True)
class IngestionFailure:
code: str