# This is an automatically generated code sample.
# To make this code sample work in your Oracle Cloud tenancy,
# please replace the values for any parameters whose current values do not fit
# your use case (such as resource IDs, strings containing ‘EXAMPLE’ or ‘unique_id’, and
# boolean, number, and enum parameters with values not fitting your use case).
from datetime import datetime
import oci
# Create a default config using DEFAULT profile in default location
# Refer to
# https://docs.cloud.oracle.com/en-us/iaas/Content/API/Concepts/sdkconfig.htm#SDK_and_CLI_Configuration_File
# for more info
config = oci.config.from_file()

# Build the AI Document service client from the loaded configuration.
ai_document_client = oci.ai_document.AIServiceDocumentClient(config)

# Short alias for the model namespace used by every object constructed below.
models = oci.ai_document.models


def _single_vertex_polygon(x, y):
    """Return a BoundingPolygon holding exactly one NormalizedVertex at (x, y)."""
    return models.BoundingPolygon(
        normalized_vertices=[models.NormalizedVertex(x=x, y=y)])


# --- Request pieces, assembled in the order they appear in the request ---

# The single feature requested for this analysis.
text_extraction_feature = models.DocumentTextExtractionFeature(
    feature_type="TEXT_EXTRACTION",
    generate_searchable_pdf=False,
    model_id="ocid1.test.oc1..<unique_ID>EXAMPLE-modelId-Value",
    selection_mark_detection=True)

# The input document, referenced by its Object Storage coordinates.
input_document = models.ObjectStorageDocumentDetails(
    source="OBJECT_STORAGE",
    namespace_name="EXAMPLE-namespaceName-Value",
    bucket_name="EXAMPLE-bucketName-Value",
    object_name="EXAMPLE-objectName-Value",
    page_range=["EXAMPLE--Value"])

# The output location passed with the request.
result_location = models.OutputLocation(
    namespace_name="EXAMPLE-namespaceName-Value",
    bucket_name="EXAMPLE-bucketName-Value",
    prefix="EXAMPLE-prefix-Value")

# Timestamp carried by the TIME-typed field value on the sample page.
field_timestamp = datetime.strptime(
    "2034-02-10T12:50:21.029Z",
    "%Y-%m-%dT%H:%M:%S.%fZ")

# One fully populated page for the OCR data supplied with the request.
sample_page = models.Page(
    page_number=525,
    dimensions=models.Dimensions(
        width=6383.161,
        height=5292.445,
        unit="INCH"),
    detected_document_types=[
        models.DetectedDocumentType(
            document_type="EXAMPLE-documentType-Value",
            confidence=0.50883406,
            document_id="ocid1.test.oc1..<unique_ID>EXAMPLE-documentId-Value")],
    detected_languages=[
        models.DetectedLanguage(
            language="EXAMPLE-language-Value",
            confidence=0.46551925)],
    words=[
        models.Word(
            text="EXAMPLE-text-Value",
            confidence=0.5997962,
            bounding_polygon=_single_vertex_polygon(0.2738042, 0.8219967))],
    lines=[
        models.Line(
            text="EXAMPLE-text-Value",
            confidence=0.66393584,
            bounding_polygon=_single_vertex_polygon(0.32212847, 0.8598904),
            word_indexes=[511])],
    tables=[
        models.Table(
            row_count=549,
            column_count=362,
            header_rows=[
                models.TableRow(
                    cells=[
                        models.Cell(
                            text="EXAMPLE-text-Value",
                            row_index=224,
                            column_index=550,
                            confidence=0.6347457,
                            bounding_polygon=_single_vertex_polygon(
                                0.34505373, 0.4139248),
                            word_indexes=[611])])],
            confidence=0.18187869,
            bounding_polygon=_single_vertex_polygon(0.7356378, 0.04115498))],
    document_fields=[
        models.DocumentField(
            field_type="LINE_ITEM_FIELD",
            field_value=models.ValueTime(
                value_type="TIME",
                confidence=0.49089772,
                bounding_polygon=_single_vertex_polygon(0.8098093, 0.37790602),
                word_indexes=[595],
                value=field_timestamp,
                text="EXAMPLE-text-Value",
                normalized_value="EXAMPLE-normalizedValue-Value",
                normalized_confidence=0.2273649),
            field_label=models.FieldLabel(
                name="EXAMPLE-name-Value",
                confidence=0.58054036),
            field_name=models.FieldName(
                name="EXAMPLE-name-Value",
                confidence=0.073206306,
                bounding_polygon=_single_vertex_polygon(0.1410889, 0.203111),
                word_indexes=[127]))],
    signatures=[
        models.Signature(
            confidence=0.57584155,
            bounding_polygon=_single_vertex_polygon(0.2771057, 0.24466419))],
    bar_codes=[
        models.BarCode(
            confidence=0.5484517,
            value="EXAMPLE-value-Value",
            bounding_polygon=_single_vertex_polygon(0.42452675, 0.26406038),
            code_type="EXAMPLE-codeType-Value")],
    selection_marks=[
        models.SelectionMark(
            state="UNSELECTED",
            confidence=0.74348044,
            bounding_polygon=_single_vertex_polygon(0.035226166, 0.24242514))])

# OCR data supplied with the request, wrapping the page above.
supplied_ocr_data = models.AnalyzeDocumentResult(
    document_metadata=models.DocumentMetadata(
        page_count=79,
        mime_type="EXAMPLE-mimeType-Value"),
    pages=[sample_page],
    detected_document_types=[
        models.DetectedDocumentType(
            document_type="EXAMPLE-documentType-Value",
            confidence=0.98944896,
            document_id="ocid1.test.oc1..<unique_ID>EXAMPLE-documentId-Value")],
    detected_languages=[
        models.DetectedLanguage(
            language="EXAMPLE-language-Value",
            confidence=0.538474)],
    document_classification_model_version="EXAMPLE-documentClassificationModelVersion-Value",
    language_classification_model_version="EXAMPLE-languageClassificationModelVersion-Value",
    text_extraction_model_version="EXAMPLE-textExtractionModelVersion-Value",
    key_value_extraction_model_version="EXAMPLE-keyValueExtractionModelVersion-Value",
    table_extraction_model_version="EXAMPLE-tableExtractionModelVersion-Value",
    signature_extraction_model_version="EXAMPLE-signatureExtractionModelVersion-Value",
    bar_code_extraction_model_version="EXAMPLE-barCodeExtractionModelVersion-Value",
    errors=[
        models.ProcessingError(
            code="EXAMPLE-code-Value",
            message="EXAMPLE-message-Value")],
    searchable_pdf="4PbLq2uMbnU7mSwzSLnH")

# Complete request payload.
request_details = models.AnalyzeDocumentDetails(
    features=[text_extraction_feature],
    document=input_document,
    compartment_id="ocid1.test.oc1..<unique_ID>EXAMPLE-compartmentId-Value",
    output_location=result_location,
    language="EXAMPLE-language-Value",
    document_type="PAYSLIP",
    ocr_data=supplied_ocr_data)

# Send the request to the service. Some parameters are not required; see the
# API doc for more info.
analyze_document_response = ai_document_client.analyze_document(
    analyze_document_details=request_details,
    if_match="EXAMPLE-ifMatch-Value",
    opc_request_id="4908UPQFCDVP1KJSN8VT<unique_ID>")

# Print the data returned in the response.
print(analyze_document_response.data)