Module: pdf_content

Expand source code
# Copyright (C) 2023-present The Project Contributors
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from abc import abstractmethod
from dataclasses import dataclass
from typing_extensions import Self
from cl.runtime.records.dataclasses_extensions import missing
from cl.convince.content.content import Content


@dataclass(slots=True, kw_only=True)
class PdfContent(Content):
    """Content stored as a PDF document in its original format (raw bytes)."""

    pdf_bytes: bytes = missing()
    """Raw bytes of the PDF document, kept in its original format."""

    @abstractmethod
    def as_str(self) -> str:
        """Convert to string format (declared abstract here; this body only raises)."""
        raise NotImplementedError

    @classmethod
    @abstractmethod
    def from_str(cls, value: str) -> Self:
        """Convert from string format (declared abstract here; this body only raises)."""
        raise NotImplementedError

Classes

class PdfContent (*, content_id: str = None, pdf_bytes: bytes = None)

Content stored as a PDF document in its original format (raw bytes).

Expand source code
@dataclass(slots=True, kw_only=True)
class PdfContent(Content):
    """Content stored as a PDF document in its original format (raw bytes)."""

    pdf_bytes: bytes = missing()
    """Raw bytes of the PDF document, kept in its original format."""

    @abstractmethod
    def as_str(self) -> str:
        """Convert to string format (declared abstract here; this body only raises)."""
        raise NotImplementedError

    @classmethod
    @abstractmethod
    def from_str(cls, value: str) -> Self:
        """Convert from string format (declared abstract here; this body only raises)."""
        raise NotImplementedError

Ancestors

Static methods

def from_str(value: str) -> Self

Inherited from: Content.from_str

Convert from string format.

def get_key_type() -> Type

Inherited from: Content.get_key_type

Return key type even when called from a record.

Fields

var content_id -> str

Inherited from: Content.content_id

Unique content identifier.

var pdf_bytes -> bytes

PDF document in its original format.

Methods

def as_str(self) -> str

Inherited from: Content.as_str

Convert to string format.

def get_key(self) -> ContentKey

Inherited from: Content.get_key

Return a new key object whose fields are populated from self; do not return self.

def init_all(self) -> None

Inherited from: Content.init_all

Invoke ‘init’ for each class in the order from base to derived, then validate against schema.