Loaders
__all__ = ['BaseLoader', 'BaseTextLoader', 'TextLoader', 'PdfLoader', 'WebLoader', 'SqlLoader', 'CsvLoader', 'DataFrameLoader', 'EmailLoader', 'ImageLoader', 'BlobLoader']
module-attribute
BaseLoader
Bases: ABC
Source code in griptape/loaders/base_loader.py
encoding: Optional[str] = field(default=None, kw_only=True)
class-attribute
instance-attribute
futures_executor: futures.Executor = field(default=Factory(lambda: futures.ThreadPoolExecutor()), kw_only=True)
class-attribute
instance-attribute
load(source, *args, **kwargs)
abstractmethod
load_collection(sources, *args, **kwargs)
Source code in griptape/loaders/base_loader.py
to_key(source, *args, **kwargs)
BaseTextLoader
Bases: BaseLoader, ABC
Source code in griptape/loaders/base_text_loader.py
MAX_TOKEN_RATIO = 0.5
class-attribute
instance-attribute
chunker: BaseChunker = field(default=Factory(lambda self: TextChunker(tokenizer=self.tokenizer, max_tokens=self.max_tokens), takes_self=True), kw_only=True)
class-attribute
instance-attribute
embedding_driver: Optional[BaseEmbeddingDriver] = field(default=None, kw_only=True)
class-attribute
instance-attribute
encoding: str = field(default='utf-8', kw_only=True)
class-attribute
instance-attribute
max_tokens: int = field(default=Factory(lambda self: round(self.tokenizer.max_input_tokens * self.MAX_TOKEN_RATIO), takes_self=True), kw_only=True)
class-attribute
instance-attribute
tokenizer: OpenAiTokenizer = field(default=Factory(lambda: OpenAiTokenizer(model=OpenAiTokenizer.DEFAULT_OPENAI_GPT_3_CHAT_MODEL)), kw_only=True)
class-attribute
instance-attribute
load_collection(sources, *args, **kwargs)
BlobLoader
Bases: BaseLoader
Source code in griptape/loaders/blob_loader.py
load(source, *args, **kwargs)
load_collection(sources, *args, **kwargs)
CsvLoader
Bases: BaseLoader
Source code in griptape/loaders/csv_loader.py
delimiter: str = field(default=',', kw_only=True)
class-attribute
instance-attribute
embedding_driver: Optional[BaseEmbeddingDriver] = field(default=None, kw_only=True)
class-attribute
instance-attribute
encoding: str = field(default='utf-8', kw_only=True)
class-attribute
instance-attribute
load(source, *args, **kwargs)
Source code in griptape/loaders/csv_loader.py
load_collection(sources, *args, **kwargs)
Source code in griptape/loaders/csv_loader.py
DataFrameLoader
Bases: BaseLoader
Source code in griptape/loaders/dataframe_loader.py
embedding_driver: Optional[BaseEmbeddingDriver] = field(default=None, kw_only=True)
class-attribute
instance-attribute
load(source, *args, **kwargs)
Source code in griptape/loaders/dataframe_loader.py
load_collection(sources, *args, **kwargs)
to_key(source, *args, **kwargs)
EmailLoader
Bases: BaseLoader
Source code in griptape/loaders/email_loader.py
imap_url: str = field(kw_only=True)
class-attribute
instance-attribute
password: str = field(kw_only=True)
class-attribute
instance-attribute
username: str = field(kw_only=True)
class-attribute
instance-attribute
EmailQuery
An email retrieval query.
Attributes:
| Name | Type | Description |
|---|---|---|
| label | str | Label to retrieve emails from, such as 'INBOX' or 'SENT'. |
| key | Optional[str] | Optional key for filtering, such as 'FROM' or 'SUBJECT'. |
| search_criteria | Optional[str] | Optional search criteria to filter emails by key. |
| max_count | Optional[int] | Optional max email count. |
Source code in griptape/loaders/email_loader.py
key: Optional[str] = field(default=None, kw_only=True)
class-attribute
instance-attribute
label: str = field(kw_only=True)
class-attribute
instance-attribute
max_count: Optional[int] = field(default=None, kw_only=True)
class-attribute
instance-attribute
search_criteria: Optional[str] = field(default=None, kw_only=True)
class-attribute
instance-attribute
load(source, *args, **kwargs)
Source code in griptape/loaders/email_loader.py
load_collection(sources, *args, **kwargs)
ImageLoader
Bases: BaseLoader
Loads images into image artifacts.
Attributes:
| Name | Type | Description |
|---|---|---|
| format | Optional[str] | If provided, attempts to ensure image artifacts are in this format when loaded. For example, when set to 'PNG', loading image.jpg will return an ImageArtifact containing the image bytes in PNG format. |
Source code in griptape/loaders/image_loader.py
FORMAT_TO_MIME_TYPE = {'bmp': 'image/bmp', 'gif': 'image/gif', 'jpeg': 'image/jpeg', 'png': 'image/png', 'tiff': 'image/tiff', 'webp': 'image/webp'}
class-attribute
instance-attribute
format: Optional[str] = field(default=None, kw_only=True)
class-attribute
instance-attribute
load(source, *args, **kwargs)
Source code in griptape/loaders/image_loader.py
PdfLoader
Bases: BaseTextLoader
Source code in griptape/loaders/pdf_loader.py
chunker: PdfChunker = field(default=Factory(lambda self: PdfChunker(tokenizer=self.tokenizer, max_tokens=self.max_tokens), takes_self=True), kw_only=True)
class-attribute
instance-attribute
encoding: None = field(default=None, kw_only=True)
class-attribute
instance-attribute
load(source, password=None, *args, **kwargs)
Source code in griptape/loaders/pdf_loader.py
load_collection(sources, *args, **kwargs)
SqlLoader
Bases: BaseLoader
Source code in griptape/loaders/sql_loader.py
embedding_driver: Optional[BaseEmbeddingDriver] = field(default=None, kw_only=True)
class-attribute
instance-attribute
sql_driver: BaseSqlDriver = field(kw_only=True)
class-attribute
instance-attribute
load(source, *args, **kwargs)
Source code in griptape/loaders/sql_loader.py
TextLoader
Bases: BaseTextLoader
Source code in griptape/loaders/text_loader.py
MAX_TOKEN_RATIO = 0.5
class-attribute
instance-attribute
chunker: TextChunker = field(default=Factory(lambda self: TextChunker(tokenizer=self.tokenizer, max_tokens=self.max_tokens), takes_self=True), kw_only=True)
class-attribute
instance-attribute
embedding_driver: Optional[BaseEmbeddingDriver] = field(default=None, kw_only=True)
class-attribute
instance-attribute
encoding: str = field(default='utf-8', kw_only=True)
class-attribute
instance-attribute
max_tokens: int = field(default=Factory(lambda self: round(self.tokenizer.max_input_tokens * self.MAX_TOKEN_RATIO), takes_self=True), kw_only=True)
class-attribute
instance-attribute
tokenizer: OpenAiTokenizer = field(default=Factory(lambda: OpenAiTokenizer(model=OpenAiTokenizer.DEFAULT_OPENAI_GPT_3_CHAT_MODEL)), kw_only=True)
class-attribute
instance-attribute
load(source, *args, **kwargs)
Source code in griptape/loaders/text_loader.py
load_collection(sources, *args, **kwargs)
Source code in griptape/loaders/text_loader.py
WebLoader
Bases: BaseTextLoader