diff options
| author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2024-04-08 00:23:52 +0200 |
|---|---|---|
| committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2024-04-08 00:23:52 +0200 |
| commit | 8211705debf9d1335223c606275f46c43c78d8a2 (patch) | |
| tree | f09f902c7d31b2035813c42cbb4a47e720fa363b /rag/db/document.py | |
| parent | 95f47c4900a96d91daaef93bf87094ed3d4da43c (diff) | |
Updates
Diffstat (limited to 'rag/db/document.py')
| -rw-r--r-- | rag/db/document.py | 7 |
1 files changed, 4 insertions, 3 deletions
diff --git a/rag/db/document.py b/rag/db/document.py
index 528a399..54ac451 100644
--- a/rag/db/document.py
+++ b/rag/db/document.py
@@ -1,6 +1,7 @@
 import hashlib
 import os
 
+from langchain_community.document_loaders.blob_loaders import Blob
 import psycopg
 from loguru import logger as log
 
@@ -26,11 +27,11 @@ class DocumentDB:
             cur.execute(TABLES)
             self.conn.commit()
 
-    def __hash(self, blob: bytes) -> str:
+    def __hash(self, blob: Blob) -> str:
         log.debug("Hashing document...")
-        return hashlib.sha256(blob).hexdigest()
+        return hashlib.sha256(blob.as_bytes()).hexdigest()
 
-    def add(self, blob: bytes) -> bool:
+    def add(self, blob: Blob) -> bool:
         with self.conn.cursor() as cur:
             hash = self.__hash(blob)
             cur.execute(