alt-text/tests/test.py

60 lines
1.8 KiB
Python

import sys
sys.path.append("../")
import src.alttext.alttext as alttext
from src.alttext.descengine.bliplocal import BlipLocal
from src.alttext.descengine.replicateapi import ReplicateAPI
from src.alttext.ocrengine.tesseract import Tesseract
from src.alttext.langengine.privategpt import PrivateGPT
from src.alttext.langengine.openaiapi import OpenAIAPI
import keys
# HTML BOOK FILEPATHS
HTML_ADVENTURES = "../books/pg76-h/pg76-images.html"
HTML_BIRD = "../books/pg30221-h/pg30221-images.html"
HTML_HUNTING = "../books/pg37122-h/pg37122-images.html"
HTML_MECHANIC = "../books/pg71856-h/pg71856-images.html"
HTML_INFINITY = "../books/pg71859-h/pg71859-images.html"
# EPUB BOOK FILEPATHS
EPUB1 = "../books/pg71856-images-3.epub"
EPUB2 = "../books/pg71908-images-3.epub"
EPUB3 = "../books/seuss.epub"
HOST1 = "http://127.0.0.1:8001"
def testHTML():
print("TESTING HTML")
alt: alttext.AltTextHTML = alttext.AltTextHTML(
# BlipLocal("C:/Users/dacru/Desktop/ALT/image-captioning"),
ReplicateAPI(keys.ReplicateEricKey()),
Tesseract(),
# PrivateGPT(HOST1),
OpenAIAPI(keys.OpenAIKey(), "gpt-3.5-turbo"),
)
# imgs = alt.getAllImgs()
alt.parseFile(HTML_ADVENTURES)
img = alt.getImg("images/c01-21.jpg")
src = img.attrs["src"]
imgData = alt.getImgData(src)
chars = alt.genChars(imgData, src)
desc = alt.genDesc(imgData, src, alt.getContext(img))
altText = alt.genAltText(src)
print(chars)
print("=====================================")
print(desc)
print("=====================================")
print(altText)
# desc = alt.genDesc(alt.getImgData(src), src)
# print(desc)
# associations = alt.genAltAssociations(imgs)
# print(associations)
if __name__ == "__main__":
testHTML()