alt-text/tests/test.py

50 lines
1.4 KiB
Python

import sys
sys.path.append("../")
import src.alttext.alttext as alttext
from src.alttext.descengine.bliplocal import BlipLocal
from src.alttext.descengine.replicateapi import ReplicateAPI
from src.alttext.ocrengine.tesseract import Tesseract
from src.alttext.langengine.privategpt import PrivateGPT
from src.alttext.langengine.openaiapi import OpenAIAPI
import keys
# HTML BOOK FILEPATHS
HTML_BIRD = "../books/pg30221-h/pg30221-images.html"
HTML_HUNTING = "../books/pg37122-h/pg37122-images.html"
HTML_MECHANIC = "../books/pg71856-h/pg71856-images.html"
HTML_INFINITY = "../books/pg71859-h/pg71859-images.html"
# EPUB BOOK FILEPATHS
EPUB1 = "../books/pg71856-images-3.epub"
EPUB2 = "../books/pg71908-images-3.epub"
EPUB3 = "../books/seuss.epub"
HOST1 = "http://127.0.0.1:8001"
def testHTML():
print("TESTING HTML")
alt: alttext.AltTextHTML = alttext.AltTextHTML(
# BlipLocal("C:/Users/dacru/Desktop/ALT/image-captioning"),
ReplicateAPI(keys.ReplicateEricKey()),
Tesseract(),
# PrivateGPT(HOST1),
OpenAIAPI(keys.OpenAIKey(), "gpt-3.5-turbo"),
)
alt.parseFile(HTML_HUNTING)
imgs = alt.getAllImgs()
src = imgs[7].attrs["src"]
print(src)
print(alt.genAltText(src))
# desc = alt.genDesc(alt.getImgData(src), src)
# print(desc)
# associations = alt.genAltAssociations(imgs)
# print(associations)
if __name__ == "__main__":
testHTML()