import sys sys.path.append("../") import src.alttext.alttext as alttext from src.alttext.descengine.bliplocal import BlipLocal from src.alttext.descengine.replicateapi import ReplicateAPI from src.alttext.ocrengine.tesseract import Tesseract from src.alttext.langengine.privategpt import PrivateGPT from src.alttext.langengine.openaiapi import OpenAIAPI import keys # HTML BOOK FILEPATHS HTML_BIRD = "../books/pg30221-h/pg30221-images.html" HTML_HUNTING = "../books/pg37122-h/pg37122-images.html" HTML_MECHANIC = "../books/pg71856-h/pg71856-images.html" HTML_INFINITY = "../books/pg71859-h/pg71859-images.html" # EPUB BOOK FILEPATHS EPUB1 = "../books/pg71856-images-3.epub" EPUB2 = "../books/pg71908-images-3.epub" EPUB3 = "../books/seuss.epub" HOST1 = "http://127.0.0.1:8001" def testHTML(): print("TESTING HTML") alt: alttext.AltTextHTML = alttext.AltTextHTML( # BlipLocal("C:/Users/dacru/Desktop/ALT/image-captioning"), ReplicateAPI(keys.ReplicateEricKey()), Tesseract(), # PrivateGPT(HOST1), OpenAIAPI(keys.OpenAIKey(), "gpt-3.5-turbo"), ) alt.parseFile(HTML_HUNTING) imgs = alt.getAllImgs() src = imgs[7].attrs["src"] print(src) print(alt.genAltText(src)) # desc = alt.genDesc(alt.getImgData(src), src) # print(desc) # associations = alt.genAltAssociations(imgs) # print(associations) if __name__ == "__main__": testHTML()