# File viewer metadata: 50 lines, 1.4 KiB, Python
import sys
|
|
|
|
sys.path.append("../")
|
|
import src.alttext.alttext as alttext
|
|
from src.alttext.descengine.bliplocal import BlipLocal
|
|
from src.alttext.descengine.replicateapi import ReplicateAPI
|
|
from src.alttext.ocrengine.tesseract import Tesseract
|
|
from src.alttext.langengine.privategpt import PrivateGPT
|
|
from src.alttext.langengine.openaiapi import OpenAIAPI
|
|
import keys
|
|
|
|
# HTML BOOK FILEPATHS
|
|
HTML_BIRD = "../books/pg30221-h/pg30221-images.html"
|
|
HTML_HUNTING = "../books/pg37122-h/pg37122-images.html"
|
|
HTML_MECHANIC = "../books/pg71856-h/pg71856-images.html"
|
|
HTML_INFINITY = "../books/pg71859-h/pg71859-images.html"
|
|
|
|
# EPUB BOOK FILEPATHS
|
|
EPUB1 = "../books/pg71856-images-3.epub"
|
|
EPUB2 = "../books/pg71908-images-3.epub"
|
|
EPUB3 = "../books/seuss.epub"
|
|
|
|
HOST1 = "http://127.0.0.1:8001"
|
|
|
|
|
|
def testHTML(img_index: int = 7) -> None:
    """Smoke-test alt-text generation for one image of the HUNTING HTML book.

    Builds an ``alttext.AltTextHTML`` from a description engine
    (``ReplicateAPI``), an OCR engine (``Tesseract``) and a language engine
    (``OpenAIAPI`` with ``"gpt-3.5-turbo"``), parses ``HTML_HUNTING``, then
    prints the ``src`` attribute of the selected image followed by the result
    of ``genAltText`` for that ``src``.

    Args:
        img_index: Position of the image to use within the sequence returned
            by ``alt.getAllImgs()``. Defaults to 7, the image this script has
            always exercised.

    Raises:
        IndexError: If the parsed book has no image at ``img_index``.
    """
    print("TESTING HTML")
    alt: alttext.AltTextHTML = alttext.AltTextHTML(
        # Alternative description engine (disabled):
        # BlipLocal("C:/Users/dacru/Desktop/ALT/image-captioning"),
        ReplicateAPI(keys.ReplicateEricKey()),
        Tesseract(),
        # Alternative language engine (disabled):
        # PrivateGPT(HOST1),
        OpenAIAPI(keys.OpenAIKey(), "gpt-3.5-turbo"),
    )

    alt.parseFile(HTML_HUNTING)
    imgs = alt.getAllImgs()
    try:
        img = imgs[img_index]
    except IndexError as err:
        # Same exception type as the bare lookup, but naming the book and index.
        raise IndexError(
            f"{HTML_HUNTING} has no image at index {img_index}"
        ) from err
    src = img.attrs["src"]
    print(src)
    print(alt.genAltText(src))

    # Other calls kept for manual experimentation:
    # desc = alt.genDesc(alt.getImgData(src), src)
    # print(desc)
    # associations = alt.genAltAssociations(imgs)
    # print(associations)
|
|
|
|
|
|
# Run the HTML smoke test only when this file is executed as a script,
# not when it is imported.
if __name__ == "__main__":
    testHTML()
|