# TODO: Add the VLM backend and integrate its calls into the Framework class.
from framework import Framework
import base64
from IPython.display import Image, display
def _show_screenshot(fw):
    """Capture a screenshot through *fw* and render it inline.

    Args:
        fw: The started ``Framework`` instance to capture from.

    Returns:
        The response object returned by ``fw.screenshot()``. Its JSON
        payload is read for a ``base64_image`` entry, which is
        base64-decoded and passed to IPython's ``Image`` for display.
    """
    response = fw.screenshot()
    display(Image(data=base64.b64decode(response.json()['base64_image'])))
    return response


# Demo session: start the framework, move the mouse, click, and show a
# screenshot after each action. The "#..." lines without a space are the
# outputs recorded from a previous run, kept for reference.
framework = Framework()
framework.start()
#Waiting for the container to be ready...
#Container started successfully with ID: ad9a149907197a70c5430255f870e3367b56777e549f4d9d6187eb17f0e94c3a
try:
    framework.mouse_move(coordinate=[800,800])
    #<Response [200]>
    screenshot = _show_screenshot(framework)
    framework.left_click()
    #<Response [200]>
    screenshot = _show_screenshot(framework)
finally:
    # Always stop the framework, even if a step above raised, so the
    # started container is not left running.
    framework.stop()
    #Container with ID: ad9a149907197a70c5430255f870e3367b56777e549f4d9d6187eb17f0e94c3a has been stopped