RoboPoint is a specialized multimodal model for robotic perception and understanding. With InferX, you can run RoboPoint on any device using the same API - perfect for robotics applications across different hardware platforms.
# Minimal RoboPoint example: load an image, run inference with a text
# instruction, and print the keypoints found in the result.
from inferx.models.robopoint import robopoint
import cv2

# Initialize the model
model = robopoint()

# Load an image
image_path = "path/to/your/image.jpg"
image = cv2.imread(image_path)
# cv2.imread does not raise on a missing or unreadable file; it returns None.
# Fail here with a clear message instead of passing None into the model.
if image is None:
    raise FileNotFoundError(f"Could not read image: {image_path}")

# Run inference with text instruction
results = model.inference(
    image=image,
    text_instruction="Find grasping points on the cup",
)

# Process results: this example reads a 'keypoints' list from the result, where
# each entry is indexed by 'x', 'y' and 'confidence'.
keypoints = results['keypoints']
print(f"Detected keypoints: {len(keypoints)}")
for i, keypoint in enumerate(keypoints):
    print(f"Keypoint {i}: ({keypoint['x']}, {keypoint['y']}) - confidence: {keypoint['confidence']}")