# Class index -> label name, used to bucket detections (confirmed by user).
CLASSES = {
    0: "body",
    1: "face",
    2: "frame",
    3: "text",
}

def get_yolo_predictions(yolo_model, img_path: str, device: str = 'cuda') -> dict:
    """Run ``yolo_model`` on one image and group detected boxes by class name.

    Args:
        yolo_model: Object exposing ``predict(source=..., device=...)`` whose
            first result has a ``boxes`` attribute carrying ``cls`` and
            ``xyxy`` (presumably an Ultralytics YOLO model -- confirm against
            the caller).
        img_path: Forwarded to ``predict`` as ``source``.
        device: Forwarded to ``predict`` as ``device``. Defaults to ``'cuda'``,
            the value that was previously hard-coded, so existing callers are
            unaffected; pass e.g. ``'cpu'`` on hosts without a GPU.

    Returns:
        A dict with one key per name in ``CLASSES``. Each value is a list of
        ``[x1, y1, x2, y2]`` boxes whose coordinates were truncated with
        ``int``. Classes without detections map to an empty list.

    Raises:
        KeyError: If the model reports a class id that is not in ``CLASSES``.
    """
    # Derive the buckets from CLASSES so the two can never drift apart.
    dets = {name: [] for name in CLASSES.values()}

    results = yolo_model.predict(source=img_path, device=device)
    if not results:
        return dets

    boxes = results[0].boxes
    if boxes is None:
        return dets

    # One bulk conversion per attribute instead of an ``int()`` call on every
    # individual tensor element (which is costly if these are GPU tensors).
    class_ids = boxes.cls.tolist()
    corners = boxes.xyxy.tolist()
    for class_id, xyxy in zip(class_ids, corners):
        dets[CLASSES[int(class_id)]].append([int(v) for v in xyxy])
    return dets