You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
[Display(Name="None",Description="Free text prompt without a predefined task.")]
27
28
NONE,
29
+
30
+
[Display(Name="OCR",Description="Reads all the visible text in an image.")]
28
31
OCR,
32
+
33
+
[Display(Name="OCR with Region",Description="Reads text in an image and also gives the region where each piece of text is found.")]
29
34
OCR_WITH_REGION,
35
+
36
+
[Display(Name="Caption",Description="Generates a short description of the overall image.")]
30
37
CAPTION,
38
+
39
+
[Display(Name="Detailed Caption",Description="Produces a richer description of the image with more detail than a normal caption.")]
31
40
DETAILED_CAPTION,
41
+
42
+
[Display(Name="More Detailed Caption",Description="Gives a very thorough and verbose description of the image.")]
32
43
MORE_DETAILED_CAPTION,
44
+
45
+
[Display(Name="Object Detection",Description="Identifies and localizes objects in the image with bounding boxes.")]
33
46
OD,
47
+
48
+
[Display(Name="Dense Region Caption",Description="Splits the image into many regions and generates a caption for each region.")]
34
49
DENSE_REGION_CAPTION,
50
+
51
+
[Display(Name="Caption to Phrase Grounding",Description="Finds the specific region(s) in the image that correspond to a given phrase in a caption.")]
35
52
CAPTION_TO_PHRASE_GROUNDING,
53
+
54
+
[Display(Name="Referring Expression Segmentation",Description="Given a phrase (e.g., 'the red car'), segments out that exact object region at the pixel level.")]
36
55
REFERRING_EXPRESSION_SEGMENTATION,
56
+
57
+
[Display(Name="Region to Segmentation",Description="Converts a region (bounding box) into a precise pixel-level segmentation mask.")]
37
58
REGION_TO_SEGMENTATION,
59
+
60
+
[Display(Name="Open Vocabulary Detection",Description="Detects objects of arbitrary categories, even ones not seen during training.")]
38
61
OPEN_VOCABULARY_DETECTION,
62
+
63
+
[Display(Name="Region to Category",Description="Assigns a category label (e.g., 'cat', 'chair') to a given region.")]
39
64
REGION_TO_CATEGORY,
65
+
66
+
[Display(Name="Region to Description",Description="Generates a natural-language description for a given region.")]
40
67
REGION_TO_DESCRIPTION,
68
+
69
+
[Display(Name="Region to OCR",Description="Extracts text only from within a specified region.")]
41
70
REGION_TO_OCR,
71
+
72
+
[Display(Name="Region Proposal",Description="Suggests candidate regions of interest in the image (without labeling them).")]
0 commit comments