File size: 1,763 Bytes
5d15f06
 
 
 
3b99a8a
 
1858b2a
 
5d15f06
9c79daa
5d15f06
 
 
3b99a8a
 
1858b2a
 
 
9c79daa
 
5d15f06
 
 
3b99a8a
 
1858b2a
 
 
9c79daa
5d15f06
 
 
 
1858b2a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5d15f06
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
# Display names of the supported tasks. Each string is used verbatim as a key
# of TASKS and as a member of the *_TASK_NAMES lists defined further down.
OBJECT_DETECTION_TASK_NAME = "Object Detection"
CAPTION_TASK_NAME = "Caption"
DETAILED_CAPTION_TASK_NAME = "Detailed Caption"
MORE_DETAILED_CAPTION_TASK_NAME = "More Detailed Caption"
OCR_TASK_NAME = "OCR"
OCR_WITH_REGION_TASK_NAME = "OCR with Region"
REGION_TO_CATEGORY_TASK_NAME = "Region to Category"
REGION_TO_DESCRIPTION_TASK_NAME = "Region to Description"

# Maps every task display name to its angle-bracketed token string.
# NOTE(review): the tokens look like model prompt tags -- confirm with the caller.
# The insertion order is significant: TASK_NAMES below is built from it.
TASKS = {
    OBJECT_DETECTION_TASK_NAME: "<OD>",
    CAPTION_TASK_NAME: "<CAPTION>",
    DETAILED_CAPTION_TASK_NAME: "<DETAILED_CAPTION>",
    MORE_DETAILED_CAPTION_TASK_NAME: "<MORE_DETAILED_CAPTION>",
    OCR_TASK_NAME: "<OCR>",
    OCR_WITH_REGION_TASK_NAME: "<OCR_WITH_REGION>",
    REGION_TO_CATEGORY_TASK_NAME: "<REGION_TO_CATEGORY>",
    REGION_TO_DESCRIPTION_TASK_NAME: "<REGION_TO_DESCRIPTION>",
}

# Every task display name, in the same order as the keys of TASKS.
TASK_NAMES = list(TASKS)

# The three caption variants, from least to most detailed by name.
CAPTION_TASK_NAMES = [
    CAPTION_TASK_NAME,
    DETAILED_CAPTION_TASK_NAME,
    MORE_DETAILED_CAPTION_TASK_NAME,
]

# NOTE(review): the four groupings below presumably select which input/output
# widgets a task uses (plain image vs. image prompter, image vs. textbox) --
# verify against the code that consumes them.

# Object detection, all caption variants, and both OCR tasks.
IMAGE_INPUT_TASK_NAMES = [
    OBJECT_DETECTION_TASK_NAME,
    *CAPTION_TASK_NAMES,
    OCR_TASK_NAME,
    OCR_WITH_REGION_TASK_NAME,
]

# The two region-based tasks.
IMAGE_PROMPTER_INPUT_TASK_NAMES = [
    REGION_TO_CATEGORY_TASK_NAME,
    REGION_TO_DESCRIPTION_TASK_NAME,
]

# Object detection, OCR with region, and the two region-based tasks.
IMAGE_OUTPUT_TASK_NAMES = [
    OBJECT_DETECTION_TASK_NAME,
    OCR_WITH_REGION_TASK_NAME,
    REGION_TO_CATEGORY_TASK_NAME,
    REGION_TO_DESCRIPTION_TASK_NAME,
]

# All caption variants followed by plain OCR (a new list, not an alias of
# CAPTION_TASK_NAMES).
TEXTBOX_OUTPUT_TASK_NAMES = [*CAPTION_TASK_NAMES, OCR_TASK_NAME]