File size: 9,785 Bytes
d5f5654
 
 
 
 
f51aacc
d5f5654
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f51aacc
d5f5654
 
 
 
 
 
f51aacc
 
 
 
 
 
 
 
 
 
d5f5654
 
 
f51aacc
d5f5654
 
f51aacc
d5f5654
f51aacc
d5f5654
 
 
 
 
f4f2229
 
 
 
d5f5654
 
 
 
 
 
 
 
 
 
 
 
f4f2229
 
 
 
 
d5f5654
 
 
 
 
 
 
 
 
 
b4d7111
f12a178
 
d5f5654
b4d7111
f4f2229
b4d7111
 
 
 
 
 
2d7ff06
 
 
 
 
 
 
 
 
d5f5654
 
 
 
 
 
 
f12a178
d5f5654
 
 
b4d7111
d5f5654
f51aacc
 
 
 
 
d5f5654
f51aacc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
d5f5654
 
 
 
 
 
 
 
e85412e
 
 
 
 
 
 
 
 
 
f4f2229
b4d7111
 
f4f2229
b4d7111
d5f5654
 
 
 
 
 
 
 
d08dd28
 
f51aacc
 
 
 
 
 
 
 
 
f12a178
d5f5654
f51aacc
d5f5654
f51aacc
d5f5654
 
f12a178
d5f5654
 
f51aacc
d5f5654
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
import gradio as gr
import json
import time
import traceback
from validation import validate_json, validate_croissant, validate_records
import requests

def process_file(file):
    """Run the validation pipeline on an uploaded file.

    The checks run in order and the pipeline stops at the first failure:
    JSON parsing, then Croissant schema validation, then records generation.

    Args:
        file: Uploaded file object; its ``name`` attribute is passed to
            ``validate_json`` as the path to read.

    Returns:
        A list of ``(check_name, passed, message)`` tuples, one per check
        that was actually executed.
    """
    outcome = []

    # Stage 1 parses the file and yields the data the later stages work on.
    ok, note, payload = validate_json(file.name)
    outcome.append(("JSON Format Validation", ok, note))

    if ok:
        # Stages 2 and 3 share the same call shape, so drive them from a table.
        later_stages = (
            ("Croissant Schema Validation", validate_croissant),
            ("Records Generation Test", validate_records),
        )
        for label, check in later_stages:
            ok, note = check(payload)
            outcome.append((label, ok, note))
            if not ok:
                # A failed stage makes the following ones meaningless.
                break

    return outcome

def create_ui():
    """Build the Gradio Blocks app for validating Croissant JSON-LD files.

    The page offers two input paths, an uploaded file or a URL, and renders
    the outcome of up to three sequential checks (JSON parsing, Croissant
    schema validation, records generation) as collapsible result panels.

    Returns:
        The configured ``gr.Blocks`` instance. The caller is responsible for
        calling ``launch()`` on it.
    """
    # Local import: only the handlers defined below need it.
    from html import escape

    def status_html(text):
        """Wrap *text* (which must already be HTML-safe) in the status container."""
        return (
            '<div class="progress-container">\n'
            f'  <div class="progress-status">{text}</div>\n'
            '</div>'
        )

    def failure(prefix, exc):
        """Return handler outputs for an error: escaped status text, hidden results."""
        # Exception text can echo the user-supplied URL or remote content, so
        # it must be escaped before being embedded in markup.
        return status_html(escape(f"{prefix}: {exc}")), gr.update(visible=False)

    def build_results_html(results):
        """Render ``(test_name, passed, message)`` tuples as collapsible panels.

        Returns a ``gr.update`` that sets the HTML and makes the component
        visible.
        """
        panels = ['<div class="validation-results">']

        for i, (test_name, passed, message) in enumerate(results):
            status_class = "status-success" if passed else "status-error"
            status_icon = "✓" if passed else "✗"

            # NOTE(review): `message` is inserted as-is because the validators
            # may return markup; confirm they never echo untrusted content.
            panels.append(f'''
                <div class="validation-step" id="step-{i}">
                    <div class="step-header" onclick="
                        var details = document.getElementById('details-{i}');
                        var arrow = document.getElementById('arrow-{i}');
                        if(details.style.display === 'none') {{
                            details.style.display = 'block';
                            arrow.classList.add('arrow-down');
                        }} else {{
                            details.style.display = 'none';
                            arrow.classList.remove('arrow-down');
                        }}">
                        <div class="step-left">
                            <div class="step-status {status_class}">{status_icon}</div>
                            <div class="step-title">{test_name}</div>
                            <div class="arrow-indicator" id="arrow-{i}">▶</div>
                        </div>
                    </div>
                    <div class="step-details" id="details-{i}" style="display: none;">
                        {message}
                    </div>
                </div>
                ''')

        panels.append('</div>')
        return gr.update(value="".join(panels), visible=True)

    def on_file_upload(file):
        """Update the status line when the file input changes; hide old results."""
        if file is None:
            label = "Ready for upload"
        else:
            label = "✅ File uploaded successfully"
        return status_html(label), gr.update(visible=False)

    def fetch_from_url(url):
        """Download JSON from *url*, validate it, and return (status, results)."""
        url = (url or "").strip()
        if not url:
            return status_html("Please enter a URL"), gr.update(visible=False)

        try:
            # Fetch JSON from URL
            response = requests.get(url, timeout=10)
            response.raise_for_status()  # Raise exception for 4XX/5XX status codes

            # Parse separately: the error raised by `Response.json()` can also
            # be a RequestException, which the outer handler would otherwise
            # report as a fetch failure instead of invalid JSON.
            try:
                json_data = response.json()
            except ValueError as e:
                return failure("❌ URL did not return valid JSON", e)

            progress_html = status_html("✅ JSON fetched successfully from URL")

            # Check 1: JSON validation (already done by parsing)
            results = [
                ("JSON Format Validation", True, "✅ The URL returned valid JSON."),
            ]

            # Check 2: Croissant validation
            croissant_valid, croissant_message = validate_croissant(json_data)
            results.append(("Croissant Schema Validation", croissant_valid, croissant_message))

            if croissant_valid:
                # Check 3: Records validation (only meaningful for a valid schema)
                records_valid, records_message = validate_records(json_data)
                results.append(("Records Generation Test", records_valid, records_message))

            return progress_html, build_results_html(results)

        except requests.exceptions.RequestException as e:
            return failure("❌ Error fetching URL", e)
        except Exception as e:
            # UI boundary: show the problem to the user instead of crashing the handler.
            return failure("❌ Unexpected error", e)

    def on_validate(file):
        """Validate the uploaded file and render the results, if a file is present."""
        if file is None:
            return gr.update(visible=False)

        # Process the file and get results
        return build_results_html(process_file(file))

    with gr.Blocks(theme=gr.themes.Soft()) as app:
        gr.Markdown("# Croissant JSON-LD Validator for NeurIPS")
        gr.Markdown("""
        Upload your Croissant JSON-LD file or enter a URL to validate if it meets the requirements for NeurIPS submission.
        The validator will check:
        1. If the file is valid JSON
        2. If it passes Croissant schema validation
        3. If records can be generated within a reasonable time
        """)

        with gr.Tabs():
            with gr.TabItem("Upload File"):
                file_input = gr.File(label="Upload Croissant JSON-LD File", file_types=[".json", ".jsonld"])

            with gr.TabItem("URL Input"):
                url_input = gr.Textbox(
                    label="Enter Croissant JSON-LD URL",
                    placeholder="https://huggingface.co/api/datasets/facebook/natural_reasoning/croissant"
                )
                fetch_btn = gr.Button("Fetch and Validate", variant="primary")

        upload_progress = gr.HTML(status_html("Ready for validation"), visible=True)

        validate_btn = gr.Button("Validate Uploaded File", variant="primary")

        # Container for validation results; hidden until a validation has run
        validation_results = gr.HTML(visible=False)

        # Define CSS for the validation UI
        gr.HTML("""
        <style>
        .gradio-container {
            max-width: 800px;
            margin: 0 auto;
        }
        .validation-step {
            margin-bottom: 15px;
            border: 1px solid #e0e0e0;
            border-radius: 8px;
            overflow: hidden;
        }
        .step-header {
            padding: 10px 15px;
            background-color: #f5f5f5;
            display: flex;
            align-items: center;
            cursor: pointer;
        }
        .step-left {
            display: flex;
            align-items: center;
            flex-grow: 1;
        }
        .step-status {
            margin-right: 10px;
            width: 24px;
            height: 24px;
            border-radius: 50%;
            display: flex;
            align-items: center;
            justify-content: center;
            font-weight: bold;
            color: white !important;
            font-size: 16px;
            text-shadow: 0px 0px 1px rgba(0,0,0,0.5);
        }
        .arrow-indicator {
            margin-left: 10px;
            font-size: 16px;
            transition: transform 0.3s ease;
        }
        .arrow-down {
            transform: rotate(90deg);
        }
        .status-success {
            background-color: #4caf50;
        }
        .status-error {
            background-color: #f44336;
        }
        .status-waiting {
            background-color: #9e9e9e;
        }
        </style>
        """)

        # Connect UI events to functions
        file_input.change(on_file_upload, inputs=file_input, outputs=[upload_progress, validation_results])
        validate_btn.click(on_validate, inputs=file_input, outputs=validation_results)
        fetch_btn.click(fetch_from_url, inputs=url_input, outputs=[upload_progress, validation_results])

        # Footer
        gr.HTML("""
        <div style="text-align: center; margin-top: 20px;">
            <p>Based on the <a href="https://github.com/mlcommons/croissant" target="_blank">Croissant format</a> from MLCommons.</p>
        </div>
        """)

    return app

# Script entry point: build the UI and launch it only when this file is run
# directly, not when it is imported as a module.
if __name__ == "__main__":
    app = create_ui()
    app.launch()