File size: 7,014 Bytes
233cefb
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
import 'dart:convert';
import 'package:http/http.dart' as http;

/// Represents the availability status of a model for a specific provider.
///
/// Instances are immutable value holders; [fromJson] builds one from a single
/// provider entry of a decoded JSON response.
class ModelProviderAvailability {
  /// Provider-side identifier taken from the entry's `providerId` field, or
  /// the entry's key when that field is absent.
  final String providerId;

  /// Availability status, e.g. `'live'` or `'staging'`; `'unknown'` when the
  /// entry carried no usable value.
  final String status;

  /// Task the provider serves the model for, e.g. `'conversational'`;
  /// `'unknown'` when the entry carried no usable value.
  final String task;

  /// Our internal provider ID, or `null` when no mapping was attached.
  final String? mappedLLMProviderId;

  const ModelProviderAvailability({
    required this.providerId,
    required this.status,
    required this.task,
    this.mappedLLMProviderId,
  });

  /// Whether [status] is exactly `'live'`.
  bool get isLive => status == 'live';

  /// Builds an instance from one provider entry.
  ///
  /// [hfProviderId] is the key the entry was stored under and doubles as the
  /// fallback for [providerId]. [json] is the entry's decoded body.
  ///
  /// Missing, `null`, or non-string values fall back to their defaults
  /// instead of raising a type error, so one malformed field cannot abort the
  /// parsing of an otherwise usable response. [mappedLLMProviderId] is never
  /// set here.
  factory ModelProviderAvailability.fromJson(
    String hfProviderId,
    Map<String, dynamic> json,
  ) {
    // Reads `key` as a string, substituting `fallback` for anything else.
    String stringOr(String key, String fallback) {
      final value = json[key];
      return value is String ? value : fallback;
    }

    return ModelProviderAvailability(
      providerId: stringOr('providerId', hfProviderId),
      status: stringOr('status', 'unknown'),
      task: stringOr('task', 'unknown'),
    );
  }
}

/// A cached snapshot of the provider availability recorded for one model.
class ModelAvailabilityCache {
  const ModelAvailabilityCache({
    required this.modelId,
    required this.providers,
    required this.lastUpdated,
  });

  /// ID of the model this snapshot describes.
  final String modelId;

  /// Every provider entry held for the model, regardless of status.
  final List<ModelProviderAvailability> providers;

  /// Timestamp the age of this snapshot is measured from.
  final DateTime lastUpdated;

  /// Whether the snapshot has outlived the 30-second cache window.
  ///
  /// The age is compared in whole seconds, so the snapshot counts as expired
  /// once at least 31 seconds have passed since [lastUpdated].
  bool get isExpired => DateTime.now().difference(lastUpdated).inSeconds > 30;

  /// The entries of [providers] that are live, collected into a new list.
  List<ModelProviderAvailability> get liveProviders => [
        for (final provider in providers)
          if (provider.isLive) provider,
      ];
}

/// Service for querying and caching model availability from the Hugging Face
/// API.
///
/// Fetched results are kept in an in-memory map keyed by model ID. The
/// synchronous lookups ([getCompatibleProviders], [isProviderCompatible],
/// [getProviderSpecificModelName]) only read that map; they never trigger a
/// fetch and do not check whether the entry has expired.
class ModelAvailabilityService {
  static const String _baseUrl = 'https://huggingface.co/api/models';

  /// Cache for model availability data, keyed by model ID.
  final Map<String, ModelAvailabilityCache> _cache = {};

  /// Mapping from HF provider IDs to our internal LLM provider IDs.
  static const Map<String, String> _providerMapping = {
    'cerebras': 'cerebras',
    'cohere': 'cohere',
    'fal-ai': 'fal-ai',
    'featherless': 'featherless',
    'fireworks': 'fireworks',
    'groq': 'groq',
    'hf-inference': 'hf-inference',
    'hyperbolic': 'hyperbolic',
    'nebius': 'nebius',
    'novita': 'novita',
    'nscale': 'nscale',
    'replicate': 'replicate',
    'sambanova': 'sambanova',
    'together': 'together',
  };

  /// Returns the availability of [modelId], preferring a fresh cache entry.
  ///
  /// When the cache entry is missing or expired the API is queried and the
  /// result stored. If that query fails and an expired entry exists, the
  /// expired entry is returned instead; with no entry at all the failure is
  /// rethrown (a [ModelAvailabilityException]).
  Future<ModelAvailabilityCache?> getModelAvailability(String modelId) async {
    final cached = _cache[modelId];
    if (cached != null && !cached.isExpired) {
      return cached;
    }

    try {
      final availability = await _fetchModelAvailability(modelId);
      if (availability != null) {
        _cache[modelId] = availability;
      }
      return availability;
    } catch (e) {
      // Stale data beats no data: serve the expired entry when one exists.
      if (cached != null) {
        return cached;
      }
      rethrow;
    }
  }

  /// Fetches the availability of [modelId] from the Hugging Face API.
  ///
  /// A 404 response yields an empty provider list rather than an error.
  /// Throws [ModelAvailabilityException] for any other non-200 status, for a
  /// body that is not a JSON object, and for any failure while performing
  /// the request.
  Future<ModelAvailabilityCache?> _fetchModelAvailability(
    String modelId,
  ) async {
    // Encode each path segment on its own: the `/` between owner and model
    // name must survive, but characters such as `?` or `#` must not be able
    // to reshape the request URL.
    final encodedId = modelId.split('/').map(Uri.encodeComponent).join('/');
    final url = '$_baseUrl/$encodedId?expand[]=inferenceProviderMapping';

    try {
      final response = await http.get(
        Uri.parse(url),
        headers: {'Accept': 'application/json', 'User-Agent': '#tikslop-App/1.0'},
      );

      if (response.statusCode == 200) {
        return _parseModelAvailability(
          modelId,
          _decodeJsonObject(response.body),
        );
      } else if (response.statusCode == 404) {
        // Model not found, return empty availability
        return ModelAvailabilityCache(
          modelId: modelId,
          providers: [],
          lastUpdated: DateTime.now(),
        );
      } else {
        throw ModelAvailabilityException(
          'Failed to fetch model availability: HTTP ${response.statusCode}',
        );
      }
    } on ModelAvailabilityException {
      rethrow;
    } catch (e) {
      throw ModelAvailabilityException('Network error: $e');
    }
  }

  /// Decodes [body] and returns it as a JSON object.
  ///
  /// Throws [ModelAvailabilityException] when [body] is not valid JSON or its
  /// top-level value is not an object, so payload problems are not reported
  /// as network errors.
  static Map<String, dynamic> _decodeJsonObject(String body) {
    try {
      final decoded = json.decode(body);
      if (decoded is Map<String, dynamic>) {
        return decoded;
      }
    } on FormatException catch (e) {
      throw ModelAvailabilityException(
        'Invalid model availability response: ${e.message}',
      );
    }
    throw ModelAvailabilityException(
      'Invalid model availability response: expected a JSON object',
    );
  }

  /// Parses the API response [data] into a [ModelAvailabilityCache].
  ///
  /// Reads `inferenceProviderMapping` either as an object keyed by provider
  /// ID or as a list of objects that each carry a string `provider` field.
  /// Entries of any other shape are skipped instead of failing the whole
  /// parse. A missing mapping produces an empty provider list.
  ModelAvailabilityCache _parseModelAvailability(
    String modelId,
    Map<String, dynamic> data,
  ) {
    final providers = <ModelProviderAvailability>[];

    // Converts one entry and appends it, attaching our internal provider ID
    // when the HF provider ID is a known one.
    void addProvider(String hfProviderId, Object? providerData) {
      if (providerData is! Map<String, dynamic>) {
        return;
      }

      final availability = ModelProviderAvailability.fromJson(
        hfProviderId,
        providerData,
      );

      final mappedProviderId = _providerMapping[hfProviderId];
      if (mappedProviderId != null) {
        providers.add(
          ModelProviderAvailability(
            providerId: availability.providerId,
            status: availability.status,
            task: availability.task,
            mappedLLMProviderId: mappedProviderId,
          ),
        );
      } else {
        // Keep unmapped providers for potential future use
        providers.add(availability);
      }
    }

    final inferenceMapping = data['inferenceProviderMapping'];
    if (inferenceMapping is Map<String, dynamic>) {
      for (final entry in inferenceMapping.entries) {
        addProvider(entry.key, entry.value);
      }
    } else if (inferenceMapping is List) {
      // NOTE(review): the list form (objects with a `provider` field) is
      // believed to be an alternative shape of this API field — confirm
      // against the current Hub API response.
      for (final item in inferenceMapping) {
        if (item is Map<String, dynamic>) {
          final hfProviderId = item['provider'];
          if (hfProviderId is String) {
            addProvider(hfProviderId, item);
          }
        }
      }
    }

    return ModelAvailabilityCache(
      modelId: modelId,
      providers: providers,
      lastUpdated: DateTime.now(),
    );
  }

  /// Returns the internal IDs of the live, mapped providers cached for
  /// [modelId].
  ///
  /// Returns an empty list when nothing is cached for [modelId].
  List<String> getCompatibleProviders(String modelId) {
    final cached = _cache[modelId];
    if (cached == null) {
      return [];
    }

    return cached.liveProviders
        .map((p) => p.mappedLLMProviderId)
        .whereType<String>()
        .toList();
  }

  /// Whether [llmProviderId] is among the compatible providers cached for
  /// [modelId].
  bool isProviderCompatible(String modelId, String llmProviderId) {
    return getCompatibleProviders(modelId).contains(llmProviderId);
  }

  /// Returns the provider-side ID recorded for [modelId] on the live provider
  /// mapped to [llmProviderId].
  ///
  /// Returns `null` when nothing is cached for [modelId] or no live provider
  /// maps to [llmProviderId].
  String? getProviderSpecificModelName(String modelId, String llmProviderId) {
    final cached = _cache[modelId];
    if (cached == null) {
      return null;
    }

    final providerAvailability = cached.liveProviders
        .where((p) => p.mappedLLMProviderId == llmProviderId)
        .firstOrNull;

    return providerAvailability?.providerId;
  }

  /// Removes the cache entry for [modelId], if any.
  void clearCache(String modelId) {
    _cache.remove(modelId);
  }

  /// Removes every cache entry.
  void clearAllCache() {
    _cache.clear();
  }

  /// Returns, for debugging, each cached model ID mapped to whether its entry
  /// is still fresh (`true`) or expired (`false`).
  Map<String, bool> getCacheStatus() {
    return {
      for (final entry in _cache.entries) entry.key: !entry.value.isExpired,
    };
  }
}

/// Signals that a model availability operation could not be completed.
class ModelAvailabilityException implements Exception {
  /// Creates the exception with a description of what went wrong.
  ModelAvailabilityException(this.message);

  /// Description of the failure.
  final String message;

  /// Returns [message] prefixed with the exception's class name.
  @override
  String toString() {
    return 'ModelAvailabilityException: $message';
  }
}