ppuva1 commited on
Commit
b0d0803
·
verified ·
1 Parent(s): d975336

Add BERTopic model

Browse files
Files changed (2) hide show
  1. topic_embeddings.safetensors +2 -2
  2. topics.json +258 -160
topic_embeddings.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de587e014d6a0af6f1f676efdb47fa5bd26b8d8fed32b5c72dfe32dba295d284
3
- size 4696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50a95c827a65bb016dbfc7b565cb2ea404f65ee6df8fe2400c63893073c94acc
3
+ size 7768
topics.json CHANGED
@@ -2,240 +2,299 @@
2
  "topic_representations": {
3
  "-1": [
4
  [
5
- "charge",
6
- 0.1437641778909261
7
  ],
8
  [
9
- "on",
10
- 0.1178154768085835
11
  ],
12
  [
13
- "account",
14
- 0.11021919978363973
15
  ],
16
  [
17
- "seeing",
18
- 0.1022161186535828
19
  ],
20
  [
21
- "random",
22
- 0.1022161186535828
23
  ],
24
  [
25
- "saw",
26
- 0.1022161186535828
27
  ],
28
  [
29
- "my",
30
- 0.0984618790345695
31
  ],
32
  [
33
- "buy",
34
- 0.08782214790690118
35
  ],
36
  [
37
- "charged",
38
- 0.08782214790690118
39
  ],
40
  [
41
- "im",
42
- 0.0826643998377298
43
  ]
44
  ],
45
  "0": [
 
 
 
 
 
 
 
 
46
  [
47
  "my",
48
- 0.10390739366309902
 
 
 
 
 
 
 
 
 
 
 
 
49
  ],
50
  [
51
  "to",
52
- 0.09071191064477435
53
  ],
54
  [
55
- "klarna",
56
- 0.08118481702761375
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  ],
58
  [
59
  "the",
60
- 0.06553510864541155
61
  ],
62
  [
63
- "it",
64
- 0.058823167261863776
65
  ],
66
  [
67
- "and",
68
- 0.05797918596010623
69
  ],
70
  [
71
  "for",
72
- 0.04867142710037787
73
  ],
74
  [
75
- "email",
76
- 0.04547149587226583
77
  ],
78
  [
79
- "but",
80
- 0.04540059233774568
 
 
 
 
81
  ],
82
  [
83
- "in",
84
- 0.04494803747556551
 
 
 
 
85
  ]
86
  ],
87
- "1": [
88
  [
89
- "refund",
90
- 0.11480022821235052
 
 
 
 
91
  ],
92
  [
93
  "my",
94
- 0.08942725570982173
95
  ],
96
  [
97
- "nike",
98
- 0.08905467107379061
99
  ],
100
  [
101
- "for",
102
- 0.08460308243237606
103
  ],
104
  [
105
- "store",
106
- 0.07534184980024404
107
  ],
108
  [
109
- "returned",
110
- 0.07387449643163027
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
111
  ],
112
  [
113
  "to",
114
- 0.07041279581631162
115
  ],
116
  [
117
- "credit",
118
- 0.06273866511558329
119
  ],
120
  [
121
- "week",
122
- 0.05911540552381123
123
  ],
124
  [
125
- "but",
126
- 0.05610871184366852
 
 
 
 
 
 
 
 
 
 
 
 
127
  ]
128
  ]
129
  },
130
  "topics": [
 
 
 
 
 
 
131
  0,
132
  0,
 
 
 
 
 
133
  0,
 
 
 
 
 
134
  0,
 
 
135
  0,
 
136
  0,
137
  1,
 
138
  1,
139
  0,
140
  0,
141
  0,
142
- 0,
143
- 0,
 
144
  1,
145
  0,
146
  0,
147
  0,
 
 
 
148
  -1,
149
  0,
150
- 1,
151
  0,
152
  0,
 
 
153
  1,
 
154
  0,
 
 
 
 
 
155
  0,
156
  0,
157
  0,
158
  0,
159
- 1,
160
- 1,
161
- 1,
162
- 0,
163
  0,
 
164
  0,
165
  0,
166
- 1,
167
- 1,
168
- 1,
169
  0,
170
  0,
171
  0,
172
- 0,
173
- 1,
174
- 1,
175
  1,
176
  0,
177
  0,
178
  0,
179
  0,
180
- 1,
181
- 0,
182
  0,
183
  0,
184
  0,
185
  0,
186
- 1,
187
- 1,
188
- 1,
189
- 1,
190
- 1,
191
- -1,
192
- 1,
193
- 1,
194
- 1,
195
- 1,
196
  0,
197
  0,
198
- 1,
199
- 1,
200
- 1,
201
- 1,
202
- 1,
203
- 1,
204
- 1,
205
- 1,
206
- 1,
207
- 1,
208
- 1,
209
- 1,
210
- 1,
211
- 1,
212
- 1,
213
- 1,
214
- 1,
215
- 1,
216
- 1,
217
- 1,
218
- 1,
219
- 1,
220
- 1,
221
- 1,
222
- 1,
223
- 1,
224
- 1,
225
- 1,
226
- 1,
227
- 1,
228
- 1,
229
- 1,
230
  0,
231
  0,
232
  0,
233
  0,
234
- -1,
235
  0,
236
- 1,
237
  0,
238
- 1,
239
  0,
240
  0,
241
  0,
@@ -246,94 +305,121 @@
246
  0,
247
  0,
248
  0,
249
- 1,
250
  0,
251
  0,
252
  0,
253
  0,
254
  0,
255
  0,
 
256
  1,
257
- 0,
258
  1,
259
- 0,
 
260
  1,
261
  0,
 
262
  0,
263
  1,
264
- 0,
265
- 0,
266
  1,
267
  1,
268
- 0,
 
269
  1,
 
 
270
  0,
271
  1,
 
 
 
 
 
272
  0,
 
273
  0,
 
274
  0,
 
275
  -1,
276
  0,
277
  1,
 
278
  0,
279
  0,
280
- 0,
281
- 0,
282
- 0,
283
  0,
284
  1,
285
  0,
286
- 0,
287
- 0,
288
- 0,
289
- 0,
290
  1,
291
- 0,
292
- 0,
293
  -1,
294
  1,
295
  0,
 
296
  1,
297
  1,
 
298
  1,
299
- 0,
300
- 0,
301
- 0,
302
- 0,
303
- 0,
304
- 0,
305
- 0,
306
- 0,
307
- 0,
308
- 0,
309
- 0,
310
- 0,
311
- 0,
312
- 0,
313
- 0,
314
- 0,
315
- 0,
316
- 0,
317
- 0,
318
- 0,
319
- 0,
320
- 0,
321
- 0,
322
- 0,
323
  0,
324
  1,
 
 
 
 
325
  0,
326
  -1,
 
 
327
  0,
 
328
  0,
329
  0,
330
  0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
331
  -1
332
  ],
333
  "topic_sizes": {
334
- "0": 119,
335
- "1": 75,
336
- "-1": 7
 
 
337
  },
338
  "topic_mapper": [
339
  [
@@ -350,12 +436,24 @@
350
  1,
351
  1,
352
  1
 
 
 
 
 
 
 
 
 
 
353
  ]
354
  ],
355
  "topic_labels": {
356
- "-1": "-1_charge_on_account_seeing",
357
- "0": "0_my_to_klarna_the",
358
- "1": "1_refund_my_nike_for"
 
 
359
  },
360
  "custom_labels": null,
361
  "_outliers": 1,
 
2
  "topic_representations": {
3
  "-1": [
4
  [
5
+ "my",
6
+ 0.0770687485801542
7
  ],
8
  [
9
+ "to",
10
+ 0.06417179022150182
11
  ],
12
  [
13
+ "and",
14
+ 0.05869595770002569
15
  ],
16
  [
17
+ "on",
18
+ 0.05448336727588492
19
  ],
20
  [
21
+ "out",
22
+ 0.05383918807100145
23
  ],
24
  [
25
+ "account",
26
+ 0.05050500504995713
27
  ],
28
  [
29
+ "help",
30
+ 0.04832176586666326
31
  ],
32
  [
33
+ "now",
34
+ 0.04405604868058506
35
  ],
36
  [
37
+ "card",
38
+ 0.04318695320025447
39
  ],
40
  [
41
+ "for",
42
+ 0.04289496600548463
43
  ]
44
  ],
45
  "0": [
46
+ [
47
+ "refund",
48
+ 0.09708432581084771
49
+ ],
50
+ [
51
+ "nike",
52
+ 0.07503725849254604
53
+ ],
54
  [
55
  "my",
56
+ 0.07245116415320181
57
+ ],
58
+ [
59
+ "for",
60
+ 0.07154419223998229
61
+ ],
62
+ [
63
+ "store",
64
+ 0.06376824305420041
65
+ ],
66
+ [
67
+ "returned",
68
+ 0.06267539937266918
69
  ],
70
  [
71
  "to",
72
+ 0.05811061688767775
73
  ],
74
  [
75
+ "credit",
76
+ 0.05357265743698659
77
+ ],
78
+ [
79
+ "week",
80
+ 0.05041027049833845
81
+ ],
82
+ [
83
+ "but",
84
+ 0.04973139930114579
85
+ ]
86
+ ],
87
+ "1": [
88
+ [
89
+ "my",
90
+ 0.08515420676452827
91
  ],
92
  [
93
  "the",
94
+ 0.07187645306567553
95
  ],
96
  [
97
+ "payment",
98
+ 0.06526750070113646
99
  ],
100
  [
101
+ "klarna",
102
+ 0.06525687041828662
103
  ],
104
  [
105
  "for",
106
+ 0.060504478365630956
107
  ],
108
  [
109
+ "to",
110
+ 0.054477221523321726
111
  ],
112
  [
113
+ "app",
114
+ 0.05077461050592647
115
+ ],
116
+ [
117
+ "balance",
118
+ 0.05066940490140783
119
  ],
120
  [
121
+ "it",
122
+ 0.0505896314940509
123
+ ],
124
+ [
125
+ "pay",
126
+ 0.04884020967943698
127
  ]
128
  ],
129
+ "2": [
130
  [
131
+ "email",
132
+ 0.09407229596102178
133
+ ],
134
+ [
135
+ "to",
136
+ 0.08522763583930289
137
  ],
138
  [
139
  "my",
140
+ 0.07951468632851966
141
  ],
142
  [
143
+ "account",
144
+ 0.06707654817798166
145
  ],
146
  [
147
+ "the",
148
+ 0.06594700723933207
149
  ],
150
  [
151
+ "im",
152
+ 0.06001585889608886
153
  ],
154
  [
155
+ "and",
156
+ 0.05680937762227116
157
+ ],
158
+ [
159
+ "klarna",
160
+ 0.05641926608211562
161
+ ],
162
+ [
163
+ "cant",
164
+ 0.05314565614406856
165
+ ],
166
+ [
167
+ "log",
168
+ 0.05141755695742052
169
+ ]
170
+ ],
171
+ "3": [
172
+ [
173
+ "card",
174
+ 0.18293415799353993
175
+ ],
176
+ [
177
+ "klarna",
178
+ 0.14610703556827512
179
+ ],
180
+ [
181
+ "it",
182
+ 0.1154887207073202
183
  ],
184
  [
185
  "to",
186
+ 0.09757753066304958
187
  ],
188
  [
189
+ "need",
190
+ 0.09325562067939731
191
  ],
192
  [
193
+ "details",
194
+ 0.09320799686749423
195
  ],
196
  [
197
+ "call",
198
+ 0.09003453379599928
199
+ ],
200
+ [
201
+ "my",
202
+ 0.08437552184979603
203
+ ],
204
+ [
205
+ "lost",
206
+ 0.08317587481576641
207
+ ],
208
+ [
209
+ "do",
210
+ 0.07679626299794899
211
  ]
212
  ]
213
  },
214
  "topics": [
215
+ 2,
216
+ -1,
217
+ 2,
218
+ 1,
219
+ 2,
220
+ -1,
221
  0,
222
  0,
223
+ -1,
224
+ 1,
225
+ 1,
226
+ 2,
227
+ 2,
228
  0,
229
+ -1,
230
+ -1,
231
+ -1,
232
+ -1,
233
+ 2,
234
  0,
235
+ 2,
236
+ 1,
237
  0,
238
+ 1,
239
  0,
240
  1,
241
+ 2,
242
  1,
243
  0,
244
  0,
245
  0,
246
+ 2,
247
+ -1,
248
+ 1,
249
  1,
250
  0,
251
  0,
252
  0,
253
+ 1,
254
+ 2,
255
+ -1,
256
  -1,
257
  0,
 
258
  0,
259
  0,
260
+ -1,
261
+ -1,
262
  1,
263
+ 2,
264
  0,
265
+ 3,
266
+ 1,
267
+ 3,
268
+ 2,
269
+ -1,
270
  0,
271
  0,
272
  0,
273
  0,
 
 
 
 
274
  0,
275
+ -1,
276
  0,
277
  0,
 
 
 
278
  0,
279
  0,
280
  0,
 
 
 
281
  1,
282
  0,
283
  0,
284
  0,
285
  0,
 
 
286
  0,
287
  0,
288
  0,
289
  0,
 
 
 
 
 
 
 
 
 
 
290
  0,
291
  0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
292
  0,
293
  0,
294
  0,
295
  0,
 
296
  0,
 
297
  0,
 
298
  0,
299
  0,
300
  0,
 
305
  0,
306
  0,
307
  0,
 
308
  0,
309
  0,
310
  0,
311
  0,
312
  0,
313
  0,
314
+ -1,
315
  1,
 
316
  1,
317
+ 3,
318
+ -1,
319
  1,
320
  0,
321
+ -1,
322
  0,
323
  1,
324
+ 2,
325
+ 2,
326
  1,
327
  1,
328
+ -1,
329
+ 3,
330
  1,
331
+ 1,
332
+ 3,
333
  0,
334
  1,
335
+ 1,
336
+ 1,
337
+ 1,
338
+ 1,
339
+ 3,
340
  0,
341
+ -1,
342
  0,
343
+ 2,
344
  0,
345
+ 2,
346
  -1,
347
  0,
348
  1,
349
+ 2,
350
  0,
351
  0,
352
+ 2,
 
 
353
  0,
354
  1,
355
  0,
 
 
 
 
356
  1,
357
+ -1,
358
+ 1,
359
  -1,
360
  1,
361
  0,
362
+ -1,
363
  1,
364
  1,
365
+ 3,
366
  1,
367
+ 2,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
368
  0,
369
  1,
370
+ 3,
371
+ 3,
372
+ 2,
373
+ 1,
374
  0,
375
  -1,
376
+ -1,
377
+ -1,
378
  0,
379
+ 2,
380
  0,
381
  0,
382
  0,
383
+ 2,
384
+ 1,
385
+ 1,
386
+ 1,
387
+ 1,
388
+ 1,
389
+ 1,
390
+ 1,
391
+ 1,
392
+ 3,
393
+ 3,
394
+ 1,
395
+ 1,
396
+ -1,
397
+ 1,
398
+ 1,
399
+ 2,
400
+ 2,
401
+ 2,
402
+ 2,
403
+ 2,
404
+ 2,
405
+ 2,
406
+ 2,
407
+ 2,
408
+ -1,
409
+ -1,
410
+ -1,
411
+ 3,
412
+ -1,
413
+ 3,
414
+ 3,
415
  -1
416
  ],
417
  "topic_sizes": {
418
+ "2": 31,
419
+ "-1": 32,
420
+ "1": 48,
421
+ "0": 76,
422
+ "3": 14
423
  },
424
  "topic_mapper": [
425
  [
 
436
  1,
437
  1,
438
  1
439
+ ],
440
+ [
441
+ 2,
442
+ 2,
443
+ 2
444
+ ],
445
+ [
446
+ 3,
447
+ 3,
448
+ 3
449
  ]
450
  ],
451
  "topic_labels": {
452
+ "-1": "-1_my_to_and_on",
453
+ "0": "0_refund_nike_my_for",
454
+ "1": "1_my_the_payment_klarna",
455
+ "2": "2_email_to_my_account",
456
+ "3": "3_card_klarna_it_to"
457
  },
458
  "custom_labels": null,
459
  "_outliers": 1,