pszemraj's picture
Add BERTopic model
2f37a66
raw
history blame
32.8 kB
{
"topic_representations": {
"-1": [
[
"no_saic_raw_sp",
0.8556114435195923
],
[
"sep_4",
0.81075119972229
],
[
"sec",
0.7599493861198425
],
[
"data",
0.7535145282745361
],
[
"image",
0.7453169822692871
],
[
"information",
0.7431399822235107
],
[
"re",
0.7418415546417236
],
[
"system",
0.740649938583374
],
[
"article",
0.7392792701721191
],
[
"as",
0.7361999154090881
]
],
"0": [
[
"lecture",
0.7621833086013794
],
[
"applications",
0.7610516548156738
],
[
"methods",
0.7550681233406067
],
[
"learning",
0.753812313079834
],
[
"topics",
0.7511876821517944
],
[
"processing",
0.7412316799163818
],
[
"students",
0.7411034107208252
],
[
"course",
0.7392420768737793
],
[
"research",
0.7388631105422974
],
[
"learn",
0.7382574081420898
]
],
"1": [
[
"cogvideo",
0.8285708427429199
],
[
"videos",
0.7789747714996338
],
[
"cogview2",
0.7652571797370911
],
[
"cog",
0.7602906227111816
],
[
"video",
0.7426279783248901
],
[
"model",
0.7371622323989868
],
[
"models",
0.7349198460578918
],
[
"pretrained",
0.7322494387626648
],
[
"images",
0.7298381924629211
],
[
"generative",
0.7297838926315308
]
],
"2": [
[
"ship",
0.7606195211410522
],
[
"rainsford",
0.7572601437568665
],
[
"hunted",
0.751890242099762
],
[
"island",
0.7502785325050354
],
[
"hunts",
0.7416767477989197
],
[
"hunt",
0.7376853227615356
],
[
"hunting",
0.7322002649307251
],
[
"sea",
0.7211506366729736
],
[
"hears",
0.7165385484695435
],
[
"he",
0.7158846855163574
]
],
"3": [
[
"films",
0.760940670967102
],
[
"dissertation",
0.7475396394729614
],
[
"film",
0.7468894124031067
],
[
"noir",
0.7389432787895203
],
[
"identity",
0.732159435749054
],
[
"trauma",
0.7161113023757935
],
[
"movements",
0.7109761834144592
],
[
"identities",
0.7109147310256958
],
[
"materiality",
0.7108149528503418
],
[
"zinnemann",
0.7104987502098083
]
],
"4": [
[
"linguistics",
0.7948346138000488
],
[
"language",
0.7632309794425964
],
[
"languages",
0.7601754665374756
],
[
"foundational",
0.7537258863449097
],
[
"systems",
0.7422805428504944
],
[
"explanation",
0.7387273907661438
],
[
"structure",
0.7380946278572083
],
[
"explanations",
0.7358152270317078
],
[
"computational",
0.7318733930587769
],
[
"questions",
0.7239676117897034
]
],
"5": [
[
"nemo",
0.8223493695259094
],
[
"dory",
0.7749705910682678
],
[
"transcript",
0.7340698838233948
],
[
"clownfish",
0.7280408143997192
],
[
"fish",
0.7232930660247803
],
[
"find",
0.721244752407074
],
[
"finding",
0.7209229469299316
],
[
"gill",
0.7187108397483826
],
[
"some",
0.7142731547355652
],
[
"turtles",
0.709677517414093
]
],
"6": [
[
"train",
0.7295479774475098
],
[
"bruno",
0.7284721732139587
],
[
"washington",
0.7216507792472839
],
[
"station",
0.7200955152511597
],
[
"tennis",
0.7148782014846802
],
[
"anthony",
0.7146422863006592
],
[
"men",
0.7142789363861084
],
[
"guy",
0.7111189961433411
],
[
"who",
0.7095263004302979
],
[
"what",
0.7079984545707703
]
],
"7": [
[
"images",
0.8006479144096375
],
[
"representations",
0.7684509754180908
],
[
"image",
0.764212965965271
],
[
"captions",
0.7594517469406128
],
[
"representation",
0.750898540019989
],
[
"models",
0.746273398399353
],
[
"manipulations",
0.7451709508895874
],
[
"model",
0.7430041432380676
],
[
"embeddings",
0.7421921491622925
],
[
"generative",
0.7397007942199707
]
],
"8": [
[
"merge",
0.767553448677063
],
[
"merging",
0.7648005485534668
],
[
"explain",
0.7347870469093323
],
[
"concept",
0.7299387454986572
],
[
"problems",
0.7189124226570129
],
[
"structure",
0.7187449932098389
],
[
"workspace",
0.7175571918487549
],
[
"linguistics",
0.7161640524864197
],
[
"objects",
0.7156375646591187
],
[
"definition",
0.7154124975204468
]
],
"9": [
[
"enhancement",
0.7681708931922913
],
[
"enhancing",
0.7659841775894165
],
[
"recordings",
0.7583848834037781
],
[
"improve",
0.7478545904159546
],
[
"waveforms",
0.747260332107544
],
[
"enhance",
0.746477484703064
],
[
"vocoding",
0.7439472079277039
],
[
"spectrogram",
0.737808346748352
],
[
"diffwave",
0.7316944599151611
],
[
"improving",
0.7316482067108154
]
],
"10": [
[
"arendelle",
0.798922061920166
],
[
"elsa",
0.777582049369812
],
[
"frozen",
0.7636111378669739
],
[
"kristoff",
0.761407732963562
],
[
"olaf",
0.7487310171127319
],
[
"snow",
0.7269754409790039
],
[
"hans",
0.7218987941741943
],
[
"anna",
0.7175288796424866
],
[
"ice",
0.7125762701034546
],
[
"sven",
0.7123910188674927
]
],
"11": [
[
"scene",
0.7549106478691101
],
[
"story",
0.7533068060874939
],
[
"script",
0.7518723011016846
],
[
"movie",
0.7438328862190247
],
[
"gillis",
0.735901951789856
],
[
"boulevard",
0.732673168182373
],
[
"some",
0.7262394428253174
],
[
"was",
0.715401828289032
],
[
"money",
0.715157151222229
],
[
"what",
0.7143906950950623
]
],
"12": [
[
"lecture",
0.7755166888237
],
[
"lemmatization",
0.7615716457366943
],
[
"nlp",
0.7565118670463562
],
[
"medical",
0.754940390586853
],
[
"techniques",
0.745952844619751
],
[
"tokenization",
0.7456807494163513
],
[
"learning",
0.7393791079521179
],
[
"preprocessing",
0.7301928997039795
],
[
"clinical",
0.7289255261421204
],
[
"normalization",
0.7277066111564636
]
],
"13": [
[
"questions",
0.7605725526809692
],
[
"topics",
0.7526620626449585
],
[
"conversation",
0.7503987550735474
],
[
"terrance",
0.7387130260467529
],
[
"talk",
0.7369388937950134
],
[
"things",
0.7316636443138123
],
[
"asking",
0.7304785251617432
],
[
"some",
0.7281580567359924
],
[
"asks",
0.7276471257209778
],
[
"jonathan",
0.7220789194107056
]
],
"14": [
[
"sniper",
0.7596232295036316
],
[
"kill",
0.7467747926712036
],
[
"fury",
0.7431679964065552
],
[
"combat",
0.7327852249145508
],
[
"narrator",
0.7320101261138916
],
[
"300",
0.727806806564331
],
[
"kills",
0.7277351021766663
],
[
"ip",
0.7257020473480225
],
[
"military",
0.7209112644195557
],
[
"armed",
0.720558226108551
]
],
"15": [
[
"images",
0.7750052213668823
],
[
"lecture",
0.7550859451293945
],
[
"ezurich",
0.7535472512245178
],
[
"pathology",
0.7511546611785889
],
[
"medical",
0.7412455081939697
],
[
"image",
0.7388397455215454
],
[
"convolutional",
0.7381254434585571
],
[
"learning",
0.7299654483795166
],
[
"techniques",
0.7295058965682983
],
[
"clinical",
0.7254665493965149
]
],
"16": [
[
"timeseries",
0.7711629867553711
],
[
"framework",
0.7490929365158081
],
[
"interpretability",
0.74543696641922
],
[
"representations",
0.7396618723869324
],
[
"next_concept",
0.7367282509803772
],
[
"interpretable",
0.7348772287368774
],
[
"predictions",
0.7275879383087158
],
[
"representation",
0.7271812558174133
],
[
"rnns",
0.7269995212554932
],
[
"method",
0.7259383797645569
]
],
"17": [
[
"prediction",
0.7627924084663391
],
[
"predictions",
0.7577962875366211
],
[
"forecasting",
0.7536972165107727
],
[
"predict",
0.7470806837081909
],
[
"markov",
0.7415806651115417
],
[
"medical",
0.7372077107429504
],
[
"model",
0.7367797493934631
],
[
"clinical",
0.7349631786346436
],
[
"datasets",
0.7328702211380005
],
[
"modeling",
0.7324564456939697
]
],
"18": [
[
"images",
0.7678451538085938
],
[
"imaging",
0.7669191360473633
],
[
"computational",
0.7625638246536255
],
[
"convolutional",
0.761376678943634
],
[
"lecture",
0.7450449466705322
],
[
"pathology",
0.744610607624054
],
[
"techniques",
0.7427186965942383
],
[
"medical",
0.740394115447998
],
[
"classification",
0.7339968085289001
],
[
"clustering",
0.7338482141494751
]
],
"19": [
[
"technology",
0.7525465488433838
],
[
"treatment",
0.7522265315055847
],
[
"methods",
0.750868558883667
],
[
"medical",
0.7508047223091125
],
[
"detection",
0.7446655631065369
],
[
"scans",
0.7435606718063354
],
[
"medicine",
0.7433589696884155
],
[
"techniques",
0.7426445484161377
],
[
"diagnosis",
0.7395122051239014
],
[
"images",
0.7294250130653381
]
],
"20": [
[
"novel",
0.7397549748420715
],
[
"translation",
0.7291005849838257
],
[
"henry",
0.727873682975769
],
[
"read",
0.7266944050788879
],
[
"learn",
0.7247153520584106
],
[
"prototype",
0.7236534357070923
],
[
"learning",
0.7218745350837708
],
[
"learns",
0.7194956541061401
],
[
"help",
0.7185222506523132
],
[
"machines",
0.7183353900909424
]
],
"21": [
[
"abridged",
0.8131064772605896
],
[
"brief",
0.775554895401001
],
[
"synopsis",
0.7743421792984009
],
[
"short",
0.7560427784919739
],
[
"citations",
0.7556378841400146
],
[
"reports",
0.7472920417785645
],
[
"footnotes",
0.732883095741272
],
[
"description",
0.7284342050552368
],
[
"events",
0.7235608100891113
],
[
"overview",
0.7230038642883301
]
],
"22": [
[
"lecture",
0.7524600028991699
],
[
"pathology",
0.7389881610870361
],
[
"medical",
0.7359194755554199
],
[
"computational",
0.7320494055747986
],
[
"patients",
0.7307963371276855
],
[
"learning",
0.7302024364471436
],
[
"autoencoders",
0.7273372411727905
],
[
"learn",
0.724185585975647
],
[
"datasets",
0.7207432985305786
],
[
"techniques",
0.7194994688034058
]
]
},
"topics": [
7,
12,
7,
0,
5,
1,
0,
2,
0,
13,
13,
18,
7,
3,
20,
18,
4,
5,
0,
1,
17,
3,
16,
4,
1,
10,
5,
4,
0,
4,
12,
13,
17,
2,
1,
0,
7,
5,
9,
6,
-1,
5,
0,
11,
9,
12,
11,
5,
10,
10,
11,
0,
4,
8,
8,
15,
12,
7,
8,
0,
0,
16,
0,
0,
0,
1,
2,
6,
13,
1,
0,
1,
12,
2,
3,
0,
13,
-1,
6,
1,
19,
5,
3,
2,
3,
0,
0,
5,
14,
11,
3,
0,
5,
10,
20,
8,
5,
7,
1,
-1,
14,
1,
2,
11,
9,
3,
1,
0,
4,
0,
0,
11,
13,
6,
2,
13,
8,
4,
-1,
4,
4,
12,
0,
-1,
6,
12,
5,
1,
-1,
6,
6,
0,
9,
2,
20,
5,
18,
8,
0,
1,
18,
16,
11,
0,
1,
7,
6,
8,
12,
11,
0,
-1,
7,
2,
2,
0,
21,
7,
0,
9,
14,
10,
14,
7,
4,
8,
5,
1,
7,
0,
1,
10,
1,
1,
0,
3,
11,
13,
8,
17,
4,
0,
0,
6,
-1,
9,
4,
0,
9,
-1,
10,
7,
1,
9,
12,
0,
2,
0,
4,
4,
13,
0,
0,
9,
0,
0,
12,
14,
4,
8,
4,
0,
0,
3,
10,
6,
0,
3,
12,
14,
0,
6,
19,
13,
4,
11,
16,
5,
8,
7,
9,
0,
2,
10,
20,
0,
2,
10,
21,
6,
21,
4,
7,
12,
4,
15,
6,
0,
2,
8,
19,
0,
6,
20,
8,
10,
14,
6,
3,
0,
7,
1,
10,
6,
-1,
-1,
1,
14,
6,
7,
2,
22,
11,
4,
4,
20,
-1,
0,
0,
6,
0,
5,
13,
0,
3,
15,
0,
3,
9,
2,
1,
1,
8,
12,
0,
14,
6,
0,
0,
10,
1,
-1,
19,
5,
7,
3,
11,
13,
1,
13,
2,
2,
10,
0,
15,
13,
19,
7,
-1,
3,
0,
7,
2,
11,
8,
11,
10,
16,
0,
12,
1,
2,
20,
12,
21,
-1,
11,
1,
0,
8,
2,
16,
13,
17,
11,
0,
21,
8,
6,
1,
7,
15,
14,
15,
5,
15,
2,
5,
18,
-1,
0,
0,
7,
1,
1,
7,
6,
9,
11,
7,
0,
10,
0,
18,
0,
3,
0,
5,
14,
9,
2,
3,
15,
5,
11,
4,
4,
7,
0,
14,
13,
13,
6,
17,
0,
12,
14,
0,
10,
6,
12,
15,
17,
7,
11,
0,
10,
12,
4,
2,
21,
20,
15,
12,
11,
4,
8,
0,
5,
10,
4,
11,
10,
11,
-1,
7,
-1,
4,
8,
5,
6,
4,
4,
14,
9,
2,
8,
11,
2,
12,
2,
2,
-1,
-1,
7,
8,
12,
8,
1,
2,
3,
7,
8,
3,
1,
6,
0,
14,
11,
8,
0,
9,
15,
13,
6,
3,
3,
2,
5,
0,
7,
-1,
7,
13,
8,
6,
8,
2,
2,
16,
9,
11,
3,
0,
5,
8,
7,
4,
12,
11,
9,
1,
7,
0,
8,
3,
12,
6,
8,
0,
9,
4,
3,
7,
4,
0,
6,
10,
3,
7,
3,
5,
0,
-1,
4,
13,
3,
8,
2,
10,
7,
4,
0,
1,
10,
14,
12,
16,
5,
9,
10,
3,
1,
3,
11,
1,
0,
0,
8,
11,
6,
14,
14,
16,
5,
14,
12,
5,
8,
4,
13,
3,
0,
20,
0,
1,
20,
2,
4,
17,
12,
5,
4,
-1,
13,
5,
3,
0,
10,
1,
9,
12,
6,
13,
19,
1,
2,
9,
0,
12,
7,
14,
5,
6,
7,
9,
-1,
4,
-1,
-1,
13,
2,
1,
4,
3,
22,
5,
10,
3,
0,
8,
6,
1,
0,
0,
0,
17,
8,
0,
1,
5,
5,
5,
6,
4,
14,
13,
12,
19,
1,
1,
5,
12,
12,
21,
3,
10,
10,
2,
2,
10,
8,
2,
10,
1,
15,
5,
2,
2,
9,
4,
13,
1,
14,
1,
6,
0,
0,
7,
0,
2,
8,
0,
10,
16,
8,
10,
12,
5,
8,
9,
10,
12,
5,
0,
15,
2,
4,
0,
1,
1,
5,
6,
3,
0,
17,
0,
13,
9,
6,
6,
4,
6,
1,
6,
9,
0,
2,
4,
5,
0,
0,
6,
3,
19,
11,
1,
8,
0,
0,
17,
0,
6,
1,
7,
7,
3,
1,
12,
2,
11,
4,
9,
0,
5,
2,
11,
11,
6,
8,
18,
18,
3,
9,
0,
14,
17,
0,
12,
3,
-1,
12,
3,
11,
-1,
12,
11,
1,
5,
10,
10,
4,
7,
7,
14,
12,
-1,
14,
5,
11,
12,
7,
0,
6,
2,
8,
14,
9,
11,
12,
9,
10,
0,
0,
0,
3,
-1,
0,
0,
4,
12,
20,
10,
14,
0,
1,
5,
0,
8,
18,
4,
2,
11,
5,
12,
7,
5,
0,
0,
9,
15,
4,
7,
3,
5,
4,
19,
-1,
0,
4,
8,
6,
11,
0,
5,
18,
0,
0,
0,
11,
5,
13,
0,
2,
13,
14,
9,
3,
5,
0,
0,
-1,
-1,
-1,
6,
-1,
0,
19,
12,
3,
12,
9,
8,
-1,
9,
18,
-1,
15,
0,
9,
9,
1,
0,
10,
5,
0,
-1,
5,
15,
7,
0,
0,
19,
3,
2,
7,
3,
11,
11,
0,
-1,
0,
11,
14,
6,
0,
0,
21,
0,
17,
3,
0,
0,
6,
3,
2,
11,
13,
8,
2,
4,
5,
12,
3,
3,
0,
13,
7,
2,
10,
7,
0,
11,
10,
2,
19,
6,
22,
4,
1,
4,
4,
12,
0,
3,
-1,
3,
19,
-1,
4,
0,
2,
13,
1,
10,
-1,
0,
11,
6,
1,
14,
7,
10,
0,
10,
12,
9,
9,
6,
6,
1,
0,
11,
1,
18,
7,
2,
4,
21,
0,
9,
-1,
7,
11,
2,
9,
0,
11,
19,
0,
8,
11,
10,
0,
0,
1,
6,
11,
3,
0,
3,
2,
0,
8,
3,
21,
10,
5,
0,
1,
0,
21,
22,
0,
17,
1,
-1,
5,
8,
15,
12,
17,
9,
2,
10,
18,
-1,
-1,
17,
12,
11,
12,
2,
-1,
8,
6,
9,
6,
18,
-1,
-1,
-1,
3,
10,
3,
2,
0,
22,
2,
17,
12,
13,
7,
11,
4,
6,
18,
7,
6,
0,
7,
12,
3,
2,
14,
3,
13,
2,
10,
14,
0,
1,
0,
20,
2,
6,
14,
3,
9,
0,
0,
3,
5,
19,
7,
8,
13,
10,
0,
1,
-1,
14,
0,
0,
13,
0,
3,
10,
8,
1,
3,
12,
7,
4,
6,
6,
14,
4,
15,
19,
0,
5,
0,
0,
15,
2,
5,
13,
13,
0,
0,
8,
11,
-1,
0,
16,
1,
10,
22,
8,
-1,
10,
5,
10,
13,
5,
9,
0,
0,
11,
5,
16,
13,
14,
11,
1,
17,
0,
9,
0,
18,
17,
0,
5,
15,
0,
17,
9,
12,
10,
-1,
7,
11,
16,
4,
12,
0,
14,
8,
1,
2,
-1,
14,
8,
10,
4,
13,
14,
11,
10,
10,
4,
10,
6,
13,
-1,
10,
7,
4,
16,
-1,
11,
6,
-1,
1,
5,
10,
13,
4,
6,
7,
0,
-1,
5,
3,
7,
0,
12,
7,
2,
10,
0,
2,
8,
0,
12,
1,
16,
7,
13,
10,
0,
5,
4,
8,
11,
0,
22,
1,
20,
0,
1,
0,
6,
7,
2,
4,
6,
3,
2,
10,
4,
8,
15,
5,
1,
0,
1,
8,
1,
0,
8,
7,
0,
3,
4,
0,
-1,
15,
17,
9,
0,
4,
12,
-1,
10,
3,
2,
8,
3,
0,
6,
9,
6,
18,
6,
4,
9,
10,
21,
8,
7,
20,
0,
0,
2,
7,
5,
14,
12,
16,
0,
11,
3,
8,
11,
13,
2,
9,
-1,
4,
6,
3,
17,
10,
0,
21,
-1,
13,
18,
-1,
2,
2,
3,
10,
6,
14,
-1,
10,
8,
0,
1,
0,
16,
4,
15,
13,
9,
4,
7,
3,
0,
11,
1,
3,
9,
9,
10,
14,
11,
7,
2,
6,
10,
2,
8,
2,
2,
0,
8,
7,
-1,
0,
13,
0,
1,
9,
6,
0,
7,
0,
0,
4,
20,
3,
5,
7,
14,
0,
13,
0,
-1,
6,
19,
0,
7,
0,
18,
-1,
0,
11,
0,
6,
1,
-1,
8,
4,
6,
7,
11,
11,
0,
3,
5,
10,
5,
16,
11,
0,
-1,
22,
13,
0,
12,
0,
6,
0,
0,
0,
1,
8,
14,
1,
13,
6,
2,
8,
1,
19,
14,
15,
17,
2,
13,
10,
7,
-1,
8,
3,
9,
9,
22,
12,
6,
10,
9,
10,
9,
8,
14,
15,
20,
7,
3,
3,
22,
13,
5,
13,
0,
11,
-1,
4,
4,
9,
4,
0,
4,
8,
11,
6,
10,
4,
16,
11,
16,
3,
12,
8,
4,
5,
13,
9,
5,
8,
9,
4,
4,
0,
0,
8,
-1,
-1,
13,
0,
5,
14,
0,
10,
14,
18,
11,
-1,
3,
9,
19,
9,
3,
8,
5,
3,
-1,
-1,
14,
4,
10,
2,
0,
7,
12,
7,
15,
10,
10,
4,
3,
13,
2,
22,
8,
7,
0,
-1,
0,
4,
4,
5,
3,
2,
9,
0,
0,
4,
10,
0,
16,
0,
6,
14,
0,
2,
-1,
8,
1,
1,
11,
9,
8,
1,
-1,
0,
12,
12,
4,
9,
1,
8,
3,
0,
1,
4,
0,
14,
4,
11,
15,
14,
1,
14,
20,
6,
12,
11,
0,
9,
0,
5,
12,
13,
9,
0,
0,
0,
10,
0,
9,
6,
-1,
11,
5,
8,
0,
11,
5,
6,
19,
8,
13,
4,
12,
1,
9,
4,
7,
12,
5,
10,
10,
11,
2,
3,
13,
20,
11,
19,
3,
-1,
13,
21,
1,
7,
0,
4,
7,
3,
11,
0,
5,
13,
1,
6,
9,
14,
11,
12,
1,
-1,
9,
10,
0,
12,
3,
7,
-1,
10,
18,
12,
11,
2,
11,
5,
0,
0,
20,
2,
10,
1,
2,
12,
16,
1,
-1,
7,
13,
0,
-1,
9,
11,
5,
0,
11,
0,
8,
-1,
12,
12,
7,
6,
11,
7,
9,
16,
2,
0,
12,
12,
11,
12,
4,
5,
0,
0,
0,
0,
2,
9,
19,
7,
0,
14,
3,
11,
-1,
5,
1,
7,
-1,
5,
2,
6,
7,
-1,
6,
1,
2,
0,
14,
13,
7,
5,
2,
10,
7,
5,
0,
12,
15,
15,
0,
1,
0,
-1,
5,
13,
7,
8,
3,
9,
1,
6,
3,
9,
1,
12,
6,
0,
1,
3,
3,
0,
15,
0,
14,
6,
13,
6,
12,
5,
1,
0,
1,
9,
11,
9,
-1,
0,
0,
9,
0,
1,
18,
1,
21,
13,
4,
-1,
17,
17,
1,
4,
8,
0,
0,
13,
5,
7,
6,
11,
12,
-1,
14,
14,
20,
9,
0,
8,
2,
5,
0,
-1,
1,
3,
4,
-1,
1,
14,
11,
3,
7,
4,
6,
15,
9,
16,
9,
15,
13,
0,
13,
11,
10,
15,
9,
10,
6,
1,
5,
18,
22,
0,
9,
18,
0,
6,
14,
0,
12,
13,
3,
6,
17,
6,
8,
7,
1,
11,
8,
13,
14,
20,
0,
16,
0,
0,
3,
-1,
0,
0,
0,
14,
21,
16,
7,
5,
0,
13,
14,
0,
10,
8,
0,
0,
-1,
0,
18,
8,
4,
3,
1,
0,
13,
6,
8,
0,
10,
-1,
13,
2,
1,
5,
0,
10,
13,
7,
14,
12,
-1,
8,
0,
11,
5,
9,
9,
6,
17,
9,
0,
2,
3,
7,
8,
9,
20,
10,
17,
1,
10,
0,
0,
9,
4,
16,
2,
8,
18,
9,
3,
8,
2,
11,
9,
9,
-1,
4,
0,
9,
12,
7,
13,
8,
15,
9,
9,
5,
14,
0,
0,
-1,
13,
-1,
6,
5,
2,
7,
8,
9,
13,
1,
3,
3,
5,
2,
10,
3,
0,
2,
10,
6,
10,
8,
13,
0,
5,
5,
0,
2,
15,
9,
19,
1,
8,
7,
-1,
18,
2,
1,
8,
0,
7,
14,
6,
11,
0,
2,
15,
9,
13,
11,
22,
15
],
"topic_sizes": {
"7": 102,
"12": 85,
"0": 303,
"5": 102,
"1": 117,
"2": 106,
"13": 81,
"18": 27,
"3": 104,
"20": 22,
"4": 103,
"17": 27,
"16": 27,
"10": 97,
"9": 99,
"6": 102,
"-1": 104,
"11": 96,
"8": 100,
"15": 37,
"19": 23,
"14": 67,
"21": 16,
"22": 13
},
"topic_mapper": [
[
-1,
-1,
-1
],
[
0,
0,
14
],
[
1,
1,
9
],
[
2,
2,
5
],
[
3,
3,
3
],
[
4,
4,
2
],
[
5,
5,
10
],
[
6,
6,
0
],
[
7,
7,
11
],
[
8,
8,
6
],
[
9,
9,
7
],
[
10,
10,
1
],
[
11,
11,
21
],
[
12,
12,
13
],
[
13,
13,
8
],
[
14,
14,
20
],
[
15,
15,
4
],
[
16,
16,
12
],
[
17,
17,
18
],
[
18,
18,
15
],
[
19,
19,
19
],
[
20,
20,
16
],
[
21,
21,
22
],
[
22,
22,
17
]
],
"topic_labels": {
"-1": "-1_no_saic_raw_sp_sep_4_sec_data",
"0": "0_lecture_applications_methods_learning",
"1": "1_cogvideo_videos_cogview2_cog",
"2": "2_ship_rainsford_hunted_island",
"3": "3_films_dissertation_film_noir",
"4": "4_linguistics_language_languages_foundational",
"5": "5_nemo_dory_transcript_clownfish",
"6": "6_train_bruno_washington_station",
"7": "7_images_representations_image_captions",
"8": "8_merge_merging_explain_concept",
"9": "9_enhancement_enhancing_recordings_improve",
"10": "10_arendelle_elsa_frozen_kristoff",
"11": "11_scene_story_script_movie",
"12": "12_lecture_lemmatization_nlp_medical",
"13": "13_questions_topics_conversation_terrance",
"14": "14_sniper_kill_fury_combat",
"15": "15_images_lecture_ezurich_pathology",
"16": "16_timeseries_framework_interpretability_representations",
"17": "17_prediction_predictions_forecasting_predict",
"18": "18_images_imaging_computational_convolutional",
"19": "19_technology_treatment_methods_medical",
"20": "20_novel_translation_henry_read",
"21": "21_abridged_brief_synopsis_short",
"22": "22_lecture_pathology_medical_computational"
},
"custom_labels": null,
"_outliers": 1,
"topic_aspects": {}
}