pszemraj's picture
Add BERTopic model
f30bdc1
raw
history blame
16.6 kB
{
"topic_representations": {
"-1": [
[
"convolutional",
0.812958836555481
],
[
"images",
0.789915144443512
],
[
"networks",
0.7750969529151917
],
[
"superpixels",
0.7669301629066467
],
[
"overfitting",
0.766011118888855
],
[
"image",
0.7607262134552002
],
[
"segmentation",
0.7580690383911133
],
[
"neural",
0.7571927905082703
],
[
"input",
0.7562020421028137
],
[
"nn",
0.7535852789878845
]
],
"0": [
[
"bruno",
0.782376766204834
],
[
"guy",
0.7694101333618164
],
[
"pdf",
0.7633169889450073
],
[
"screentalk",
0.7479361295700073
],
[
"he",
0.7390514612197876
],
[
"int",
0.7379845380783081
],
[
"his",
0.7341611385345459
],
[
"converted",
0.7340353727340698
],
[
"out",
0.7325744032859802
],
[
"voice",
0.7307334542274475
]
],
"1": [
[
"elsa",
0.8160275816917419
],
[
"arendelle",
0.7971220016479492
],
[
"kristoff",
0.7863443493843079
],
[
"frozen",
0.7767009139060974
],
[
"anna",
0.7665482759475708
],
[
"olaf",
0.7611944675445557
],
[
"hans",
0.7529194355010986
],
[
"snow",
0.7397163510322571
],
[
"no",
0.7334048748016357
],
[
"sven",
0.7317110300064087
]
],
"2": [
[
"gillis",
0.780834436416626
],
[
"script",
0.7442724704742432
],
[
"room",
0.7441475987434387
],
[
"ll",
0.7397430539131165
],
[
"artie",
0.7382926940917969
],
[
"norma",
0.7371121048927307
],
[
"house",
0.7355591058731079
],
[
"some",
0.7345719933509827
],
[
"no",
0.7334718108177185
],
[
"out",
0.7313063144683838
]
],
"3": [
[
"interpretation",
0.7614122629165649
],
[
"explanation",
0.7482936382293701
],
[
"theory",
0.7403494119644165
],
[
"structure",
0.7351824045181274
],
[
"merge",
0.7320129871368408
],
[
"conditions",
0.7313622236251831
],
[
"simplest",
0.7254719734191895
],
[
"interesting",
0.7216659784317017
],
[
"system",
0.7192807197570801
],
[
"something",
0.7187553644180298
]
],
"4": [
[
"topics",
0.7710573673248291
],
[
"topic",
0.764340877532959
],
[
"documents",
0.7622215747833252
],
[
"corpus",
0.7556679844856262
],
[
"document",
0.7548444271087646
],
[
"data",
0.7541389465332031
],
[
"words",
0.7497113943099976
],
[
"frequency",
0.7443191409111023
],
[
"vocabulary",
0.7432523369789124
],
[
"example",
0.7350988388061523
]
],
"5": [
[
"nemo",
0.8560476303100586
],
[
"dory",
0.8030993938446045
],
[
"chum",
0.7655107975006104
],
[
"gill",
0.7619814872741699
],
[
"fish",
0.7474814653396606
],
[
"sharkbait",
0.7334390878677368
],
[
"swim",
0.732296347618103
],
[
"uh",
0.7292873859405518
],
[
"coral",
0.728416919708252
],
[
"no",
0.7282388210296631
]
],
"6": [
[
"films",
0.7558428645133972
],
[
"film",
0.7491594552993774
],
[
"identity",
0.7483522891998291
],
[
"trauma",
0.7400946617126465
],
[
"zinnemann",
0.7322919368743896
],
[
"identities",
0.7272083163261414
],
[
"traces",
0.7219871282577515
],
[
"urban",
0.721187174320221
],
[
"between",
0.7194730639457703
],
[
"materiality",
0.7193468809127808
]
],
"7": [
[
"computational",
0.7724958658218384
],
[
"data",
0.7706875205039978
],
[
"pathology",
0.7677849531173706
],
[
"medical",
0.7668463587760925
],
[
"informatics",
0.7635326385498047
],
[
"classification",
0.7610385417938232
],
[
"medical_",
0.7591860890388489
],
[
"data_",
0.7576411962509155
],
[
"icu",
0.7570323944091797
],
[
"images",
0.7569260597229004
]
],
"8": [
[
"images",
0.8044949173927307
],
[
"captions",
0.783771812915802
],
[
"representations",
0.7822390794754028
],
[
"embeddings",
0.7761370539665222
],
[
"image",
0.7710026502609253
],
[
"embedding",
0.766433835029602
],
[
"conditioning",
0.7635176777839661
],
[
"encoder",
0.7606396675109863
],
[
"decoder",
0.7513459920883179
],
[
"classifier",
0.7493197917938232
]
],
"9": [
[
"zaroff",
0.7830722332000732
],
[
"rainsford",
0.7752155065536499
],
[
"hunt",
0.7669715285301208
],
[
"hunting",
0.758228063583374
],
[
"general",
0.7424396872520447
],
[
"he",
0.7389982342720032
],
[
"ll",
0.7381408214569092
],
[
"hunter",
0.7372696995735168
],
[
"had",
0.733473539352417
],
[
"man",
0.7315329909324646
]
],
"10": [
[
"cogvideo",
0.8041282892227173
],
[
"interpolation",
0.7749236226081848
],
[
"videos",
0.7728286981582642
],
[
"coglm",
0.7700319290161133
],
[
"frames",
0.7670143246650696
],
[
"iterations",
0.7624410390853882
],
[
"sequential",
0.7571900486946106
],
[
"cog",
0.7526829242706299
],
[
"pretraining",
0.7518821954727173
],
[
"model",
0.7496122121810913
]
],
"11": [
[
"assignment",
0.7819938659667969
],
[
"essays",
0.7542336583137512
],
[
"questions",
0.7518027424812317
],
[
"projects",
0.7412513494491577
],
[
"students",
0.7385664582252502
],
[
"learning",
0.7382364273071289
],
[
"readings",
0.7367334365844727
],
[
"homework",
0.7351245880126953
],
[
"session",
0.7344810962677002
],
[
"required",
0.729199230670929
]
],
"12": [
[
"things",
0.7505715489387512
],
[
"ll",
0.7484922409057617
],
[
"some",
0.7481634616851807
],
[
"lol",
0.7392996549606323
],
[
"explain",
0.732305645942688
],
[
"why",
0.7317633628845215
],
[
"can",
0.7299840450286865
],
[
"think",
0.7281968593597412
],
[
"thoughts",
0.727929949760437
],
[
"am",
0.7273967862129211
]
],
"13": [
[
"videos",
0.7792222499847412
],
[
"arxiv",
0.7715873718261719
],
[
"visual",
0.7565194964408875
],
[
"preprint",
0.7493596076965332
],
[
"generative",
0.7435239553451538
],
[
"models",
0.7431691884994507
],
[
"ieeeicvf",
0.7431351542472839
],
[
"ieee",
0.7425673007965088
],
[
"generating",
0.7353911995887756
],
[
"video",
0.7344731092453003
]
],
"14": [
[
"spectrograms",
0.8015516996383667
],
[
"musecoder",
0.7912242412567139
],
[
"melspectrogram",
0.7880717515945435
],
[
"vocoding",
0.7843880653381348
],
[
"spectrogram",
0.7839890122413635
],
[
"waveforms",
0.7807684540748596
],
[
"enhancement",
0.7761921286582947
],
[
"recordings",
0.7706590294837952
],
[
"waveform",
0.7621763348579407
],
[
"diffwave",
0.7587536573410034
]
]
},
"topics": [
7,
-1,
-1,
-1,
8,
-1,
-1,
-1,
-1,
-1,
-1,
7,
7,
7,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
7,
7,
7,
7,
-1,
7,
7,
7,
7,
7,
7,
8,
7,
7,
7,
7,
7,
7,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
9,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
5,
0,
11,
4,
4,
11,
11,
11,
11,
11,
11,
11,
-1,
-1,
4,
-1,
11,
4,
11,
4,
4,
4,
4,
4,
4,
11,
12,
12,
12,
12,
12,
12,
12,
12,
12,
12,
12,
12,
12,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
0,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
6,
10,
13,
10,
-1,
10,
10,
10,
10,
10,
10,
10,
10,
10,
10,
10,
10,
13,
13,
13,
13,
10,
10,
10,
-1,
11,
11,
11,
4,
4,
4,
4,
4,
4,
4,
-1,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
-1,
11,
6,
0,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
2,
0,
2,
2,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
8,
13,
13,
-1,
13,
13,
13,
13,
13,
-1,
8,
8,
8,
0,
14,
14,
14,
14,
14,
14,
14,
14,
14,
14,
14,
13,
-1,
-1,
14,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
11,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
4,
7,
4,
4,
4,
4,
4,
4,
4,
-1,
7,
7,
7,
4,
-1,
-1,
-1,
-1,
7,
7,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1
],
"topic_sizes": {
"7": 26,
"-1": 26,
"8": 24,
"0": 94,
"9": 24,
"5": 54,
"11": 16,
"4": 56,
"12": 13,
"6": 47,
"10": 17,
"13": 13,
"2": 72,
"14": 12,
"3": 63,
"1": 73
},
"topic_mapper": [
[
-1,
-1,
-1
],
[
0,
0,
1
],
[
1,
1,
5
],
[
2,
2,
6
],
[
3,
3,
9
],
[
4,
4,
0
],
[
5,
5,
2
],
[
6,
6,
12
],
[
7,
7,
3
],
[
8,
8,
11
],
[
9,
9,
4
],
[
10,
10,
7
],
[
11,
11,
14
],
[
12,
12,
8
],
[
13,
13,
13
],
[
14,
14,
10
]
],
"topic_labels": {
"-1": "-1_convolutional_images_networks_superpixels",
"0": "0_bruno_guy_pdf_screentalk",
"1": "1_elsa_arendelle_kristoff_frozen",
"2": "2_gillis_script_room_ll",
"3": "3_interpretation_explanation_theory_structure",
"4": "4_topics_topic_documents_corpus",
"5": "5_nemo_dory_chum_gill",
"6": "6_films_film_identity_trauma",
"7": "7_computational_data_pathology_medical",
"8": "8_images_captions_representations_embeddings",
"9": "9_zaroff_rainsford_hunt_hunting",
"10": "10_cogvideo_interpolation_videos_coglm",
"11": "11_assignment_essays_questions_projects",
"12": "12_things_ll_some_lol",
"13": "13_videos_arxiv_visual_preprint",
"14": "14_spectrograms_musecoder_melspectrogram_vocoding"
},
"custom_labels": null,
"_outliers": 1,
"topic_aspects": {}
}