diff --git a/.gitattributes b/.gitattributes index 2b1a2dd26f82f7eeb01e627167f0b0beb3e68793..843d6bff1705e8ec8e82679b2fb25f834dbc131e 100644 --- a/.gitattributes +++ b/.gitattributes @@ -35,3 +35,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text classifierDL-lang-detect/stages/1_UNIVERSAL_SENTENCE_ENCODER_4de71669b7ec/use_tensorflow filter=lfs diff=lfs merge=lfs -text classifierDL-lang-detect/stages/2_ClassifierDLModel_7d8464466588/classifierdl_tensorflow filter=lfs diff=lfs merge=lfs -text +classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/bert_onnx filter=lfs diff=lfs merge=lfs -text +classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/classifierdl_tensorflow filter=lfs diff=lfs merge=lfs -text diff --git a/classifierDL-bert-lang-detect/metadata/_SUCCESS b/classifierDL-bert-lang-detect/metadata/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/metadata/_committed_6593034593231839734 b/classifierDL-bert-lang-detect/metadata/_committed_6593034593231839734 new file mode 100644 index 0000000000000000000000000000000000000000..0aa845f1a67cc8318cfa533c769eac6728d26c51 --- /dev/null +++ b/classifierDL-bert-lang-detect/metadata/_committed_6593034593231839734 @@ -0,0 +1 @@ +{"added":["part-00000-tid-6593034593231839734-2eaa5d67-5ef0-4066-9f3b-ecc65cf0d06f-302-1-c000.txt"],"removed":[]} \ No newline at end of file diff --git a/classifierDL-bert-lang-detect/metadata/_started_6593034593231839734 b/classifierDL-bert-lang-detect/metadata/_started_6593034593231839734 new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/metadata/part-00000-tid-6593034593231839734-2eaa5d67-5ef0-4066-9f3b-ecc65cf0d06f-302-1-c000.txt b/classifierDL-bert-lang-detect/metadata/part-00000-tid-6593034593231839734-2eaa5d67-5ef0-4066-9f3b-ecc65cf0d06f-302-1-c000.txt new file mode 100644 index 0000000000000000000000000000000000000000..8a42321d9495df5cc5607c59dd46749a77ddc282 --- /dev/null +++ b/classifierDL-bert-lang-detect/metadata/part-00000-tid-6593034593231839734-2eaa5d67-5ef0-4066-9f3b-ecc65cf0d06f-302-1-c000.txt @@ -0,0 +1 @@ +{"class":"org.apache.spark.ml.PipelineModel","timestamp":1727274381634,"sparkVersion":"3.5.0","uid":"PipelineModel_1e1260dd05f2","paramMap":{"stageUids":["DocumentAssembler_a85d70e054b5","REGEX_TOKENIZER_bc93b0d170c6","BERT_EMBEDDINGS_69dd9fb1854f","SentenceEmbeddings_5f3b5483102a","ClassifierDLModel_a78c9498f386"]},"defaultParamMap":{}} diff --git a/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/_SUCCESS b/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/_committed_4249049908337889056 b/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/_committed_4249049908337889056 new file mode 100644 index 0000000000000000000000000000000000000000..8a1eb25b878cd837ae6b1cd08aa8df58d77133e8 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/_committed_4249049908337889056 @@ -0,0 +1 @@ +{"added":["part-00000-tid-4249049908337889056-a4a31c1d-3f7b-4051-adb3-64864ba4b29e-303-1-c000.txt"],"removed":[]} \ No newline at end of file diff --git a/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/_started_4249049908337889056 b/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/_started_4249049908337889056 new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/part-00000-tid-4249049908337889056-a4a31c1d-3f7b-4051-adb3-64864ba4b29e-303-1-c000.txt b/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/part-00000-tid-4249049908337889056-a4a31c1d-3f7b-4051-adb3-64864ba4b29e-303-1-c000.txt new file mode 100644 index 0000000000000000000000000000000000000000..bac06b907a17fd5186909b490717b74dbe6b58d3 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/0_DocumentAssembler_a85d70e054b5/metadata/part-00000-tid-4249049908337889056-a4a31c1d-3f7b-4051-adb3-64864ba4b29e-303-1-c000.txt @@ -0,0 +1 @@ +{"class":"com.johnsnowlabs.nlp.DocumentAssembler","timestamp":1727274382400,"sparkVersion":"3.5.0","uid":"DocumentAssembler_a85d70e054b5","paramMap":{"inputCol":"text","outputCol":"document"},"defaultParamMap":{"cleanupMode":"disabled","outputCol":"document"}} diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/_SUCCESS b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00000 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00000 new file mode 100644 index 0000000000000000000000000000000000000000..e70980676cc70ca503389d2c9ee2247c40389794 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00000 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00001 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00001 new file mode 100644 index 0000000000000000000000000000000000000000..08b7402a12a4262c10747ad6eff4e4569d542081 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00001 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00002 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00002 new file mode 100644 index 0000000000000000000000000000000000000000..d59dd8feb127dec726b9ab9a20333f865a865c34 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00002 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00003 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00003 new file mode 100644 index 0000000000000000000000000000000000000000..f258c574d517176733e5293ebb6fc070b9eaa6a7 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00003 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00004 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00004 new file mode 100644 index 0000000000000000000000000000000000000000..a9c4fa3a07668e2fd5324d215cadf8e8662b72e0 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00004 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00005 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00005 new file mode 100644 index 0000000000000000000000000000000000000000..cfcbece56ab1fde904d873ecc8c0b3455e924ae3 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00005 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00006 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00006 new file mode 100644 index 0000000000000000000000000000000000000000..277411c1a02bbb22d9e5dfe907b227fe372fdd71 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00006 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00007 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00007 new file mode 100644 index 0000000000000000000000000000000000000000..bad6ca93fcb2536071894eb090bcd19838540621 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/fields/rules/part-00007 differ diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/_SUCCESS b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/_committed_5570049922655100179 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/_committed_5570049922655100179 new file mode 100644 index 0000000000000000000000000000000000000000..0ad504c36e0d8b384b0d38a4cd0aec30fe75aac2 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/_committed_5570049922655100179 @@ -0,0 +1 @@ +{"added":["part-00000-tid-5570049922655100179-03384181-9cc1-419d-ad0b-7e906f83f8f0-304-1-c000.txt"],"removed":[]} \ No newline at end of file diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/_started_5570049922655100179 b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/_started_5570049922655100179 new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/part-00000-tid-5570049922655100179-03384181-9cc1-419d-ad0b-7e906f83f8f0-304-1-c000.txt b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/part-00000-tid-5570049922655100179-03384181-9cc1-419d-ad0b-7e906f83f8f0-304-1-c000.txt new file mode 100644 index 0000000000000000000000000000000000000000..83d19e735c7c70b2bbf67a8c36c1327e1ced29ff --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/1_REGEX_TOKENIZER_bc93b0d170c6/metadata/part-00000-tid-5570049922655100179-03384181-9cc1-419d-ad0b-7e906f83f8f0-304-1-c000.txt @@ -0,0 +1 @@ +{"class":"com.johnsnowlabs.nlp.annotators.TokenizerModel","timestamp":1727274383139,"sparkVersion":"3.5.0","uid":"REGEX_TOKENIZER_bc93b0d170c6","paramMap":{"maxLength":99999,"minLength":0,"caseSensitiveExceptions":true,"outputCol":"token","inputCols":["document"],"targetPattern":"\\S+"},"defaultParamMap":{"maxLength":99999,"minLength":0,"caseSensitiveExceptions":true,"outputCol":"token","inputCols":["document"],"targetPattern":"\\S+","lazyAnnotator":false}} diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/bert_onnx b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/bert_onnx new file mode 100644 index 0000000000000000000000000000000000000000..997aef12d52231fe8c633c41cf845c7dca6e6bc0 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/bert_onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d2af9c6956ed07090dcb7663b1ba95f0721da09ba92b5d08f1af77f6d31d04 +size 152122568 diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/_SUCCESS b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00000 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00000 new file mode 100644 index 0000000000000000000000000000000000000000..abd31fdca3e8ff8840233ae705d962a9fc40bc16 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00000 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00001 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00001 new file mode 100644 index 0000000000000000000000000000000000000000..4c6f501a2201e54032be4d387dab42eb7bcea816 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00001 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00002 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00002 new file mode 100644 index 0000000000000000000000000000000000000000..d36a9d3c169191664955db7b9a17e48c3e992811 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00002 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00003 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00003 new file mode 100644 index 0000000000000000000000000000000000000000..c8ccce68326e801e9efea9dbc4a75d09d2371949 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00003 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00004 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00004 new file mode 100644 index 0000000000000000000000000000000000000000..26343ea2c79f37becb78b1f8ae156227c3198abb Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00004 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00005 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00005 new file mode 100644 index 0000000000000000000000000000000000000000..9681a6ca1bf4d4c286bca223e9c5e926c76090f7 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00005 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00006 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00006 new file mode 100644 index 0000000000000000000000000000000000000000..a63b5752f59ceb5ab533d58ba3d3bf888c74bfe7 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00006 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00007 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00007 new file mode 100644 index 0000000000000000000000000000000000000000..c78fc8fd5ca5e909e40a513bb85809d9c311a383 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/fields/vocabulary/part-00007 differ diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/_SUCCESS b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/_committed_4031617553090561353 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/_committed_4031617553090561353 new file mode 100644 index 0000000000000000000000000000000000000000..c0a4bf9380edec8dc91782ad637cafcbdc916e16 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/_committed_4031617553090561353 @@ -0,0 +1 @@ +{"added":["part-00000-tid-4031617553090561353-9ae763c5-4ae4-41a4-bc41-0a6d28282a0c-313-1-c000.txt"],"removed":[]} \ No newline at end of file diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/_started_4031617553090561353 b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/_started_4031617553090561353 new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/part-00000-tid-4031617553090561353-9ae763c5-4ae4-41a4-bc41-0a6d28282a0c-313-1-c000.txt b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/part-00000-tid-4031617553090561353-9ae763c5-4ae4-41a4-bc41-0a6d28282a0c-313-1-c000.txt new file mode 100644 index 0000000000000000000000000000000000000000..97dc217d6e3f34404fe183b4cb57a4e9c3c2d810 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/2_BERT_EMBEDDINGS_69dd9fb1854f/metadata/part-00000-tid-4031617553090561353-9ae763c5-4ae4-41a4-bc41-0a6d28282a0c-313-1-c000.txt @@ -0,0 +1 @@ +{"class":"com.johnsnowlabs.nlp.embeddings.BertEmbeddings","timestamp":1727274384268,"sparkVersion":"3.5.0","uid":"BERT_EMBEDDINGS_69dd9fb1854f","paramMap":{"dimension":768,"outputCol":"embeddings","caseSensitive":false,"storageRef":"small_bert_L2_768","inputCols":["document","token"],"engine":"onnx"},"defaultParamMap":{"dimension":768,"caseSensitive":false,"storageRef":"BERT_EMBEDDINGS_69dd9fb1854f","maxSentenceLength":128,"engine":"tensorflow","lazyAnnotator":false,"batchSize":8}} diff --git a/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/_SUCCESS b/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/_committed_3272538039056848776 b/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/_committed_3272538039056848776 new file mode 100644 index 0000000000000000000000000000000000000000..383f9ab99532402c8ca2843a4cceb1a455f1edd2 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/_committed_3272538039056848776 @@ -0,0 +1 @@ +{"added":["part-00000-tid-3272538039056848776-6af10195-5094-49e2-a0ad-e92bb8525b0a-322-1-c000.txt"],"removed":[]} \ No newline at end of file diff --git a/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/_started_3272538039056848776 b/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/_started_3272538039056848776 new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/part-00000-tid-3272538039056848776-6af10195-5094-49e2-a0ad-e92bb8525b0a-322-1-c000.txt b/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/part-00000-tid-3272538039056848776-6af10195-5094-49e2-a0ad-e92bb8525b0a-322-1-c000.txt new file mode 100644 index 0000000000000000000000000000000000000000..5e808afaedaec2fd6e43865c6b76f32a0ef5e09c --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/3_SentenceEmbeddings_5f3b5483102a/metadata/part-00000-tid-3272538039056848776-6af10195-5094-49e2-a0ad-e92bb8525b0a-322-1-c000.txt @@ -0,0 +1 @@ +{"class":"com.johnsnowlabs.nlp.embeddings.SentenceEmbeddings","timestamp":1727274387626,"sparkVersion":"3.5.0","uid":"SentenceEmbeddings_5f3b5483102a","paramMap":{"outputCol":"sentence_embeddings","storageRef":"small_bert_L2_768","poolingStrategy":"AVERAGE","inputCols":["document","embeddings"]},"defaultParamMap":{"dimension":100,"outputCol":"sentence_embeddings","poolingStrategy":"AVERAGE","storageRef":"SentenceEmbeddings_5f3b5483102a","inputCols":["document","word_embeddings"],"lazyAnnotator":false}} diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/classifierdl_tensorflow b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/classifierdl_tensorflow new file mode 100644 index 0000000000000000000000000000000000000000..87116f5fcf27e18ab05d997ce95596d032211558 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/classifierdl_tensorflow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bcd8b7cea838731d7dfa5f1ee827386370f6eb2847660db33efb48a6f90e925 +size 51639695 diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/_SUCCESS b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00000 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00000 new file mode 100644 index 0000000000000000000000000000000000000000..7429dec4784a268d6e785204db82c25d05526325 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00000 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00001 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00001 new file mode 100644 index 0000000000000000000000000000000000000000..c2ea076b6a8402ab6c8285f89d4aac974a838fa5 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00001 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00002 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00002 new file mode 100644 index 0000000000000000000000000000000000000000..6969bd561996462f3dd22382241fe59fa18550e3 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00002 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00003 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00003 new file mode 100644 index 0000000000000000000000000000000000000000..c4ad7476dcae800aaeeb190cf7bdb0c667146773 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00003 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00004 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00004 new file mode 100644 index 0000000000000000000000000000000000000000..b906f69395b0f0a439b9c7e094243f03684be835 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00004 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00005 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00005 new file mode 100644 index 0000000000000000000000000000000000000000..745a85a9be89df3619a63ae4fe702963b647dbfa Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00005 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00006 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00006 new file mode 100644 index 0000000000000000000000000000000000000000..606a34fd59438055b30fb1051409f5bb2f63b1f4 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00006 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00007 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00007 new file mode 100644 index 0000000000000000000000000000000000000000..68b32347e6a46f29353bc8b017fe4e3e1addfaf1 Binary files /dev/null and b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/fields/datasetParams/part-00007 differ diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/_SUCCESS b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/_SUCCESS new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/_committed_3497803354294866002 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/_committed_3497803354294866002 new file mode 100644 index 0000000000000000000000000000000000000000..bab144e72338c79a851cb7dd9f444e8d68fd16d2 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/_committed_3497803354294866002 @@ -0,0 +1 @@ +{"added":["part-00000-tid-3497803354294866002-5dd99f8c-edda-4395-a837-5aa00e5d12ad-323-1-c000.txt"],"removed":[]} \ No newline at end of file diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/_started_3497803354294866002 b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/_started_3497803354294866002 new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/part-00000-tid-3497803354294866002-5dd99f8c-edda-4395-a837-5aa00e5d12ad-323-1-c000.txt b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/part-00000-tid-3497803354294866002-5dd99f8c-edda-4395-a837-5aa00e5d12ad-323-1-c000.txt new file mode 100644 index 0000000000000000000000000000000000000000..61a7a62d1096407e28b03ba9d6f879d8882a53d8 --- /dev/null +++ b/classifierDL-bert-lang-detect/stages/4_ClassifierDLModel_a78c9498f386/metadata/part-00000-tid-3497803354294866002-5dd99f8c-edda-4395-a837-5aa00e5d12ad-323-1-c000.txt @@ -0,0 +1 @@ +{"class":"com.johnsnowlabs.nlp.annotators.classifier.dl.ClassifierDLModel","timestamp":1727274388341,"sparkVersion":"3.5.0","uid":"ClassifierDLModel_a78c9498f386","paramMap":{"inputCols":["sentence_embeddings"],"storageRef":"small_bert_L2_768","outputCol":"class"},"defaultParamMap":{"storageRef":"ClassifierDLModel_a78c9498f386","engine":"tensorflow","lazyAnnotator":false}}