diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_base_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_base_en.md new file mode 100644 index 00000000000000..929f5a9f950935 --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_base_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Base Sentence Embeddings +author: John Snow Labs +name: e5_base +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_base_en_5.1.0_3.0_1692963566674.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_base_en_5.1.0_3.0_1692963566674.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_base","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_base","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_base| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|258.6 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_base_opt_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_base_opt_en.md new file mode 100644 index 00000000000000..f99faf717c9112 --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_base_opt_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Base Sentence Embeddings +author: John Snow Labs +name: e5_base_opt +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_base_opt_en_5.1.0_3.0_1692963694288.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_base_opt_en_5.1.0_3.0_1692963694288.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_base_opt","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_base_opt","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_base_opt| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|258.7 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_base_quantized_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_base_quantized_en.md new file mode 100644 index 00000000000000..54ef0a2318bf87 --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_base_quantized_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Base Sentence Embeddings +author: John Snow Labs +name: e5_base_quantized +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_base_quantized_en_5.1.0_3.0_1692963757236.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_base_quantized_en_5.1.0_3.0_1692963757236.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_base_quantized","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_base_quantized","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_base_quantized| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|67.1 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_en.md new file mode 100644 index 00000000000000..15e45179946d28 --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_en.md @@ -0,0 +1,68 @@ +--- +layout: model +title: E5 Base v2 Sentence Embeddings +author: John Snow Labs +name: e5_base_v2 +date: 2023-08-25 +tags: [e5, sentence_embeddings, en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_base_v2_en_5.1.0_3.0_1692964050132.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_base_v2_en_5.1.0_3.0_1692964050132.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_base_v2","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_base_v2","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") + +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_base_v2| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|258.7 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_opt_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_opt_en.md new file mode 100644 index 00000000000000..0d653f873d5d8c --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_opt_en.md @@ -0,0 +1,68 @@ +--- +layout: model +title: E5 Base v2 Sentence Embeddings +author: John Snow Labs +name: e5_base_v2_opt +date: 2023-08-25 +tags: [e5, sentence_embeddings, en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_base_v2_opt_en_5.1.0_3.0_1692964193495.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_base_v2_opt_en_5.1.0_3.0_1692964193495.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_base_v2_opt","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_base_v2_opt","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") + +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_base_v2_opt| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|258.8 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_quantized_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_quantized_en.md new file mode 100644 index 00000000000000..75437db6e111ab --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_base_v2_quantized_en.md @@ -0,0 +1,68 @@ +--- +layout: model +title: E5 Base v2 Sentence Embeddings +author: John Snow Labs +name: e5_base_v2_quantized +date: 2023-08-25 +tags: [e5, sentence_embeddings, en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_base_v2_quantized_en_5.1.0_3.0_1692964219731.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_base_v2_quantized_en_5.1.0_3.0_1692964219731.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_base_v2_quantized","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_base_v2_quantized","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") + +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_base_v2_quantized| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|67.0 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_large_v2_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_large_v2_en.md new file mode 100644 index 00000000000000..4a298c0a806b54 --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_large_v2_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Large V2 Sentence Embeddings +author: John Snow Labs +name: e5_large_v2 +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_large_v2_en_5.1.0_3.0_1692966772284.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_large_v2_en_5.1.0_3.0_1692966772284.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_large_v2","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_large_v2","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_large_v2| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|796.3 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_small_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_small_en.md new file mode 100644 index 00000000000000..fbddfdeb65d03e --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_small_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Small Sentence Embeddings +author: John Snow Labs +name: e5_small +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_small_en_5.1.0_3.0_1692963401947.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_small_en_5.1.0_3.0_1692963401947.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_small","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_small","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_small| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|79.9 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_small_opt_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_small_opt_en.md new file mode 100644 index 00000000000000..1e4e5a465a95c0 --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_small_opt_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Small Sentence Embeddings +author: John Snow Labs +name: e5_small_opt +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_small_opt_en_5.1.0_3.0_1692963460075.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_small_opt_en_5.1.0_3.0_1692963460075.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_small_opt","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_small_opt","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_small_opt| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|80.0 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_small_quantized_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_small_quantized_en.md new file mode 100644 index 00000000000000..1390bd612bc4be --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_small_quantized_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Small Sentence Embeddings +author: John Snow Labs +name: e5_small_quantized +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_small_quantized_en_5.1.0_3.0_1692963474009.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_small_quantized_en_5.1.0_3.0_1692963474009.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_small_quantized","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_small_quantized","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_small_quantized| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|22.6 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_en.md new file mode 100644 index 00000000000000..1b09d77aafd5a8 --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Small V2 Sentence Embeddings +author: John Snow Labs +name: e5_small_v2 +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_small_v2_en_5.1.0_3.0_1692963575848.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_small_v2_en_5.1.0_3.0_1692963575848.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_small_v2","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_small_v2","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_small_v2| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|79.9 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_opt_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_opt_en.md new file mode 100644 index 00000000000000..3278b5279d205c --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_opt_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Small V2 Sentence Embeddings +author: John Snow Labs +name: e5_small_v2_opt +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_small_v2_opt_en_5.1.0_3.0_1692963627616.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_small_v2_opt_en_5.1.0_3.0_1692963627616.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_small_v2_opt","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_small_v2_opt","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_small_v2_opt| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|79.9 MB| \ No newline at end of file diff --git a/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_quantized_en.md b/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_quantized_en.md new file mode 100644 index 00000000000000..62165b979f010d --- /dev/null +++ b/docs/_posts/ahmedlone127/2023-08-25-e5_small_v2_quantized_en.md @@ -0,0 +1,67 @@ +--- +layout: model +title: E5 Small V2 Sentence Embeddings +author: John Snow Labs +name: e5_small_v2_quantized +date: 2023-08-25 +tags: [en, open_source, onnx] +task: Embeddings +language: en +edition: Spark NLP 5.1.0 +spark_version: 3.0 +supported: true +engine: onnx +annotator: E5Embeddings +article_header: + type: cover +use_language_switcher: "Python-Scala-Java" +--- + +## Description + +Text Embeddings by Weakly-Supervised Contrastive Pre-training. Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, Furu Wei, arXiv 2022 + +## Predicted Entities + + + +{:.btn-box} + + +[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/e5_small_v2_quantized_en_5.1.0_3.0_1692963639263.zip){:.button.button-orange.button-orange-trans.arr.button-icon} +[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/e5_small_v2_quantized_en_5.1.0_3.0_1692963639263.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3} + +## How to use + + + +
+{% include programmingLanguageSelectScalaPythonNLU.html %} +```python +embeddings = E5Embeddings.pretrained("e5_small_v2_quantized","en") \ + .setInputCols(["documents"]) \ + .setOutputCol("e5_embeddings") + +pipeline = Pipeline().setStages([document_assembler, embeddings]) +``` +```scala +val embeddings = E5Embeddings.pretrained("e5_small_v2_quantized","en") + .setInputCols(Array("document")) + .setOutputCol("e5_embeddings") +val pipeline = new Pipeline().setStages(Array(document, embeddings)) +``` +
+ +{:.model-param} +## Model Information + +{:.table-model} +|---|---| +|Model Name:|e5_small_v2_quantized| +|Compatibility:|Spark NLP 5.1.0+| +|License:|Open Source| +|Edition:|Official| +|Input Labels:|[documents]| +|Output Labels:|[e5]| +|Language:|en| +|Size:|22.1 MB| \ No newline at end of file