Skip to content

Commit a95c2b6

Browse files
Models hub (#14557)
* Add model 2025-04-09-nicolasmaduro_en * Add model 2025-04-09-ascii211_pipeline_en * Add model 2025-04-09-baklan_en * Add model 2025-04-09-scottmorrisonmp_en * Add model 2025-04-09-armin_van_buuren_pipeline_en * Add model 2025-04-09-exp_w2v2t_english_wav2vec2_s878_pipeline_en * Add model 2025-04-08-wav2vec2_large_xls_r_300m_russian_pipeline_ru * Add model 2025-04-09-sent_bert_base_multilingual_cased_finetuned_yiddish_experiment_6_pipeline_xx * Add model 2025-04-09-danny_macaskill_martynashton_en * Add model 2025-04-09-alfieghill1_en * Add model 2025-04-09-milesperhoward_pipeline_en * Add model 2025-04-08-wav2vec2_xlsr_53_espeak_chuvash_ft_bak_ntsema_colab_en * Add model 2025-04-09-natesilver538_pipeline_en * Add model 2025-04-09-wav2vec2_xlsr_dendi_ddn_for_numerals_pipeline_en * Add model 2025-04-09-ofrainandruin_pipeline_en * Add model 2025-04-09-spknnk_en * Add model 2025-04-09-gitanasnauseda_maldeikiene_pipeline_en * Add model 2025-04-09-pico8degalaleo_en * Add model 2025-04-08-craft_chem_modified_biobert_large_cased_en * Add model 2025-04-09-fullbitchschol1_pipeline_en * Add model 2025-04-08-liv_garde_en * Add model 2025-04-08-rubert_base_finetuned_sayula_popoluca_ru * Add model 2025-04-09-vit_base_patch16_224_finetuned_cedar_pipeline_en * Add model 2025-04-09-wav2vec2_large_100k_voxpopuli_ft_tts_dataset_plus_data_augmentation_portuguese_pt * Add model 2025-04-09-hw1_pipeline_en * Add model 2025-04-09-beesforbo_cafe_orbitinnit_weebbutt_pipeline_en * Add model 2025-04-09-wikineural_multilingual_ner_finetuned_ner_lanakru_pipeline_xx * Add model 2025-04-09-oneonlygriffin_pipeline_en * Add model 2025-04-08-itslucikeller_pipeline_en * Add model 2025-04-09-sustainability_chatbot_pipeline_en * Add model 2025-04-09-vit_base_patch16_224_in21k_finetuned_eurosat_finetuned2_en * Add model 2025-04-09-vit_base_oxford_iiit_pets_niko132_en * Add model 2025-04-09-smids_3x_deit_tiny_adamax_001_fold4_en * Add model 2025-04-09-mri_classifier_djibri_en * Add model 
2025-04-09-glamour_ai_skin_model_en * Add model 2025-04-09-brand_renault_v2_pipeline_en * Add model 2025-04-09-hushem_5x_deit_tiny_sgd_00001_fold3_en * Add model 2025-04-09-hvvvvns_en * Add model 2025-04-09-w2v2_libri_10min_philipepper_en * Add model 2025-04-09-vit_base_patch16_224_finetuned_cifar10_phuong_tk_nguyen_en * Add model 2025-04-09-autotrain_6l0e2_ufos2_pipeline_en * Add model 2025-04-09-burmese_awesome_food_model_sharon_kurant_en * Add model 2025-04-09-autotrain_khvt4_4vmox_pipeline_en * Add model 2025-04-09-wav2vec2_base_timit_demo_colab_pinot_en * Add model 2025-04-09-dialogpt_marge_en * Add model 2025-04-08-itslucikeller_en * Add model 2025-04-09-wav2vec2_large_xls_r_300m_sakha_pipeline_en * Add model 2025-04-09-dialopgpt_small_harrypotter_en * Add model 2025-04-09-ckinzthompson_pipeline_en * Add model 2025-04-09-natesilver538_en * Add model 2025-04-09-sent_bert_large_retrained_2_epochs_pipeline_en * Add model 2025-04-09-fine_tuned_gpt_project_en * Add model 2025-04-08-task_assigner_model_en * Add model 2025-04-08-biolinkbert_base_finetuned_ner_pipeline_en * Add model 2025-04-09-wav2vec2_base_timit_demo_colab90_en * Add model 2025-04-09-dbert_ner_pipeline_en * Add model 2025-04-08-vit_base_oxford_iiit_pets_wilbur1240_pipeline_en * Add model 2025-04-09-brand_mobilize_v1_en * Add model 2025-04-09-deleteevelyn_pipeline_en * Add model 2025-04-09-wav2vec2_8_pipeline_en * Add model 2025-04-09-hushem_5x_deit_small_sgd_00001_fold5_pipeline_en * Add model 2025-04-09-wav2vec2_large_xls_r_300m_tamil_colab_aakhilesh_pipeline_en * Add model 2025-04-08-mc_kirundi_en * Add model 2025-04-09-sent_smlm_bert_pipeline_en * Add model 2025-04-08-sent_bert_c1_english_german_pipeline_en * Add model 2025-04-09-genesis_harrybotter_en * Add model 2025-04-08-project_code_py_pipeline_en * Add model 2025-04-09-sent_drclips_pipeline_en * Add model 2025-04-09-akasarahjean_pipeline_en * Add model 2025-04-09-gpt_imdb_hinge_beta_0_1_en * Add model 2025-04-09-kyliejenner_pipeline_en * 
Add model 2025-04-09-turtle_species_classification_en * Add model 2025-04-09-vit_base_patch16_224_in21k_achyudev_pipeline_en * Add model 2025-04-09-sent_dam_bert_base_mlm_msmarco_trec_covid_en * Add model 2025-04-09-waste_detector_pipeline_en * Add model 2025-04-09-dpakman_en * Add model 2025-04-08-lynnbee01_pipeline_en * Add model 2025-04-08-dialogpt_small_rick_kshaunish_pipeline_en * Add model 2025-04-09-vit_female_age_classification_pipeline_en * Add model 2025-04-07-one_crk10_m0_5_e5_b128_l6_pipeline_en * Add model 2025-04-09-distilbert_token_itr0_0_0001_editorials_01_03_2022_15_20_12_en * Add model 2025-04-09-smids_10x_deit_small_adamax_001_fold4_en * Add model 2025-04-08-the_velvet_underground_en * Add model 2025-04-09-hushem_5x_deit_tiny_adamax_001_fold2_en * Add model 2025-04-08-parikpatelcfa_en * Add model 2025-04-09-bertbek_ner_uznews_pipeline_uz * Add model 2025-04-09-dialogpt_marge_pipeline_en * Add model 2025-04-08-wav2vec2_large_xls_r_300m_kor_lr_3e_3_en * Add model 2025-04-09-hushem_1x_deit_tiny_sgd_00001_fold3_en * Add model 2025-04-09-sent_bert_base_frozen_generics_mlm_en * Add model 2025-04-09-soashworth_pipeline_en * Add model 2025-04-08-bert_ner_ep5_pad_50_finetuned_ner_pipeline_en * Add model 2025-04-09-gpt2_bash_history_baseline_pipeline_en * Add model 2025-04-09-flutterbot_en * Add model 2025-04-07-frankietime_en * Add model 2025-04-09-hushem_5x_deit_small_sgd_0001_fold4_en * Add model 2025-04-08-bmu_finetuned_pubmedbert_mlm_medquad_en * Add model 2025-04-09-db_slr_1_1e_pipeline_en * Add model 2025-04-09-saudiah_repat_someone_470_pipeline_en * Add model 2025-04-09-sent_cxr_bioclinicalbert_v1_en * Add model 2025-04-09-xlsr_vorarlbergerisch_en * Add model 2025-04-09-sent_bert_base_multilingual_uncased_pretrained_xx * Add model 2025-04-08-emotion_classification_dafa_w_en * Add model 2025-04-09-wav2vec2_base_timit_demo_google_colab_atgarcia_pipeline_en * Add model 2025-04-08-bert_finetuned_ner_cti_en * Add model 
2025-04-09-sent_arabic_monomodel_monotok_en * Add model 2025-04-09-sent_schwurpert_pipeline_de * Add model 2025-04-08-wav2vec2_large_xls_r_300m_hindi_devendr_en * Add model 2025-04-08-dialogpt_medium_harry_pipeline_en * Add model 2025-04-09-gpt_2_finetuning_airaid_en * Add model 2025-04-08-mchammer_pipeline_en * Add model 2025-04-09-wav2vec2_large_xls_r_300m_kor_11385_2_en * Add model 2025-04-09-sent_bert_base_stackoverflow_comments_2m_pipeline_en * Add model 2025-04-08-shape_nato_pipeline_en * Add model 2025-04-09-burmese_awesome_wnut_model_ai_pipeline_en * Add model 2025-04-09-vit_female_age_classification_en * Add model 2025-04-09-vit_base_oxford_iiit_pets_niko132_pipeline_en * Add model 2025-04-09-koriposting_en * Add model 2025-04-09-rockdrigoma_pipeline_en * Add model 2025-04-09-vit_base_patch16_224_finetuned_cedar_en * Add model 2025-04-09-williamblakebot_pipeline_en * Add model 2025-04-09-bert_base_train_book_ent_15p_ra_en * Add model 2025-04-09-tinybert_train_book_ent_15p_en * Add model 2025-04-08-exp_w2v2t_indonesian_xlsr_53_s358_id * Add model 2025-04-08-bert_finetuned_ner_accelerate_atichets_pipeline_en * Add model 2025-04-09-brad_buchsbaum_en * Add model 2025-04-09-honeytech_pipeline_en * Add model 2025-04-09-extended_gender_classifier_en * Add model 2025-04-09-smids_1x_deit_tiny_rms_001_fold3_pipeline_en * Add model 2025-04-09-icelynjennings_pipeline_en * Add model 2025-04-09-jackposobiec_pipeline_en * Add model 2025-04-09-sent_finnish_monomodel_monotok_pipeline_en * Add model 2025-04-08-exp5_10partition_modelo_asl6000_pipeline_en * Add model 2025-04-08-output_pipeline_pt * Add model 2025-04-09-bert_finetuned_ner_huizhoucheng_en * Add model 2025-04-09-icelynjennings_en * Add model 2025-04-09-sent_tiny_mlm_glue_mnli_from_scratch_custom_tokenizer_expand_vocab_en * Add model 2025-04-09-sent_drclips_en * Add model 2025-04-09-sent_nbme_bio_clinicalbert_en * Add model 2025-04-09-finetune_model_bert_en * Add model 2025-04-09-bert_finetuned_ner_fundrais123_en 
* Add model 2025-04-09-filler_username_pipeline_en * Add model 2025-04-09-gpt2_chatbot_kuttersn_en * Add model 2025-04-09-musebiihi_pipeline_en * Add model 2025-04-09-disconcision_pipeline_en * Add model 2025-04-09-arxiv_classifier_debertav3_en * Add model 2025-04-08-wenger_en * Add model 2025-04-08-burmese_awesome_model_recod_en * Add model 2025-04-09-exp_w2v2t_portuguese_norwegian_pretraining_s84_pt * Add model 2025-04-09-sent_bert_base_uncased_finetuned_mol_mlm_0_3_en * Add model 2025-04-09-sent_tlm_rct_20k_large_scale_pipeline_en * Add model 2025-04-08-jen_122_pipeline_en * Add model 2025-04-09-dkulchar_pipeline_en * Add model 2025-04-09-pico8degalaleo_pipeline_en * Add model 2025-04-09-dialogpt_medium_captainprice_extended_en * Add model 2025-04-09-wav2vec2_gujarati_stt_pipeline_en * Add model 2025-04-08-smids_5x_deit_small_rms_00001_fold1_en * Add model 2025-04-09-sent_minilm_l12_h384_uncased_finetuned_imdb_en * Add model 2025-04-09-bert_suicide_detection_hk_large_nepal_bhasa_pipeline_en * Add model 2025-04-09-distilbert_base_uncased_news_sentiment_finetuned_english_en * Add model 2025-04-08-monopolyfornite_en * Add model 2025-04-08-dialogpt_small_shy_en * Add model 2025-04-09-distilbert_token_itr0_0_0001_editorials_01_03_2022_15_20_12_pipeline_en * Add model 2025-04-09-kehlani_pipeline_en * Add model 2025-04-09-burmese_awesome_humanaction_model_pipeline_en * Add model 2025-04-09-tigers_side_vit_en * Add model 2025-04-09-stp_classifier_13_1_en * Add model 2025-04-08-nepali_grammar_error_detection_20250311_1323_en * Add model 2025-04-09-mldz4shad_en * Add model 2025-04-09-exp_w2v2t_swedish_northern_sami_xlsr_53_s328_en * Add model 2025-04-09-bert_base_uncased_token_itr0_0_0001_train_essays_test_test_set_05_03_2022_05_58_31_en * Add model 2025-04-09-wav2vec2_xlsr_53_marathi_large_en * Add model 2025-04-09-hushem_5x_deit_small_adamax_0001_fold1_pipeline_en * Add model 2025-04-09-lora_toxic_comment_pipeline_en * Add model 
2025-04-09-absa_turkish_bert_based_small_tr * Add model 2025-04-08-smids_1x_deit_tiny_rms_001_fold5_en * Add model 2025-04-09-wav2vec2_base_timit_demo_colab_bsen_pipeline_en * Add model 2025-04-09-bert_base_turkish_sentiment_analysis_pipeline_tr * Add model 2025-04-09-bert_base_turkish_sentiment_analysis_tr * Add model 2025-04-09-bert_base_turkish_offensive_pipeline_tr * Add model 2025-04-09-document_type_identification_en * Add model 2025-04-09-sent_bnbert_pipeline_en * Add model 2025-04-09-wav2vec2_large_xls_r_300m_tamil_colab_aakhilesh_en * Add model 2025-04-08-sent_mbert_tlm_sent_english_chinese_en * Add model 2025-04-08-pii_protection_model_pipeline_en * Add model 2025-04-09-bert_tiny_finetuned_xglue_ner_en * Add model 2025-04-08-wav2vec2_large_xls_r_300m_urdu_colab_pipeline_en * Add model 2025-04-09-sent_bert_base_uncased_issues_128_xxr_pipeline_en * Add model 2025-04-09-sent_mbert_tlm_chat_english_german_en * Add model 2025-04-09-db_slr_1_1e_en * Add model 2025-04-08-cher_pipeline_en * Add model 2025-04-09-wav2vec2_base_libir_zenodo_pipeline_en * Add model 2025-04-09-vit_epochs5_batch32_lr5e_05_size224_tiles4_seed3_q3_dropout_v2_en * Add model 2025-04-09-wav2vec2_base_test_pipeline_en * Add model 2025-04-09-lesseyecontact_en * Add model 2025-04-09-wav2vec2_base_swbd_turn_eos_long_short_utt_removed_5percent_pipeline_en * Add model 2025-04-09-micbucci_pipeline_en * Add model 2025-04-09-veganseltzer_pipeline_en * Add model 2025-04-08-dialogpt_medium_ff7_en * Add model 2025-04-09-sent_storieslm_v1_1945_pipeline_en * Add model 2025-04-09-sent_mbert_tlm_chat_english_chinese_pipeline_en * Add model 2025-04-09-dialogpt_medium_milo_en * Add model 2025-04-09-dataandme_en * Add model 2025-04-09-lumetroid_en * Add model 2025-04-09-dialogpt_medium_milo_pipeline_en * Add model 2025-04-09-bbcqos_fitslut63_kellyg_official_en * Add model 2025-04-09-stp_classifier_13_1_pipeline_en * Add model 2025-04-09-vit_base_beans_demo_v5_hwooo92_pipeline_en * Add model 
2025-04-09-ridiculouscrabs_en * Add model 2025-04-08-autotrain_20_12_2022_exam_part3_2543877946_pipeline_en * Add model 2025-04-09-zemfira_en * Add model 2025-04-09-michaeltrazzi_pipeline_en * Add model 2025-04-09-absa_turkish_bert_based_small_pipeline_tr * Add model 2025-04-09-gunna_pipeline_en * Add model 2025-04-09-ourqueeningreen_pipeline_en * Add model 2025-04-09-jenslennartsson_pipeline_en * Add model 2025-04-09-sent_bottleneckbertsmall_en * Add model 2025-04-09-dialogpt_mid_hpai_en * Add model 2025-04-09-shelbythanna_en * Add model 2025-04-09-macintoxic_en * Add model 2025-04-09-square_rundi_square_rundi_second_vote_full_pic_25_age_gender_en * Add model 2025-04-09-sent_first_try_rubert_200_16_16_25ep_en * Add model 2025-04-09-postpostpostr_en * Add model 2025-04-09-richardsocher_en * Add model 2025-04-09-bert_base_german_cased_finetuned_subj_v1_pipeline_en * Add model 2025-04-09-guggersylvain_pipeline_en * Add model 2025-04-09-guggersylvain_en * Add model 2025-04-09-macegrunow_en * Add model 2025-04-09-macegrunow_pipeline_en * Add model 2025-04-09-nueclear333_pipeline_en * Add model 2025-04-09-olikuchi_en * Add model 2025-04-09-wav2vec2_large_xlsr_53_full_train_full_train_pipeline_en * Add model 2025-04-09-lanalilligant_en * Add model 2025-04-08-peppa_pipeline_en * Add model 2025-04-08-3_epochs_classifier_en * Add model 2025-04-08-bert_base_greek_uncased_v1_finetuned_ner_pipeline_en * Add model 2025-04-09-deit_base_patch16_224_rice_leaf_disease_augmented_tagalog_pipeline_en * Add model 2025-04-08-wav2vec2_large_xlsr_estonian_m3hrdadfi_pipeline_et * Add model 2025-04-08-sent_bert_base_uncased_multi_128_pipeline_en * Add model 2025-04-09-mspunks_en * Add model 2025-04-09-mspunks_pipeline_en * Add model 2025-04-09-vit_base_patch16_224_masaratti_pipeline_en * Add model 2025-04-09-burmese_awesome_emotion_identifier_model_en * Add model 2025-04-09-wav2vec2_large_xls_r_300m_chichewa_colab_en * Add model 2025-04-09-lesseyecontact_pipeline_en * Add model 
2025-04-07-dialogpt_small_rick_havokx_pipeline_en * Add model 2025-04-08-wav2vec2_large_uralic_voxpopuli_v2_sami_parl_ext_ft_en * Add model 2025-04-09-dnlklr_pipeline_en * Add model 2025-04-09-wav2vec2_base_cynthia_timit_pipeline_en * Add model 2025-04-09-mri_classifier_djibri_pipeline_en --------- Co-authored-by: ahmedlone127 <[email protected]>
1 parent ac203f2 commit a95c2b6

File tree

31,012 files changed

+2489912
-0
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

31,012 files changed

+2489912
-0
lines changed
Lines changed: 102 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,102 @@
1+
---
2+
layout: model
3+
title: Multilingual BioLORD-2023-M XlmRoBertaSentenceEmbeddings from FremyCompany
4+
author: John Snow Labs
5+
name: sent_xlm_roberta_biolord_2023_m
6+
date: 2025-02-14
7+
tags: [multilingual, sentence_embeddings, xlm_roberta, open_source, xx, onnx]
8+
task: Embeddings
9+
language: xx
10+
edition: Spark NLP 5.5.2
11+
spark_version: 3.0
12+
supported: true
13+
engine: onnx
14+
annotator: XlmRoBertaSentenceEmbeddings
15+
article_header:
16+
type: cover
17+
use_language_switcher: "Python-Scala-Java"
18+
---
19+
20+
## Description
21+
22+
Pretrained `XlmRoBertaSentenceEmbeddings` model, adapted from Hugging Face and curated to provide scalability and production-readiness using Spark NLP. `sent_xlm_roberta_biolord_2023_m` is a multilingual model originally trained by FremyCompany. It supports English, Spanish, French, German, Dutch, Danish and Swedish.
23+
24+
## Predicted Entities
25+
26+
27+
28+
{:.btn-box}
29+
<button class="button button-orange" disabled>Live Demo</button>
30+
<button class="button button-orange" disabled>Open in Colab</button>
31+
[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/sent_xlm_roberta_biolord_2023_m_xx_5.5.2_3.0_1739548358592.zip){:.button.button-orange.button-orange-trans.arr.button-icon}
32+
[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/sent_xlm_roberta_biolord_2023_m_xx_5.5.2_3.0_1739548358592.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3}
33+
34+
## How to use
35+
36+
37+
38+
<div class="tabs-box" markdown="1">
39+
{% include programmingLanguageSelectScalaPythonNLU.html %}
40+
```python
41+
documentAssembler = DocumentAssembler() \
42+
.setInputCol("text") \
43+
.setOutputCol("document")
44+
45+
embeddings = XlmRoBertaSentenceEmbeddings.pretrained("sent_xlm_roberta_biolord_2023_m","xx") \
46+
.setInputCols(["document"]) \
47+
.setOutputCol("embeddings")
48+
49+
pipeline = Pipeline().setStages([documentAssembler, embeddings])
50+
51+
data = spark.createDataFrame([["Disfruto trabajando con Spark-NLP."]]).toDF("text")
52+
pipelineModel = pipeline.fit(data)
53+
result = pipelineModel.transform(data)
54+
```
55+
```scala
56+
val documentAssembler = new DocumentAssembler()
57+
.setInputCol("text")
58+
.setOutputCol("document")
59+
60+
val embeddings = XlmRoBertaSentenceEmbeddings
61+
.pretrained("sent_xlm_roberta_biolord_2023_m", "xx")
62+
.setInputCols(Array("document"))
63+
.setOutputCol("embeddings")
64+
65+
val pipeline = new Pipeline().setStages(Array(documentAssembler, embeddings))
66+
67+
68+
val data = Seq("Disfruto trabajando con Spark-NLP.").toDF("text")
69+
70+
val pipelineModel = pipeline.fit(data)
71+
val result = pipelineModel.transform(data)
72+
```
73+
</div>
74+
75+
## Results
76+
77+
```bash
78+
+----------------------------------+----------------------------------------------------------------------+----------------------------------------------------------------------+
79+
| text| document| sentence_embeddings|
80+
+----------------------------------+----------------------------------------------------------------------+----------------------------------------------------------------------+
81+
|Disfruto trabajando con Spark-NLP.|[{document, 0, 33, Disfruto trabajando con Spark-NLP., {sentence ->...|[{sentence_embeddings, 0, 33, Disfruto trabajando con Spark-NLP., {...|
82+
+----------------------------------+----------------------------------------------------------------------+----------------------------------------------------------------------+
83+
84+
```
85+
86+
{:.model-param}
87+
## Model Information
88+
89+
{:.table-model}
90+
|---|---|
91+
|Model Name:|sent_xlm_roberta_biolord_2023_m|
92+
|Compatibility:|Spark NLP 5.5.2+|
93+
|License:|Open Source|
94+
|Edition:|Official|
95+
|Input Labels:|[document]|
96+
|Output Labels:|[xlm_sentence_embeddings]|
97+
|Language:|xx|
98+
|Size:|1.0 GB|
99+
100+
## References
101+
102+
https://huggingface.co/FremyCompany/BioLORD-2023-M
Lines changed: 172 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,172 @@
1+
---
2+
layout: model
3+
title: LLaVA v1.5 7B Q4 GGUF
4+
author: John Snow Labs
5+
name: llava_v1.5_7b_Q4_0_gguf
6+
date: 2025-01-18
7+
tags: [gguf, llamacpp, llava, en, quantized, open_source]
8+
task: Image Captioning
9+
language: en
10+
edition: Spark NLP 6.0.0
11+
spark_version: 3.0
12+
supported: true
13+
engine: llamacpp
14+
annotator: AutoGGUFVisionModel
15+
article_header:
16+
type: cover
17+
use_language_switcher: "Python-Scala-Java"
18+
---
19+
20+
## Description
21+
22+
LLaVA is an open-source chatbot trained by fine-tuning LLaMA/Vicuna on GPT-generated multimodal instruction-following data. It is an auto-regressive language model, based on the transformer architecture.
23+
24+
Originally from https://huggingface.co/Mozilla/llava-v1.5-7b-llamafile
25+
26+
## Predicted Entities
27+
28+
29+
30+
{:.btn-box}
31+
<button class="button button-orange" disabled>Live Demo</button>
32+
<button class="button button-orange" disabled>Open in Colab</button>
33+
[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/llava_v1.5_7b_Q4_0_gguf_en_6.0.0_3.0_1737207768652.zip){:.button.button-orange.button-orange-trans.arr.button-icon}
34+
[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/llava_v1.5_7b_Q4_0_gguf_en_6.0.0_3.0_1737207768652.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3}
35+
36+
## How to use
37+
38+
39+
40+
<div class="tabs-box" markdown="1">
41+
{% include programmingLanguageSelectScalaPythonNLU.html %}
42+
```python
43+
import sparknlp
44+
from sparknlp.base import *
45+
from sparknlp.annotator import *
46+
from pyspark.ml import Pipeline
47+
from pyspark.sql.functions import lit
48+
49+
documentAssembler = DocumentAssembler() \
50+
.setInputCol("caption") \
51+
.setOutputCol("caption_document")
52+
imageAssembler = ImageAssembler() \
53+
.setInputCol("image") \
54+
.setOutputCol("image_assembler")
55+
56+
imagesPath = "src/test/resources/image/"
57+
data = ImageAssembler \
58+
.loadImagesAsBytes(spark, imagesPath) \
59+
.withColumn("caption", lit("Caption this image.")) # Add a caption to each image.
60+
61+
nPredict = 40
62+
model = AutoGGUFVisionModel.pretrained() \
63+
.setInputCols(["caption_document", "image_assembler"]) \
64+
.setOutputCol("completions") \
65+
.setBatchSize(4) \
66+
.setNGpuLayers(99) \
67+
.setNCtx(4096) \
68+
.setMinKeep(0) \
69+
.setMinP(0.05) \
70+
.setNPredict(nPredict) \
71+
.setNProbs(0) \
72+
.setPenalizeNl(False) \
73+
.setRepeatLastN(256) \
74+
.setRepeatPenalty(1.18) \
75+
.setStopStrings(["</s>", "Llama:", "User:"]) \
76+
.setTemperature(0.05) \
77+
.setTfsZ(1) \
78+
.setTypicalP(1) \
79+
.setTopK(40) \
80+
.setTopP(0.95)
81+
82+
pipeline = Pipeline().setStages([documentAssembler, imageAssembler, model])
83+
pipeline.fit(data).transform(data) \
84+
.selectExpr("reverse(split(image.origin, '/'))[0] as image_name", "completions.result") \
85+
.show(truncate = False)
86+
87+
88+
```
89+
```scala
90+
import com.johnsnowlabs.nlp.ImageAssembler
91+
import com.johnsnowlabs.nlp.annotator._
92+
import com.johnsnowlabs.nlp.base._
93+
import org.apache.spark.ml.Pipeline
94+
import org.apache.spark.sql.DataFrame
95+
import org.apache.spark.sql.functions.lit
96+
97+
val documentAssembler = new DocumentAssembler()
98+
.setInputCol("caption")
99+
.setOutputCol("caption_document")
100+
101+
val imageAssembler = new ImageAssembler()
102+
.setInputCol("image")
103+
.setOutputCol("image_assembler")
104+
105+
val imagesPath = "src/test/resources/image/"
106+
val data: DataFrame = ImageAssembler
107+
.loadImagesAsBytes(ResourceHelper.spark, imagesPath)
108+
.withColumn("caption", lit("Caption this image.")) // Add a caption to each image.
109+
110+
val nPredict = 40
111+
val model = AutoGGUFVisionModel.pretrained()
112+
.setInputCols("caption_document", "image_assembler")
113+
.setOutputCol("completions")
114+
.setBatchSize(4)
115+
.setNGpuLayers(99)
116+
.setNCtx(4096)
117+
.setMinKeep(0)
118+
.setMinP(0.05f)
119+
.setNPredict(nPredict)
120+
.setNProbs(0)
121+
.setPenalizeNl(false)
122+
.setRepeatLastN(256)
123+
.setRepeatPenalty(1.18f)
124+
.setStopStrings(Array("</s>", "Llama:", "User:"))
125+
.setTemperature(0.05f)
126+
.setTfsZ(1)
127+
.setTypicalP(1)
128+
.setTopK(40)
129+
.setTopP(0.95f)
130+
131+
val pipeline = new Pipeline().setStages(Array(documentAssembler, imageAssembler, model))
132+
pipeline
133+
.fit(data)
134+
.transform(data)
135+
.selectExpr("reverse(split(image.origin, '/'))[0] as image_name", "completions.result")
136+
.show(truncate = false)
137+
138+
```
139+
</div>
140+
141+
## Results
142+
143+
```bash
144+
+-----------------+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
145+
|image_name |result |
146+
+-----------------+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
147+
|palace.JPEG |[ The image depicts a large, ornate room with high ceilings and beautifully decorated walls. There are several chairs placed throughout the space, some of which have cushions] |
148+
|egyptian_cat.jpeg|[ The image features two cats lying on a pink surface, possibly a bed or sofa. One cat is positioned towards the left side of the scene and appears to be sleeping while holding] |
149+
|hippopotamus.JPEG|[ A large brown hippo is swimming in a body of water, possibly an aquarium. The hippo appears to be enjoying its time in the water and seems relaxed as it floats] |
150+
|hen.JPEG |[ The image features a large chicken standing next to several baby chickens. In total, there are five birds in the scene: one adult and four young ones. They appear to be gathered together] |
151+
|ostrich.JPEG |[ The image features a large, long-necked bird standing in the grass. It appears to be an ostrich or similar species with its head held high and looking around. In addition to] |
152+
|junco.JPEG |[ A small bird with a black head and white chest is standing on the snow. It appears to be looking at something, possibly food or another animal in its vicinity. The scene takes place out] |
153+
|bluetick.jpg |[ A dog with a red collar is sitting on the floor, looking at something. The dog appears to be staring into the distance or focusing its attention on an object in front of it.] |
154+
|chihuahua.jpg |[ A small brown dog wearing a sweater is sitting on the floor. The dog appears to be looking at something, possibly its owner or another animal in the room. It seems comfortable and relaxed]|
155+
|tractor.JPEG |[ A man is sitting in the driver's seat of a green tractor, which has yellow wheels and tires. The tractor appears to be parked on top of an empty field with] |
156+
|ox.JPEG |[ A large bull with horns is standing in a grassy field.] |
157+
+-----------------+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
158+
```
159+
160+
{:.model-param}
161+
## Model Information
162+
163+
{:.table-model}
164+
|---|---|
165+
|Model Name:|llava_v1.5_7b_Q4_0_gguf|
166+
|Compatibility:|Spark NLP 6.0.0+|
167+
|License:|Open Source|
168+
|Edition:|Official|
169+
|Input Labels:|[caption_document, image_assembler]|
170+
|Output Labels:|[completions]|
171+
|Language:|en|
172+
|Size:|4.2 GB|
Lines changed: 86 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,86 @@
1+
---
2+
layout: model
3+
title: English 20230818214706 BertForQuestionAnswering from dkqjrm
4+
author: John Snow Labs
5+
name: 20230818214706
6+
date: 2025-01-29
7+
tags: [en, open_source, onnx, question_answering, bert]
8+
task: Question Answering
9+
language: en
10+
edition: Spark NLP 5.5.1
11+
spark_version: 3.0
12+
supported: true
13+
engine: onnx
14+
annotator: BertForQuestionAnswering
15+
article_header:
16+
type: cover
17+
use_language_switcher: "Python-Scala-Java"
18+
---
19+
20+
## Description
21+
22+
Pretrained BertForQuestionAnswering model, adapted from Hugging Face and curated to provide scalability and production-readiness using Spark NLP. `20230818214706` is an English model originally trained by dkqjrm.
23+
24+
{:.btn-box}
25+
<button class="button button-orange" disabled>Live Demo</button>
26+
<button class="button button-orange" disabled>Open in Colab</button>
27+
[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/20230818214706_en_5.5.1_3.0_1738185378925.zip){:.button.button-orange.button-orange-trans.arr.button-icon}
28+
[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/20230818214706_en_5.5.1_3.0_1738185378925.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3}
29+
30+
## How to use
31+
32+
33+
34+
<div class="tabs-box" markdown="1">
35+
{% include programmingLanguageSelectScalaPythonNLU.html %}
36+
```python
37+
38+
documentAssembler = MultiDocumentAssembler() \
39+
.setInputCols(["question", "context"]) \
40+
.setOutputCols(["document_question", "document_context"])
41+
42+
spanClassifier = BertForQuestionAnswering.pretrained("20230818214706","en") \
43+
.setInputCols(["document_question","document_context"]) \
44+
.setOutputCol("answer")
45+
46+
pipeline = Pipeline().setStages([documentAssembler, spanClassifier])
47+
data = spark.createDataFrame([["What framework do I use?","I use spark-nlp."]]).toDF("question", "context")
48+
pipelineModel = pipeline.fit(data)
49+
pipelineDF = pipelineModel.transform(data)
50+
51+
```
52+
```scala
53+
54+
val documentAssembler = new MultiDocumentAssembler()
55+
.setInputCols(Array("question", "context"))
56+
.setOutputCols(Array("document_question", "document_context"))
57+
58+
val spanClassifier = BertForQuestionAnswering.pretrained("20230818214706", "en")
59+
.setInputCols(Array("document_question","document_context"))
60+
.setOutputCol("answer")
61+
62+
val pipeline = new Pipeline().setStages(Array(documentAssembler, spanClassifier))
63+
val data = Seq(("What framework do I use?","I use spark-nlp.")).toDF("question", "context")
64+
val pipelineModel = pipeline.fit(data)
65+
val pipelineDF = pipelineModel.transform(data)
66+
67+
```
68+
</div>
69+
70+
{:.model-param}
71+
## Model Information
72+
73+
{:.table-model}
74+
|---|---|
75+
|Model Name:|20230818214706|
76+
|Compatibility:|Spark NLP 5.5.1+|
77+
|License:|Open Source|
78+
|Edition:|Official|
79+
|Input Labels:|[document_question, document_context]|
80+
|Output Labels:|[answer]|
81+
|Language:|en|
82+
|Size:|1.2 GB|
83+
84+
## References
85+
86+
https://huggingface.co/dkqjrm/20230818214706

0 commit comments

Comments
 (0)