Skip to content

Commit 4b63405

Browse files
2024-12-14-deberta_v3_finetuned_en (#14479)
* Add model 2024-12-15-whisper_small_hausa_bible_tts_en * Add model 2024-12-15-whisper_small_tamil_lingalingeswaran_ta * Add model 2024-12-15-whisper_small_hausa_bible_tts_pipeline_en * Add model 2024-12-15-whisper_small_tamil_lingalingeswaran_pipeline_ta * Add model 2024-12-15-whisper_tiny_artcreativity_photography_tips_en * Add model 2024-12-15-whisper_tiny_artcreativity_photography_tips_pipeline_en * Add model 2024-12-15-whisper_tiny_med_pipeline_en * Add model 2024-12-15-whisper_tiny_med_en * Add model 2024-12-15-whisper_small_divehi_legendarynight_ar * Add model 2024-12-15-whisper_small_divehi_legendarynight_pipeline_ar * Add model 2024-12-15-whisper_medium_lithuanian_phone_16khz_v1_en * Add model 2024-12-15-whisper_small_v3_60000_en * Add model 2024-12-15-whisper_medium_lithuanian_phone_16khz_v1_pipeline_en * Add model 2024-12-15-whisper_small_v3_60000_pipeline_en * Add model 2024-12-15-whisperfinetuning_en * Add model 2024-12-15-whisperfinetuning_pipeline_en * Add model 2024-12-15-xlm_roberta_base_trimmed_french_10000_tweet_sentiment_french_en * Add model 2024-12-15-xlm_roberta_base_trimmed_french_10000_tweet_sentiment_french_pipeline_en * Add model 2024-12-15-xlm_roberta_base_nepal_bhasa_vietnam_train_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_replace_tfidf_en * Add model 2024-12-15-xlm_roberta_base_nepal_bhasa_vietnam_train_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_replace_tfidf_pipeline_en * Add model 2024-12-15-scenario_non_kd_scr_d2_data_cl_massive_all_1_1_en * Add model 2024-12-15-scenario_non_kd_scr_d2_data_cl_massive_all_1_1_pipeline_en * Add model 2024-12-15-roberta_genai_ara_en * Add model 2024-12-15-xlm_roberta_base_finetuned_kinyarwanda_kinyarwanda_finetuned_kinte_tweet_finetuned_kinyarwanda_sent3_en * Add model 2024-12-15-roberta_genai_ara_pipeline_en * Add model 2024-12-15-scenario_tcr_data_cl_cardiff_cl_only2_pipeline_en * Add model 2024-12-15-xlm_roberta_base_mixed_aug_delete_en * Add model 
2024-12-15-xlm_roberta_base_mixed_aug_delete_pipeline_en * Add model 2024-12-15-twitter_xlm_roberta_base_sentiment_cardiffnlp_en * Add model 2024-12-15-xlm_roberta_base_finetuned_kinyarwanda_kinyarwanda_finetuned_kinte_tweet_finetuned_kinyarwanda_sent3_pipeline_en * Add model 2024-12-15-twitter_xlm_roberta_base_sentiment_cardiffnlp_pipeline_en * Add model 2024-12-15-scenario_tcr_data_cl_cardiff_cl_only2_en * Add model 2024-12-15-furina_seed42_eng_kinyarwanda_amh_cross_latin_2e_05_pipeline_en * Add model 2024-12-15-furina_seed42_eng_kinyarwanda_amh_cross_latin_2e_05_en * Add model 2024-12-15-scenario_tcr_data_amazonscience_massive_all_1_1_model_xlm_roberta_base_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_insert_tfidf_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_insert_tfidf_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_swap_2_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_delete_en * Add model 2024-12-15-xlm_roberta_base_finetuned_m_share_facts_en * Add model 2024-12-15-xlm_roberta_base_vietnam_aug_replace_phobert_en * Add model 2024-12-15-sentimientos_massa_pipeline_es * Add model 2024-12-15-xlm_roberta_base_vietnam_aug_replace_phobert_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_delete_pipeline_en * Add model 2024-12-15-xlm_roberta_base_balance_mixed_aug_replace_tfidf_en * Add model 2024-12-15-xlm_roberta_base_balance_mixed_aug_replace_tfidf_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_backtranslation_2_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_insert_synonym_1_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_insert_synonym_1_pipeline_en * Add model 2024-12-15-xlm_roberta_base_finetuned_m_share_facts_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_replace_synonym_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_insert_tfidf_1_en * Add model 2024-12-15-custom_classifier_hire_decision_en * Add 
model 2024-12-15-xlm_roberta_base_mixed_delete_en * Add model 2024-12-15-sentimientos_massa_es * Add model 2024-12-15-xlm_roberta_base_finetuned_detests24_en * Add model 2024-12-15-xlm_roberta_base_finetuned_detests24_pipeline_en * Add model 2024-12-15-xlm_roberta_base_balance_vietnam_aug_backtranslation_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_replace_synonym_pipeline_en * Add model 2024-12-15-xlm_roberta_base_wnli_100_pipeline_en * Add model 2024-12-15-mmarco_mminilmv2_l12_h384_v1_xx * Add model 2024-12-15-scenario_tcr_data_amazonscience_massive_all_1_1_model_xlm_roberta_base_pipeline_en * Add model 2024-12-15-mmarco_mminilmv2_l12_h384_v1_pipeline_xx * Add model 2024-12-15-xlm_roberta_base_wnli_100_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_swap_2_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_swap_pipeline_en * Add model 2024-12-15-xlm_roberta_base_balance_vietnam_aug_backtranslation_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_vietnam_aug_swap_en * Add model 2024-12-15-intent_classification_model_roberta_en * Add model 2024-12-15-xlm_roberta_base_finetuned_kinyarwanda_kinyarwanda_sent1_en * Add model 2024-12-15-xlm_roberta_base_mixed_delete_pipeline_en * Add model 2024-12-15-custom_classifier_hire_decision_pipeline_en * Add model 2024-12-15-intent_classification_model_roberta_pipeline_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_backtranslation_2_pipeline_en * Add model 2024-12-15-malayalam_qa_model_pipeline_en * Add model 2024-12-15-xlm_roberta_base_finetuned_kinyarwanda_kinyarwanda_sent1_pipeline_en * Add model 2024-12-15-roberta_finetuned_state_en * Add model 2024-12-15-xlm_roberta_base_final_mixed_aug_insert_tfidf_1_pipeline_en * Add model 2024-12-15-malayalam_qa_model_en * Add model 2024-12-15-roberta_vmw_mrqa_plus_en * Add model 2024-12-15-roberta_updated_model_02_pipeline_en * Add model 2024-12-15-roberta_finetuned_state_pipeline_en * Add model 
2024-12-15-roberta_vmw_mrqa_plus_pipeline_en * Add model 2024-12-15-individual_carbon_emission_roberta_en * Add model 2024-12-15-roberta_updated_model_02_en * Add model 2024-12-15-individual_carbon_emission_roberta_pipeline_en * Add model 2024-12-15-roberta_vmw_mrqa_en * Add model 2024-12-15-roberta_vmw_mrqa_pipeline_en * Add model 2024-12-15-al_roberta_pipeline_en * Add model 2024-12-15-al_roberta_en * Add model 2024-12-15-debiasing_pre_trained_contextualised_embeddings_albert_en * Add model 2024-12-15-debiasing_pre_trained_contextualised_embeddings_albert_pipeline_en * Add model 2024-12-15-albert_base_v2_finetuned_bible_en * Add model 2024-12-15-albert_base_v2_finetuned_bible_pipeline_en * Add model 2024-12-15-watermark_detector_en * Add model 2024-12-15-watermark_detector_pipeline_en * Add model 2024-12-15-vit_base_nsfw_detector_adamcodd_en * Add model 2024-12-15-ethnicity_test_v003_pipeline_en * Add model 2024-12-15-ethnicity_test_v003_en * Add model 2024-12-15-vit_base_nsfw_detector_adamcodd_pipeline_en * Add model 2024-12-15-sent_chungli_ao_xlm_roberta_news_en * Add model 2024-12-15-sent_chungli_ao_xlm_roberta_news_pipeline_en * Add model 2024-12-15-bert_tiny_lda_20_cola_en * Add model 2024-12-15-bert_tiny_lda_20_cola_pipeline_en * Add model 2024-12-15-m365_h1_base_en * Add model 2024-12-15-test_bed_type_model_classifier_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_emotion_cotysong113_en * Add model 2024-12-15-distilbert_base_uncased_imdb_sentiment_pipeline_en * Add model 2024-12-15-truviz_ai_detect_en * Add model 2024-12-15-m365_h1_base_pipeline_en * Add model 2024-12-15-distilbert_sst5_padding40model_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_emotion_hoibui_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_qqp_kietb_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_qqp_kietb_en * Add model 2024-12-15-bert_finetuned_imdb_sentiment_en * Add model 2024-12-15-imdbert_en * Add model 
2024-12-15-truviz_ai_detect_nepal_bhasa_en * Add model 2024-12-15-emotion_classification_model_matthewb245_pipeline_en * Add model 2024-12-15-finetuned_distilbert_with_amazon_fine_food_reviews_en * Add model 2024-12-15-burmese_finetuned_sentiment_model_tejasbits_pipeline_en * Add model 2024-12-15-db_fe2_3_2_1_en * Add model 2024-12-15-db_fe2_5_2_1_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_cola_boudreaup_en * Add model 2024-12-15-georgian_retrained_v1_en * Add model 2024-12-15-emotion_classification_model_matthewb245_en * Add model 2024-12-15-categor_ai_23_cats_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_distilled_clinc_vanillathunder_en * Add model 2024-12-15-food_not_food_text_classifier_distilbert_base_uncased_pipeline_en * Add model 2024-12-15-xlm_roberta_base_mixed_aug_replace_w2v_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_clinc_moraudiet_pipeline_en * Add model 2024-12-15-xlm_roberta_base_finetuning_wrime_random4000_epoch6_test01_en * Add model 2024-12-15-rulebert_v0_3_k0_it * Add model 2024-12-15-xlm_roberta_base_finetuning_wrime_random4000_epoch6_test01_pipeline_en * Add model 2024-12-15-distilbert_agnews_padding60model_en * Add model 2024-12-15-truviz_ai_detect_nepal_bhasa_pipeline_en * Add model 2024-12-15-amharic_news_classification_pipeline_en * Add model 2024-12-15-burmese_finetuned_sentiment_model_tejasbits_en * Add model 2024-12-15-l1_classifier_copexp_en * Add model 2024-12-15-l1_classifier_copexp_pipeline_en * Add model 2024-12-15-scenario_norwegian_kd_weight_reset_data_smsa_model_xlm_roberta_base_en * Add model 2024-12-15-xlm_roberta_finetuned_emojis_2_client_toxic_krum_iid_fed_en * Add model 2024-12-15-m365_h2_data_analysis_and_management_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_amazon_sentiment_analysis_en * Add model 2024-12-15-db_fe2_3_1_pipeline_en * Add model 2024-12-15-scenario_non_kd_scr_d2_data_cardiffnlp_tweet_sentiment_multilingual_all3_xx * Add model 
2024-12-15-xlm_roberta_base_finetuned_m_help_seller_en * Add model 2024-12-15-scenario_non_kd_scr_d2_data_cardiffnlp_tweet_sentiment_multilingual_all3_pipeline_xx * Add model 2024-12-15-xlm_roberta_base_finetuned_m_help_seller_pipeline_en * Add model 2024-12-15-distilbert_agnews_padding60model_pipeline_en * Add model 2024-12-15-finetuning_distillbert_amazon_polarity_pipeline_en * Add model 2024-12-15-intent_analysis_v0_en * Add model 2024-12-15-multilingual_sentiment_analysis_xx * Add model 2024-12-15-fm_tc_hybrid_xml_catsp_end_en * Add model 2024-12-15-mnli_trained_xlm_roberta_en * Add model 2024-12-15-scenario_non_kd_pr_copy_cdf_english_d2_data_english_cardiff_eng_only_beta_pipeline_en * Add model 2024-12-15-furina_seed42_eng_kinyarwanda_amh_en * Add model 2024-12-15-distilbert_p1_pipeline_en * Add model 2024-12-15-xlm_roberta_base_trimmed_spanish_xnli_spanish_pipeline_en * Add model 2024-12-15-xlm_roberta_base_trimmed_spanish_xnli_spanish_en * Add model 2024-12-15-scenario_non_kd_pr_copy_cdf_cl_d2_data_cl_cardiff_cl_only_gamma_en * Add model 2024-12-15-distilbert_base_uncased_amazon_sentiment_analysis_pipeline_en * Add model 2024-12-15-scenario_non_kd_pr_copy_cdf_cl_d2_data_cl_cardiff_cl_only_gamma_pipeline_en * Add model 2024-12-15-georgian_retrained_v3_en * Add model 2024-12-15-distillbert_uncased_ag_news_en * Add model 2024-12-15-crypto_sustainability_news_text_classifier_distilbert_base_uncased_pipeline_en * Add model 2024-12-15-xlm_roberta_finetuned_emojis_2_client_toxic_krum_iid_fed_pipeline_en * Add model 2024-12-15-scenario_norwegian_kd_weight_reset_data_smsa_model_xlm_roberta_base_pipeline_en * Add model 2024-12-15-intent_analysis_v0_pipeline_en * Add model 2024-12-15-bge_reranker_base_ttkhang202_pipeline_en * Add model 2024-12-15-truviz_ai_detect_pipeline_en * Add model 2024-12-15-xlmr_romanian_english_all_shuffled_1986_test1000_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_emotion_hoibui_en * Add model 2024-12-15-trymodel_en * 
Add model 2024-12-15-xlm_roberta_base_seed42_original_amh_hau_eng_train_en * Add model 2024-12-15-xlm_roberta_base_seed42_original_amh_hau_eng_train_pipeline_en * Add model 2024-12-15-kaggle_nlp_with_desaster_tweets_01_en * Add model 2024-12-15-news_category_classifier_pipeline_en * Add model 2024-12-15-distilbert_food_en * Add model 2024-12-15-bge_reranker_base_ttkhang202_en * Add model 2024-12-15-distilbert_base_uncased_imdb_sentiment_en * Add model 2024-12-15-deberta_v3_base_squadv2_pipeline_en * Add model 2024-12-15-distillbert_uncased_ag_news_pipeline_en * Add model 2024-12-15-amharic_news_classification_en * Add model 2024-12-15-log_analysis_model_distilbert_pipeline_en * Add model 2024-12-15-m365_h2_data_analysis_and_management_en * Add model 2024-12-15-phishing_email_detection_pipeline_en * Add model 2024-12-15-categor_ai_23_cats_en * Add model 2024-12-15-finetuning_distillbert_amazon_polarity_en * Add model 2024-12-15-learn_hf_mood_detection_text_classifier_distilbert_base_uncased_en * Add model 2024-12-15-bert_base_lda_mnli_en * Add model 2024-12-15-db_fe2_3_2_1_pipeline_en * Add model 2024-12-15-deberta_v3_base_squadv2_en * Add model 2024-12-15-bert_finetuned_imdb_sentiment_pipeline_en * Add model 2024-12-15-db_fe2_5_2_1_pipeline_en * Add model 2024-12-15-imdbert_pipeline_en * Add model 2024-12-15-xlmr_english_german_all_shuffled_2020_test1000_en * Add model 2024-12-15-emotion_endpoint_test_en * Add model 2024-12-15-bert_base_lda_mnli_pipeline_en * Add model 2024-12-15-affilgood_ner_v2_en * Add model 2024-12-15-distilbert_food_pipeline_en * Add model 2024-12-15-news_category_classifier_en * Add model 2024-12-15-phishing_email_detection_en * Add model 2024-12-15-fm_tc_hybrid_xml_catsp_end_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_emotion_cotysong113_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_cola_boudreaup_pipeline_en * Add model 2024-12-15-distilbert_sst5_padding40model_en * Add model 
2024-12-15-distilbert_base_uncased_finetuned_cola_veipsf_en * Add model 2024-12-15-kaggle_nlp_with_desaster_tweets_01_pipeline_en * Add model 2024-12-15-emotion_endpoint_test_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_distilled_clinc_vanillathunder_pipeline_en * Add model 2024-12-15-roberta_ganda_cased_malay_ner_test_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_cola_veipsf_pipeline_en * Add model 2024-12-15-food_not_food_text_classifier_distilbert_base_uncased_en * Add model 2024-12-15-bert_base_lda_20_cola_pipeline_en * Add model 2024-12-15-affilgood_ner_v2_pipeline_en * Add model 2024-12-15-log_analysis_model_distilbert_en * Add model 2024-12-15-crypto_sustainability_news_text_classifier_distilbert_base_uncased_en * Add model 2024-12-15-learn_hf_mood_detection_text_classifier_distilbert_base_uncased_pipeline_en * Add model 2024-12-15-test_bed_type_model_classifier_pipeline_en * Add model 2024-12-15-trymodel_pipeline_en * Add model 2024-12-15-distilbert_base_uncased_finetuned_clinc_moraudiet_en * Add model 2024-12-15-xlm_roberta_base_mixed_aug_replace_w2v_pipeline_en * Add model 2024-12-15-xlm_roberta_base_finetuned_panx_french_lee_soha_en * Add model 2024-12-15-xlm_roberta_base_finetuned_panx_german_french_cotysong113_en * Add model 2024-12-15-xlm_roberta_base_finetuned_panx_german_mealduct_en * Add model 2024-12-15-scenario_non_kd_pr_copy_cdf_english_d2_data_english_cardiff_eng_only_beta_en * Add model 2024-12-15-georgian_retrained_v3_pipeline_en * Add model 2024-12-15-xlmr_english_german_all_shuffled_2020_test1000_pipeline_en * Add model 2024-12-15-finetuned_distilbert_with_amazon_fine_food_reviews_pipeline_en * Add model 2024-12-15-xlm_roberta_base_finetuned_panx_french_lee_soha_pipeline_en * Add model 2024-12-15-xlmr_romanian_english_all_shuffled_1986_test1000_en * Add model 2024-12-15-roberta_ganda_cased_malay_ner_test_pipeline_en * Add model 2024-12-15-rulebert_v0_3_k0_pipeline_it * Add model 
2024-12-15-furina_seed42_eng_kinyarwanda_amh_pipeline_en * Add model 2024-12-15-distilbert_p1_en * Add model 2024-12-15-multilingual_sentiment_analysis_pipeline_xx * Add model 2024-12-15-georgian_retrained_v1_pipeline_en * Add model 2024-12-15-bert_base_lda_20_cola_en * Add model 2024-12-15-db_fe2_3_1_en * Add model 2024-12-15-mnli_trained_xlm_roberta_pipeline_en * Add model 2024-12-15-clip_hugging_face_en * Add model 2024-12-15-clip_hugging_face_pipeline_en * Add model 2024-12-15-clip_saban_vit_l_14_en * Add model 2024-12-15-clip_seed_vit_en * Add model 2024-12-15-clip_seed_vit_pipeline_en * Add model 2024-12-15-clip_zabir_en * Add model 2024-12-15-clip_zabir_pipeline_en * Add model 2024-12-15-clip_saban_vit_l_14_pipeline_en --------- Co-authored-by: ahmedlone127 <[email protected]>
1 parent ec286d8 commit 4b63405

File tree

750 files changed

+60133
-0
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

750 files changed

+60133
-0
lines changed
Lines changed: 94 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,94 @@
1+
---
2+
layout: model
3+
title: English 1a5e2b8e XlmRoBertaForTokenClassification from Osquery
4+
author: John Snow Labs
5+
name: 1a5e2b8e
6+
date: 2024-12-14
7+
tags: [en, open_source, onnx, token_classification, xlm_roberta, ner]
8+
task: Named Entity Recognition
9+
language: en
10+
edition: Spark NLP 5.5.1
11+
spark_version: 3.0
12+
supported: true
13+
engine: onnx
14+
annotator: XlmRoBertaForTokenClassification
15+
article_header:
16+
type: cover
17+
use_language_switcher: "Python-Scala-Java"
18+
---
19+
20+
## Description
21+
22+
Pretrained XlmRoBertaForTokenClassification model, adapted from Hugging Face and curated to provide scalability and production-readiness using Spark NLP. `1a5e2b8e` is an English model originally trained by Osquery.
23+
24+
{:.btn-box}
25+
<button class="button button-orange" disabled>Live Demo</button>
26+
<button class="button button-orange" disabled>Open in Colab</button>
27+
[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/1a5e2b8e_en_5.5.1_3.0_1734214604186.zip){:.button.button-orange.button-orange-trans.arr.button-icon}
28+
[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/1a5e2b8e_en_5.5.1_3.0_1734214604186.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3}
29+
30+
## How to use
31+
32+
33+
34+
<div class="tabs-box" markdown="1">
35+
{% include programmingLanguageSelectScalaPythonNLU.html %}
36+
```python
37+
38+
documentAssembler = DocumentAssembler() \
39+
.setInputCol('text') \
40+
.setOutputCol('document')
41+
42+
tokenizer = Tokenizer() \
43+
.setInputCols(['document']) \
44+
.setOutputCol('token')
45+
46+
tokenClassifier = XlmRoBertaForTokenClassification.pretrained("1a5e2b8e","en") \
47+
    .setInputCols(["document","token"]) \
48+
.setOutputCol("ner")
49+
50+
pipeline = Pipeline().setStages([documentAssembler, tokenizer, tokenClassifier])
51+
data = spark.createDataFrame([["I love spark-nlp"]]).toDF("text")
52+
pipelineModel = pipeline.fit(data)
53+
pipelineDF = pipelineModel.transform(data)
54+
55+
```
56+
```scala
57+
58+
val documentAssembler = new DocumentAssembler()
59+
  .setInputCol("text")
60+
  .setOutputCol("document")
61+
62+
val tokenizer = new Tokenizer()
63+
.setInputCols("document")
64+
.setOutputCol("token")
65+
66+
val tokenClassifier = XlmRoBertaForTokenClassification.pretrained("1a5e2b8e", "en")
67+
  .setInputCols(Array("document","token"))
68+
.setOutputCol("ner")
69+
70+
val pipeline = new Pipeline().setStages(Array(documentAssembler, tokenizer, tokenClassifier))
71+
val data = Seq("I love spark-nlp").toDS.toDF("text")
72+
val pipelineModel = pipeline.fit(data)
73+
val pipelineDF = pipelineModel.transform(data)
74+
75+
```
76+
</div>
77+
78+
{:.model-param}
79+
## Model Information
80+
81+
{:.table-model}
82+
|---|---|
83+
|Model Name:|1a5e2b8e|
84+
|Compatibility:|Spark NLP 5.5.1+|
85+
|License:|Open Source|
86+
|Edition:|Official|
87+
|Input Labels:|[document, token]|
88+
|Output Labels:|[ner]|
89+
|Language:|en|
90+
|Size:|769.7 MB|
91+
92+
## References
93+
94+
https://huggingface.co/Osquery/1a5e2b8e
Lines changed: 70 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,70 @@
1+
---
2+
layout: model
3+
title: English 1a5e2b8e_pipeline pipeline XlmRoBertaForTokenClassification from Osquery
4+
author: John Snow Labs
5+
name: 1a5e2b8e_pipeline
6+
date: 2024-12-14
7+
tags: [en, open_source, pipeline, onnx]
8+
task: Named Entity Recognition
9+
language: en
10+
edition: Spark NLP 5.5.1
11+
spark_version: 3.0
12+
supported: true
13+
annotator: PipelineModel
14+
article_header:
15+
type: cover
16+
use_language_switcher: "Python-Scala-Java"
17+
---
18+
19+
## Description
20+
21+
Pretrained XlmRoBertaForTokenClassification, adapted from Hugging Face and curated to provide scalability and production-readiness using Spark NLP. `1a5e2b8e_pipeline` is an English model originally trained by Osquery.
22+
23+
{:.btn-box}
24+
<button class="button button-orange" disabled>Live Demo</button>
25+
<button class="button button-orange" disabled>Open in Colab</button>
26+
[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/1a5e2b8e_pipeline_en_5.5.1_3.0_1734214743900.zip){:.button.button-orange.button-orange-trans.arr.button-icon}
27+
[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/1a5e2b8e_pipeline_en_5.5.1_3.0_1734214743900.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3}
28+
29+
## How to use
30+
31+
32+
33+
<div class="tabs-box" markdown="1">
34+
{% include programmingLanguageSelectScalaPythonNLU.html %}
35+
```python
36+
37+
pipeline = PretrainedPipeline("1a5e2b8e_pipeline", lang = "en")
38+
annotations = pipeline.transform(df)
39+
40+
```
41+
```scala
42+
43+
val pipeline = new PretrainedPipeline("1a5e2b8e_pipeline", lang = "en")
44+
val annotations = pipeline.transform(df)
45+
46+
```
47+
</div>
48+
49+
{:.model-param}
50+
## Model Information
51+
52+
{:.table-model}
53+
|---|---|
54+
|Model Name:|1a5e2b8e_pipeline|
55+
|Type:|pipeline|
56+
|Compatibility:|Spark NLP 5.5.1+|
57+
|License:|Open Source|
58+
|Edition:|Official|
59+
|Language:|en|
60+
|Size:|769.7 MB|
61+
62+
## References
63+
64+
https://huggingface.co/Osquery/1a5e2b8e
65+
66+
## Included Models
67+
68+
- DocumentAssembler
69+
- TokenizerModel
70+
- XlmRoBertaForTokenClassification
Lines changed: 70 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,70 @@
1+
---
2+
layout: model
3+
title: Multilingual affilgood_ner_multilingual_pipeline pipeline XlmRoBertaForTokenClassification from SIRIS-Lab
4+
author: John Snow Labs
5+
name: affilgood_ner_multilingual_pipeline
6+
date: 2024-12-14
7+
tags: [xx, open_source, pipeline, onnx]
8+
task: Named Entity Recognition
9+
language: xx
10+
edition: Spark NLP 5.5.1
11+
spark_version: 3.0
12+
supported: true
13+
annotator: PipelineModel
14+
article_header:
15+
type: cover
16+
use_language_switcher: "Python-Scala-Java"
17+
---
18+
19+
## Description
20+
21+
Pretrained XlmRoBertaForTokenClassification, adapted from Hugging Face and curated to provide scalability and production-readiness using Spark NLP. `affilgood_ner_multilingual_pipeline` is a Multilingual model originally trained by SIRIS-Lab.
22+
23+
{:.btn-box}
24+
<button class="button button-orange" disabled>Live Demo</button>
25+
<button class="button button-orange" disabled>Open in Colab</button>
26+
[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/affilgood_ner_multilingual_pipeline_xx_5.5.1_3.0_1734213424755.zip){:.button.button-orange.button-orange-trans.arr.button-icon}
27+
[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/affilgood_ner_multilingual_pipeline_xx_5.5.1_3.0_1734213424755.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3}
28+
29+
## How to use
30+
31+
32+
33+
<div class="tabs-box" markdown="1">
34+
{% include programmingLanguageSelectScalaPythonNLU.html %}
35+
```python
36+
37+
pipeline = PretrainedPipeline("affilgood_ner_multilingual_pipeline", lang = "xx")
38+
annotations = pipeline.transform(df)
39+
40+
```
41+
```scala
42+
43+
val pipeline = new PretrainedPipeline("affilgood_ner_multilingual_pipeline", lang = "xx")
44+
val annotations = pipeline.transform(df)
45+
46+
```
47+
</div>
48+
49+
{:.model-param}
50+
## Model Information
51+
52+
{:.table-model}
53+
|---|---|
54+
|Model Name:|affilgood_ner_multilingual_pipeline|
55+
|Type:|pipeline|
56+
|Compatibility:|Spark NLP 5.5.1+|
57+
|License:|Open Source|
58+
|Edition:|Official|
59+
|Language:|xx|
60+
|Size:|1.0 GB|
61+
62+
## References
63+
64+
https://huggingface.co/SIRIS-Lab/affilgood-NER-multilingual
65+
66+
## Included Models
67+
68+
- DocumentAssembler
69+
- TokenizerModel
70+
- XlmRoBertaForTokenClassification
Lines changed: 94 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,94 @@
1+
---
2+
layout: model
3+
title: Multilingual affilgood_ner_multilingual XlmRoBertaForTokenClassification from SIRIS-Lab
4+
author: John Snow Labs
5+
name: affilgood_ner_multilingual
6+
date: 2024-12-14
7+
tags: [xx, open_source, onnx, token_classification, xlm_roberta, ner]
8+
task: Named Entity Recognition
9+
language: xx
10+
edition: Spark NLP 5.5.1
11+
spark_version: 3.0
12+
supported: true
13+
engine: onnx
14+
annotator: XlmRoBertaForTokenClassification
15+
article_header:
16+
type: cover
17+
use_language_switcher: "Python-Scala-Java"
18+
---
19+
20+
## Description
21+
22+
Pretrained XlmRoBertaForTokenClassification model, adapted from Hugging Face and curated to provide scalability and production-readiness using Spark NLP. `affilgood_ner_multilingual` is a Multilingual model originally trained by SIRIS-Lab.
23+
24+
{:.btn-box}
25+
<button class="button button-orange" disabled>Live Demo</button>
26+
<button class="button button-orange" disabled>Open in Colab</button>
27+
[Download](https://s3.amazonaws.com/auxdata.johnsnowlabs.com/public/models/affilgood_ner_multilingual_xx_5.5.1_3.0_1734213370612.zip){:.button.button-orange.button-orange-trans.arr.button-icon}
28+
[Copy S3 URI](s3://auxdata.johnsnowlabs.com/public/models/affilgood_ner_multilingual_xx_5.5.1_3.0_1734213370612.zip){:.button.button-orange.button-orange-trans.button-icon.button-copy-s3}
29+
30+
## How to use
31+
32+
33+
34+
<div class="tabs-box" markdown="1">
35+
{% include programmingLanguageSelectScalaPythonNLU.html %}
36+
```python
37+
38+
documentAssembler = DocumentAssembler() \
39+
.setInputCol('text') \
40+
.setOutputCol('document')
41+
42+
tokenizer = Tokenizer() \
43+
.setInputCols(['document']) \
44+
.setOutputCol('token')
45+
46+
tokenClassifier = XlmRoBertaForTokenClassification.pretrained("affilgood_ner_multilingual","xx") \
47+
    .setInputCols(["document","token"]) \
48+
.setOutputCol("ner")
49+
50+
pipeline = Pipeline().setStages([documentAssembler, tokenizer, tokenClassifier])
51+
data = spark.createDataFrame([["I love spark-nlp"]]).toDF("text")
52+
pipelineModel = pipeline.fit(data)
53+
pipelineDF = pipelineModel.transform(data)
54+
55+
```
56+
```scala
57+
58+
val documentAssembler = new DocumentAssembler()
59+
  .setInputCol("text")
60+
  .setOutputCol("document")
61+
62+
val tokenizer = new Tokenizer()
63+
.setInputCols("document")
64+
.setOutputCol("token")
65+
66+
val tokenClassifier = XlmRoBertaForTokenClassification.pretrained("affilgood_ner_multilingual", "xx")
67+
  .setInputCols(Array("document","token"))
68+
.setOutputCol("ner")
69+
70+
val pipeline = new Pipeline().setStages(Array(documentAssembler, tokenizer, tokenClassifier))
71+
val data = Seq("I love spark-nlp").toDS.toDF("text")
72+
val pipelineModel = pipeline.fit(data)
73+
val pipelineDF = pipelineModel.transform(data)
74+
75+
```
76+
</div>
77+
78+
{:.model-param}
79+
## Model Information
80+
81+
{:.table-model}
82+
|---|---|
83+
|Model Name:|affilgood_ner_multilingual|
84+
|Compatibility:|Spark NLP 5.5.1+|
85+
|License:|Open Source|
86+
|Edition:|Official|
87+
|Input Labels:|[document, token]|
88+
|Output Labels:|[ner]|
89+
|Language:|xx|
90+
|Size:|1.0 GB|
91+
92+
## References
93+
94+
https://huggingface.co/SIRIS-Lab/affilgood-NER-multilingual

0 commit comments

Comments
 (0)