o
    hq                     @   sn	  d Z ddlZdZi dddddd	d
dddddddddddddddddddddd d!d"d!d#d$i d%dd&d'd(d)d*d+d,d!d-d.d/d0d1d2d3d4d5dd6d7d8d9d:d;d<d!d=d>d?d@dAdBi dCdDdEdFdGdFdHddIdJdKd!dLddMdNdOdPdQdRdSdTdUdVdWdXdYdZd[d\d]d^d_d`i dadbdcdBdddedfdgdhdidjdkdldmdndodpdqdrdsdtdudvdwdxdydzd{d|d}d~dddi dddddddddddddddddd!dd@dddddddddddddddddddddddZeg dZi ddddddd
dddddddddddddddddddd dd"dd#dd%di d&dd(dd*dd,dd-dd/dd1dd3dd5dd6dd8dd:dd<dd=dd?ddAddCdi dEddGddHddIddKddLddMddOddQddSddUddWddYdd[dd]dd_ddadi dcdddddfdgdhddjddlddnddpddvddzdd|dddddddddddddi ddddddddddddddddddddddddddddddddZdd ZeeZd ddddiZ	e	Z
ddidddddddddddddddddddddddÜddiddidƜZi ddǓddȓddɓddddǓddʓd d˓d"dʓd&dd(dd,dʓd<dǓd=dǓdHd̓dKddLddOdǓddddddddddddddddМZdddddwdidќZeeZeeZdddddddddddddӜd!diddid՜Zi dd֓ddדddؓddddٓd dړd"dۓd&dܓd(dݓd,dޓd<dߓdCd!dEdFdKddLddOddcd͓dgdddddddddddddZdddddddZddddddddddd
ZddiZdfdiZdddddddddddd Z	 i ddddddd dd"dd&dd(dd,dd6d	d<d
d=ddEddHddKddLddcddzddddddddZddiZi dddddddddddd dd!d"d#d$d$dd%d&d'dd(dd)dd*d+d,d-d-dd.i d/d0d	d1d2d3d4d5d6d7d8d9d
d:dddd;d<d=d>d?d@dAdBdCdDdEdFdGdHdIdJdKi ddLddMddNddOddPdQdRdSdTdUdVdWdXdYdZdd*d[d\dd]d^d_d`dadd%dbdcdddedfZdgdh ZdS (i  z
Constants for default packages, default pretrains, charlms, etc

Separated from prepare_resources.py so that other modules can use the
same lists / maps without importing the resources script and possibly
causing a circular import
    Npackagesaf	afriboomsangnerthusarpadtbehsebgbtbbxrbdtcaancoracopscriptoriumcspdtcuproielcyccgdaddtdegsdelgdtencombinedesetedteufaperdtfitdtfofarpahcfrfroprofiterolegaidtgdarcosgglctggotgrcperseusgvcadhanhboptnkhehihdtbhrsethsbufalhuszegedhyarmtdphywidisicepahcitjakaglckkktbkmrmgkokaistkpvlatticekyktmulaittblijgltltalksnislvlvtblzhkyotomrmtmudtmyucsymyvjrnbbokmaalndslsdcnlalpinonnnynorskolokkpporvtorototabounpcmnscplpdbptbosqueqafarabiziqpmphilotisqtdsagtrorrtru	syntagrussavedicsdisrasksnkslssjsmegiellasqsrsv	talbankenswlsslctattbtemtgthorchidtrimstugudtiuudtbvtbwtbcavalgsdsimpud)ukurviwoxclzh-hanszh-hantmultilingual)	r   rq   rs   rw   r}   r   r   r   r   fasttextwikiconll17fasttext157utahisprasglovemokhar   r   r   r   r   r   r   c                 C   s<   t | }tD ]}||d  qt D ]}t| ||< q|S N)dictno_pretrain_languagespopspecific_default_pretrainskeys)default_treebanksdefault_pretrainslang r   \/var/www/html/env_mimamsha/lib/python3.10/site-packages/stanza/resources/default_packages.pybuild_default_pretrains   s   r   biomedmimic)craftgeniar   aqmar)conll03germeval2014fasttextcrawlglove)anatembc4chemdbc5cdr
bionlp13cgjnlpbalinnaeusncbi_diseases800	ontonotessampler   i2b2	radiology)r   conll02)r   wikinerr   lst20)r   r   r   r!   rm   r   r   oscarnerthus1024ccwikinewswiki1billion	oscar2023l3cube	oscar2022gigaword)rb   re   ri   rm   ry   r{   r   r   r   r   r   r   r   r   r   )r   r   pubmed)r   r   r   r   r   r   r   r   r   r   r   r   norne)r   rB   ro   nchltaqmar_charlmbsnlp19r   zontonotes-ww-multi_charlmr   armanturkuwikinergold_charlmiahlt_charlmfbkkazNERDnkjpsinersuc3shufflestarlanglangukvlspr   )re   ri   rm   ro   ry   r   r   r   r   r   r   r   r   sstplus_charlmsb10k_charlmtass2020_charlml3cube_charlmvsfc_charlm
ren_charlm)r   r   r!   rb   r   r   arboretum_charlmspmrl_charlmzptb3-revised_charlmcombined_charlmicon_charlm
vit_charlm
alt_charlmcintil_charlmvlsp22_charlmzctb-51_charlm)
r   r   r   r!   rG   rJ   rK   r{   r   r   starlang_charlmaltzudcoref_xlm-roberta-lorazdeeph_muril-large-cased-lora)r   r   r   r   r!   r+   r<   ri   ro   ry   r   z(aubmindlab/araelectra-base-discriminatorzvesteinn/ScandiBERTz,german-nlp-group/electra-base-german-uncasedz"google/electra-large-discriminatorz*bertin-project/bertin-roberta-base-spanishz'HooshvareLab/bert-base-parsbert-uncasedz#TurkuNLP/bert-base-finnish-cased-v1zcamembert/camembert-largezpranaydeeps/Ancient-Greek-BERTz#imvladikon/alephbertgimmel-base-512google/muril-large-casedzxlm-roberta-basezindolem/indobert-base-uncasedz2dbmdz/electra-base-italian-xxl-cased-discriminatorzrinna/japanese-roberta-basezl3cube-pune/marathi-robertazallegro/herbert-base-casedz&neuralmind/bert-large-portuguese-casedz"dbmdz/bert-base-turkish-128k-casedzvinai/phobert-largez,hfl/chinese-electra-180g-large-discriminator)r{   r   r   r   r   r      zasafaya/bert-base-arabiczasafaya-bertzaubmind-electrazaubmindlab/bert-base-arabertv2zaubmind-bert
scandibertzbert-base-german-casedzdbmdz/bert-base-german-casedzdbmdz-bert-german-casedzgerman-nlp-electrazbert-base-multilingual-casedmbertzxlm-roberta-largezelectra-largezmicrosoft/deberta-v3-largezdeberta-v3-largezbertin-robertaparsbertbertz$benjamin/roberta-base-wechsel-frenchzwechsel-robertazcamembert-basezcamembert-largez7dbmdz/electra-base-french-europeana-cased-discriminatorzdbmdz-electrazgrc-pranaydeepsz"lgessler/microbert-ancient-greek-mzgrc-microbert-mz#lgessler/microbert-ancient-greek-mxzgrc-microbert-mxz$lgessler/microbert-ancient-greek-mxpzgrc-microbert-mxpz&altsoph/bert-base-ancientgreek-uncasedzgrc-altsophalephbertgimmelindobertzindobenchmark/indobert-large-p1zindobenchmark-large-p1zindobenchmark/indobert-base-p1zindobenchmark-base-p1z$indobenchmark/indobert-lite-large-p1zindobenchmark-lite-large-p1z#indobenchmark/indobert-lite-base-p1zindobenchmark-lite-base-p1zindobenchmark/indobert-large-p2zindobenchmark-large-p2zindobenchmark/indobert-base-p2zindobenchmark-base-p2z$indobenchmark/indobert-lite-large-p2zindobenchmark-lite-large-p2z#indobenchmark/indobert-lite-base-p2zindobenchmark-lite-base-p2electrazrinna-robertazl3cube-marathi-robertaherbert	bertimbauzmonsoon-nlp/tamillion	tamillionzlgessler/microbert-tamil-mzta-microbert-mzlgessler/microbert-tamil-mxpzta-microbert-mxpzl3cube-pune/tamil-bertzl3cube-tamil-bertzd42kw01f/Tamil-RoBERTazta-d42kw01f-robertazvinai/phobert-basezphobert-basezphobert-largezgoogle-bert/bert-base-chinesezgoogle-bert-chinesezhfl/chinese-roberta-wwm-extzhfl-roberta-chinesezai4bharat/indic-bertz
indic-bertzmuril-base-casedzmuril-large-cased)zgoogle/muril-base-casedr  c                  C   s4   t dd t D } | d t| dd d} | S )z
    Return a list of all the transformer nicknames

    We return a list so that we can sort them in decreasing key length
    c                 s   s    | ]\}}|V  qd S r   r   ).0keyvaluer   r   r   	<genexpr>  s    z"known_nicknames.<locals>.<genexpr>transformerc                 S   s
   t |  S r   )len)xr   r   r   <lambda>  s   
 z!known_nicknames.<locals>.<lambda>)r  )listTRANSFORMER_NICKNAMESitemsappendsorted)	nicknamesr   r   r   known_nicknames  s   
r  )__doc__copyPACKAGESr   r?   r   r   r   r   pos_pretrainsdepparse_pretrainsner_pretrainsdefault_charlmspos_charlmsdeepcopydepparse_charlmslemma_charlmsner_charlmsdefault_nersdefault_sentimentdefault_constituencyoptional_constituencydefault_tokenizeroptional_corefTRANSFORMERSTRANSFORMER_LAYERSr  r  r   r   r   r   <module>   s   	
 !"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWa	
 !"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTX/	
&

	
#
(Lsv 	    +  4  I  P  V  f               "    .	  
  Y
 !$%&'(+.123456789<?BEHKLMNORUVYZ[^_
c