o
    h                     @   sd   d Z ddlZddlZddlmZ ddlmZ ejjejj	gZ
ejdddd Zd	d
 Zdd ZdS )zD
Test the MWT resplitting of preexisting tokens without word splits
    N)resplit_mwt)TEST_MODELS_DIRmodule)scopec                   C   s   t jdtdddS )z1
    A reusable pipeline with the NER module
    enztokenize,mwtgum)dir
processorspackage)stanzaPipeliner    r   r   V/var/www/html/env_mimamsha/lib/python3.10/site-packages/stanza/tests/mwt/test_utils.pypipeline   s   r   c                 C   s<  g dddgg}t || }t|jdksJ t|jd jdks"J t|jd jd jdks1J |jd jd jd jdksAJ |jd jd jd jd	ksQJ t|jd jdks]J t|jd jd jd
kslJ |jd jd jd jdks|J |jd jd jd jdksJ |jd jd jd jd	ksJ dS )z7
    Test splitting with enforced token boundaries
    Izcan'tbelieveitI can'tsleep   r         can't   r   Nr   len	sentencestokenswordstextr   r   docr   r   r   test_resplit_keep_tokens   s   
    $r$   c                 C   s   g dddgg}t || dd}t|jdksJ t|jd jdks$J t|jd jd	 jdks3J |jd jd	 jd jd
ksCJ |jd jd	 jd	 jdksSJ t|jd	 jdks_J t|jd	 jd	 jdksnJ |jd	 jd	 jd jd
ks~J |jd	 jd	 jd	 jdksJ dS )z:
    Test splitting without enforced token boundaries
    r   r   r   F)keep_tokensr   r   r   r   r   r   r   Nr   r"   r   r   r   test_resplit_no_keep_tokens,   s      $r&   )__doc__pytestr   stanza.models.mwt.utilsr   stanza.testsr   markr   travis
pytestmarkfixturer$   r&   r   r   r   r   <module>   s    

