o
    h
                     @   sr   d Z ddlZddlZddlmZ ddlZejjejjgZ	ddl
m  m  m  mZ dZdZdd Zdd	 ZdS )
z4
Tests the conversion code for the SUC3 NER dataset
    N)ZipFileu  
1	Den	den	PN	PN	UTR|SIN|DEF|SUB/OBJ	_	_	_	_	O	_	ac01b-030:2328
2	Gud	Gud	PM	PM	NOM	_	_	_	_	B	myth	ac01b-030:2329
3	giver	giva	VB	VB	PRS|AKT	_	_	_	_	O	_	ac01b-030:2330
4	ämbetet	ämbete	NN	NN	NEU|SIN|DEF|NOM	_	_	_	_	O	_	ac01b-030:2331
5	får	få	VB	VB	PRS|AKT	_	_	_	_	O	_	ac01b-030:2332
6	också	också	AB	AB		_	_	_	_	O	_	ac01b-030:2333
7	förståndet	förstånd	NN	NN	NEU|SIN|DEF|NOM	_	_	_	_	O	_	ac01b-030:2334
8	.	.	MAD	MAD		_	_	_	_	O	_	ac01b-030:2335

1	Han	han	PN	PN	UTR|SIN|DEF|SUB	_	_	_	_	O	_	aa01a-017:227
2	berättar	berätta	VB	VB	PRS|AKT	_	_	_	_	O	_	aa01a-017:228
3	anekdoten	anekdot	NN	NN	UTR|SIN|DEF|NOM	_	_	_	_	O	_	aa01a-017:229
4	som	som	HP	HP	-|-|-	_	_	_	_	O	_	aa01a-017:230
5	FN-medlaren	FN-medlare	NN	NN	UTR|SIN|DEF|NOM	_	_	_	_	O	_	aa01a-017:231
6	Brian	Brian	PM	PM	NOM	_	_	_	_	B	person	aa01a-017:232
7	Urquhart	Urquhart	PM	PM	NOM	_	_	_	_	I	person	aa01a-017:233
8	myntat	mynta	VB	VB	SUP|AKT	_	_	_	_	O	_	aa01a-017:234
9	:	:	MAD	MAD		_	_	_	_	O	_	aa01a-017:235
u   
Den	O
Gud	B-myth
giver	O
ämbetet	O
får	O
också	O
förståndet	O
.	O

Han	O
berättar	O
anekdoten	O
som	O
FN-medlaren	O
Brian	B-person
Urquhart	I-person
myntat	O
:	O
c            	   
   C   s  t  u} tj| d}d}t|d%}||d}|t	  W d   n1 s,w   Y  W d   n1 s;w   Y  d}t
|||}|dksOJ t|}| }W d   n1 sbw   Y  t | ksqJ W d   dS 1 s|w   Y  dS )zK
    Test creating a fake zip file, then converting it to an .iob file
    ztest.zipconllwNiob   )tempfileTemporaryDirectoryospathjoinr   openwrite
TEST_CONLLencodesuc_conll_to_iobextract_from_zipreadEXPECTED_IOBstrip)	tempdirzip_namein_filenamezoutfoutout_filenamenumfinresult r   U/var/www/html/env_mimamsha/lib/python3.10/site-packages/stanza/tests/ner/test_suc3.pytest_read_zip8   s"   


"r    c               
   C   s.  t  } tj| d}t|ddd}|t W d   n1 s#w   Y  d}t|dd%}t|ddd}t	||}W d   n1 sIw   Y  W d   n1 sXw   Y  |dkscJ t|}|
 }W d   n1 svw   Y  t | ksJ W d   dS 1 sw   Y  dS )z=
    Test a direct text file conversion w/o the zip file
    ztest.txtr   zutf-8)encodingNr   r   )r   r   r	   r
   r   r   r   r   r   extractr   r   r   )r   r   r   r   r   r   r   r   r   r   test_read_rawK   s"   
 

"r#   )__doc__r	   r   zipfiler   pytestmarktravispipeline
pytestmark*stanza.utils.datasets.ner.suc_conll_to_iobutilsdatasetsnerr   r   r   r    r#   r   r   r   r   <module>   s    