
    Of(                        S r SSKrSSKrSSK7  SSKJr  SSKJr  SSK7  SSK	J
r
   " S S\5      r " S	 S
\5      r " S S\5      r0 SS_SS_SS_SS_SS_SS_SS_SS_SS_SS _S!S"_S#S$_S%S&_S'S(_S)S*_S+S,_S-S._0 S/S0_S1S2_S3S4_S5S6_S7S8_S9S:_S;S<_S=S>_S?S@_SASB_SCSD_SESF_SGSH_SISJ_SKSL_SMSN_SOSN_E0 SPSQ_SRSS_STSU_SVSW_SXSY_SZS[_S\S]_S^S__S`Sa_SbSc_SdSe_SfSg_ShSi_SjSk_SlSm_SnSo_SpSq_E0 SrSs_StSu_SvSw_SxSy_SzS{_S|S}_S~S_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_E0 SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_SS_ESSSSSSSSSSSSSSSS.Erg)a  
Corpus reader for the York-Toronto-Helsinki Parsed Corpus of Old
English Prose (YCOE), a 1.5 million word syntactically-annotated
corpus of Old English prose texts. The corpus is distributed by the
Oxford Text Archive: http://www.ota.ahds.ac.uk/ It is not included
with NLTK.

The YCOE corpus is divided into 100 files, each representing
an Old English prose text. Tags used within each text complies
to the YCOE standard: https://www-users.york.ac.uk/~lang22/YCOE/YcoeHome.htm
    N)*)BracketParseCorpusReader)TaggedCorpusReader)RegexpTokenizerc                       \ rS rSrSrSS jrSS jrSS jrS rSS jr	SS	 jr
SS
 jrSS jrSS jrSS jrSS jrSrg)YCOECorpusReader   z
Corpus reader for the York-Toronto-Helsinki Parsed Corpus of Old
English Prose (YCOE), a 1.5 million word syntactically-annotated
corpus of Old English prose texts.
c                    [         R                  X/ U5        [        U R                  R	                  S5      SSUS9U l        [        U R                  R	                  S5      SS5      U l        U R
                  R                  5        Vs1 s H  o3S S iM	     nnU R                  R                  5        Vs1 s H  o3S S iM	     snU:w  a  [        S5      e[        U Vs/ s H  nS	U-  PM
     snU Vs/ s H  nS
U-  PM
     sn-   5      n[         R                  XXb5        [        U5      U l        g s  snf s  snf s  snf s  snf )Npsdz.*.psd)encodingpos.posz5Items in "psd" and "pos" subdirectories do not match.%s.psd%s.pos)CorpusReader__init__YCOEParseCorpusReaderrootjoin_psd_readerYCOETaggedCorpusReader_pos_readerfileids
ValueErrorsorted
_documents)selfr   r   f	documentsdocr   s          9/usr/lib/python3/dist-packages/nltk/corpus/reader/ycoe.pyr   YCOECorpusReader.__init__%   s$   d"h70IINN5!4(
 2$))..2GvV &*%5%5%=%=%?@%?sV%?	@ ,,44676qcrF679DWXX'01yX^y1)23#x#~34
 	d'< + A7 23s   	D25D7D<3E
Nc                     Uc  U R                   $ [        U[        5      (       a  U/nU H   nX R                  ;  d  M  [	        SU-  5      e   [        U Vs1 s H  o"SS iM	     sn5      $ s  snf )z
Return a list of document identifiers for all documents in
this corpus, or for the documents with the given file(s) if
specified.
NzFile id %s not foundr   )r   
isinstancestr_fileidsKeyErrorr   )r   r   r    s      r#   r!   YCOECorpusReader.documents9   so     ???"gs##iGA%5?@@  w/w!"vw/00/s   A,c           
          Uc  U R                   $ [        U[        5      (       a  U/n[        [	        U Vs/ s H  nSU-  PM
     snU Vs/ s H  nSU-  PM
     sn-   5      5      $ s  snf s  snf )z}
Return a list of file identifiers for the files that make up
this corpus, or that store the given document(s) if specified.
r   r   )r(   r&   r'   r   set)r   r!   r"   s      r#   r   YCOECorpusReader.fileidsI   st    
 == 	3''"I+459CC95-67Yc8c>Y78
 	
57s   A'A,c                     Uc  U R                   nOR[        U[        5      (       a  U/nU H4  nX0R                   ;  d  M  USS S;   a  [        S5      e[        SU-  5      e   U Vs/ s H	  oD SU 3PM     sn$ s  snf )zo
Helper that selects the appropriate fileids for a given set of
documents from a given subcorpus (pos or psd).
Nr   )r   r   zvExpected a document identifier, not a file identifier.  (Use corpus.documents() to get a list of document identifiers.z Document identifier %s not found.)r   r&   r'   r   )r   r!   	subcorpusdocumentds        r#   _getfileidsYCOECorpusReader._getfileidsY   s    
 I)S))&K	%??2}(88(>  ))Kh)VWW & -66Iq#Qyk"I666s   'A:c                 X    U R                   R                  U R                  US5      5      $ Nr   )r   wordsr3   r   r!   s     r#   r7   YCOECorpusReader.wordsp   &    %%d&6&6y%&HII    c                 X    U R                   R                  U R                  US5      5      $ r6   )r   sentsr3   r8   s     r#   r=   YCOECorpusReader.sentss   r:   r;   c                 X    U R                   R                  U R                  US5      5      $ r6   )r   parasr3   r8   s     r#   r@   YCOECorpusReader.parasv   r:   r;   c                 X    U R                   R                  U R                  US5      5      $ r6   )r   tagged_wordsr3   r8   s     r#   rC   YCOECorpusReader.tagged_wordsy   &    ,,T-=-=i-OPPr;   c                 X    U R                   R                  U R                  US5      5      $ r6   )r   tagged_sentsr3   r8   s     r#   rG   YCOECorpusReader.tagged_sents|   rE   r;   c                 X    U R                   R                  U R                  US5      5      $ r6   )r   tagged_parasr3   r8   s     r#   rJ   YCOECorpusReader.tagged_paras   rE   r;   c                 X    U R                   R                  U R                  US5      5      $ )Nr   )r   parsed_sentsr3   r8   s     r#   rM   YCOECorpusReader.parsed_sents   rE   r;   )r   r   r   utf8)N)__name__
__module____qualname____firstlineno____doc__r   r!   r   r3   r7   r=   r@   rC   rG   rJ   rM   __static_attributes__ r;   r#   r   r      sE    ,(1 
 7.JJJQQQQr;   r   c                       \ rS rSrSrS rSrg)r      znSpecialized version of the standard bracket parse corpus reader
that strips out (CODE ...) and (ID ...) nodes.c                     [         R                  " SSU5      n[         R                  " SU5      (       a  g [        R                  " X5      $ )Nz(?u)\((CODE|ID)[^\)]*\) z\s*\(\s*\)\s*$)resubmatchr   _parse)r   ts     r#   r_   YCOEParseCorpusReader._parse   s;    FF-r1588%q))'..t77r;   rW   N)rQ   rR   rS   rT   rU   r_   rV   rW   r;   r#   r   r      s    68r;   r   c                       \ rS rSrSS jrSrg)r      c                 J    Sn[        USS9n[        R                  " XUSUS9  g )Nz+(?u)(?<=/\.)\s+|\s*\S*_CODE\s*|\s*\S*_ID\s*T)gaps_)sepsent_tokenizer)r   r   r   )r   r   itemsr   gaps_rerh   s         r#   r   YCOETaggedCorpusReader.__init__   s*    @(t<##3~	
r;   rW   NrO   )rQ   rR   rS   rT   r   rV   rW   r;   r#   r   r      s    
r;   r   zcoadrian.o34zAdrian and Ritheuszcoaelhom.o3u   Ælfric, Supplemental Homilieszcoaelive.o3u   Ælfric's Lives of SaintscoalcuinzAlcuin De virtutibus et vitiisz
coalex.o23zAlexander's Letter to Aristotlezcoapollo.o3zApollonius of Tyrecoaugust	Augustinez	cobede.o2z$Bede's History of the English Churchzcobenrul.o3zBenedictine Rulezcoblick.o23zBlickling Homiliesz
coboeth.o2z#Boethius' Consolation of Philosophyzcobyrhtf.o3zByrhtferth's Manual	cocanedgDzCanons of Edgar (D)	cocanedgXzCanons of Edgar (X)zcocathom1.o3u   Ælfric's Catholic Homilies Izcocathom2.o3u   Ælfric's Catholic Homilies IIz
cochad.o24z
Saint ChadcochdrulzChrodegang of Metz, RulecochristophzSaint ChristopherzcochronA.o23zAnglo-Saxon Chronicle AcochronCzAnglo-Saxon Chronicle CcochronDzAnglo-Saxon Chronicle DzcochronE.o34zAnglo-Saxon Chronicle Ez	cocura.o2zCura PastoraliscocuraCzCura Pastoralis (Cotton)zcodicts.o34zDicts of Catoz
codocu1.o1zDocuments 1 (O1)zcodocu2.o12zDocuments 2 (O1/O2)z
codocu2.o2zDocuments 2 (O2)zcodocu3.o23zDocuments 3 (O2/O3)z
codocu3.o3zDocuments 3 (O3)zcodocu4.o24zDocuments 4 (O2/O4)coeluc1z Honorius of Autun, Elucidarium 1coeluc2zcoepigen.o3u   Ælfric's Epilogue to GenesiscoeuphrzSaint Euphrosynecoeustz Saint Eustace and his companions	coexodusPz
Exodus (P)	cogenesiCzGenesis (C)zcogregdC.o24zGregory's Dialogues (C)zcogregdH.o23zGregory's Dialogues (H)coherbarzPseudo-Apuleius, HerbariumzcoinspolD.o34z"Wulfstan's Institute of Polity (D)	coinspolXz"Wulfstan's Institute of Polity (X)cojameszSaint Jameszcolacnu.o23Lacnungaz
colaece.o2	Leechdomszcolaw1cn.o3zLaws, Cnut Izcolaw2cn.o3zLaws, Cnut IIzcolaw5atr.o3u   Laws, Æthelred Vzcolaw6atr.o3u   Laws, Æthelred VIz
colawaf.o2zLaws, Alfredzcolawafint.o2zAlfred's Introduction to Lawszcolawger.o34zLaws, Gerefazcolawine.ox2z	Laws, Inezcolawnorthu.o3zNorthumbra Preosta Laguzcolawwllad.o4zLaws, William I, Ladzcoleofri.o4Leofriczcolsigef.o3u   Ælfric's Letter to Sigefyrth	colsigewBu!   Ælfric's Letter to Sigeweard (B)zcolsigewZ.o34u!   Ælfric's Letter to Sigeweard (Z)colwgeatu   Ælfric's Letter to Wulfgeat	colwsigeTu    Ælfric's Letter to Wulfsige (T)zcolwsigeXa.o34u!   Ælfric's Letter to Wulfsige (Xa)zcolwstan1.o3u   Ælfric's Letter to Wulfstan Izcolwstan2.o3u   Ælfric's Letter to Wulfstan IIzcomargaC.o34zSaint Margaret (C)comargaTzSaint Margaret (T)comart1zMartyrology, Icomart2zMartyrology, IIzcomart3.o23zMartyrology, IIIzcomarvel.o23zMarvels of the EastcomaryzMary of Egyptconeotz
Saint NeotconicodAzGospel of Nicodemus (A)conicodCzGospel of Nicodemus (C)conicodDzGospel of Nicodemus (D)conicodEzGospel of Nicodemus (E)zcoorosiu.o2Orosiusz
cootest.o3
Heptateuchzcoprefcath1.o3u(   Ælfric's Preface to Catholic Homilies Izcoprefcath2.o3u)   Ælfric's Preface to Catholic Homilies IIzcoprefcura.o2zPreface to the Cura Pastoraliszcoprefgen.o3u   Ælfric's Preface to Genesiszcopreflives.o3u$   Ælfric's Preface to Lives of Saintsz"Preface to Augustine's Soliloquiesz*Pseudo-Apuleius, Medicina de quadrupedibuszHistory of the Holy Rood-TreezSeven SleeperszSt. Augustine's SoliloquieszSolomon and Saturn IzSolomon and Saturn IIu   Ælfric's De Temporibus AnnizVercelli HomilieszVercelli Homilies (E)zVercelli Homilies (L)zSaint Vincent (Bodley 343)zVindicta SalvatoriszWest-Saxon GospelszWulfstan's Homilies)coprefsolilozcoquadru.o23corood	cosevenslcosolilozcosolsat1.o4	cosolsat2z
cotempo.o3coverhom	coverhomE	coverhomLcovinceBcovinsalzcowsgosp.o3z
cowulf.o34)rU   osr\   nltk.corpus.reader.api nltk.corpus.reader.bracket_parser   nltk.corpus.reader.taggedr   nltk.corpus.reader.utilnltk.tokenizer   r   r   r   r   r!   rW   r;   r#   <module>r      s  
 
 	 $ E 8 % )eQ| eQP84 8
/ 
e(e3e .e 0	e
 3e 'e e 7e %e 'e 7e (e &e &e 3e  4!e" ,#e$ *%e& &'e( -)e* )+e, )-e. -/e0 "1e2 )3e4 ?5e6 $7e8 (9e: $;e< (=e> $?e@ (AeB 1CeD 1EeF 2GeH !IeJ 0KeL MeN OeP -QeR -SeT ,UeV 9WeX 5YeZ }[e\ :]e^ +_e` >aeb ?ced 'eef (geh .iej 4kel Nmen Koep /qer +set 9uev 2wex 4yez 8{e| .}e~ 3e@ 9AeB 4CeD 5EeF (GeH $IeJ KeL  MeN %OeP )QeR oSeT lUeV )WeX )YeZ )[e\ )]e^ 9_e` ,aeb @ced Aeef 5geh 2iej <kel 9@-!-*(0#((,%''Ie	r;   