
    g	                     6    d Z ddlmZ ddlmZ  G d de      Zy)z5
UDHR corpus reader. It mostly deals with encodings.
    )PlaintextCorpusReader)find_corpus_fileidsc                   0     e Zd Zg dZh dZd fd	Z xZS )UdhrCorpusReader))z
.*-Latin1$zlatin-1)z
.*-Hebrew$hebrew)z
.*-Arabic$cp1256)zCzech_Cesky-UTF8cp1250)zPolish-Latin2r	   )zPolish_Polski-Latin2r	   )z.*-Cyrillic$cyrillic)z.*-SJIS$SJIS)z
.*-GB2312$GB2312)z
.*-Latin2$z
ISO-8859-2)z	.*-Greek$greek)z.*-UTF8$zutf-8)Hungarian_Magyar-Unicodez	utf-16-le)Amahuacalatin1)zTurkish_Turkce-Turkishlatin5)zLithuanian_Lietuviskai-Balticlatin4)zJapanese_Nihongo-EUCzEUC-JP)Japanese_Nihongo-JIS
iso2022_jp)Chinese_Mandarin-HZhz)zAbkhaz\-Cyrillic\+Abkhcp1251>   Lao-UTF8
Tamil-UTF8Magahi-AgraMagahi-UTF8Marathi-UTF8Bhojpuri-AgraEsperanto-T61Gujarati-UTF8Vietnamese-VPSVietnamese-TCVNVietnamese-VIQRCzech-Latin2-errArmenian-DallakHelvBurmese_Myanmar-UTF8Russian_Russky-UTF8~Chinese_Mandarin-UTF8Amharic-Afenegus6..60375Tigrinya_Tigrigna-VG2MainBurmese_Myanmar-WinResearcherNavaho_Dine-Navajo-Navaho-font(Azeri_Azerbaijani_Latin-Az.Times.Lat01172Azeri_Azerbaijani_Cyrillic-Az.Times.Cyr.Normal0117r   r   r   c                     t        |d      }t        | 	  ||D cg c]  }|| j                  vs| c}| j                         y c c}w )Nz(?!README|\.).*)encoding)r   super__init__SKIP	ENCODINGS)selfrootfileidsfileid	__class__s       L/var/www/openai/venv/lib/python3.12/site-packages/nltk/corpus/reader/udhr.pyr1   zUdhrCorpusReader.__init__D   sL    %d,>?")E'V499-DV'E^^ 	 	
Es
   A
A
)udhr)__name__
__module____qualname__r3   r2   r1   __classcell__)r8   s   @r9   r   r   	   s    I.!DF
 
    r   N)__doc__nltk.corpus.reader.plaintextr   nltk.corpus.reader.utilr   r    r?   r9   <module>rD      s!    ? 7A
, A
r?   