o
    i	                     @   s0   d Z ddlmZ ddlmZ G dd deZdS )z5
UDHR corpus reader. It mostly deals with encodings.
    )PlaintextCorpusReader)find_corpus_fileidsc                       s.   e Zd Zg dZh dZd fdd	Z  ZS )UdhrCorpusReader))z
.*-Latin1$zlatin-1)z
.*-Hebrew$hebrew)z
.*-Arabic$cp1256)zCzech_Cesky-UTF8cp1250)zPolish-Latin2r   )zPolish_Polski-Latin2r   )z.*-Cyrillic$cyrillic)z.*-SJIS$SJIS)z
.*-GB2312$GB2312)z
.*-Latin2$z
ISO-8859-2)z	.*-Greek$greek)z.*-UTF8$zutf-8)Hungarian_Magyar-Unicodez	utf-16-le)Amahuacalatin1)zTurkish_Turkce-Turkishlatin5)zLithuanian_Lietuviskai-Balticlatin4)zJapanese_Nihongo-EUCzEUC-JP)Japanese_Nihongo-JIS
iso2022_jp)Chinese_Mandarin-HZhz)zAbkhaz\-Cyrillic\+Abkhcp1251>   Lao-UTF8
Tamil-UTF8Magahi-AgraMagahi-UTF8Marathi-UTF8Bhojpuri-AgraEsperanto-T61Gujarati-UTF8Vietnamese-VPSVietnamese-TCVNVietnamese-VIQRCzech-Latin2-errArmenian-DallakHelvBurmese_Myanmar-UTF8Russian_Russky-UTF8~Chinese_Mandarin-UTF8Amharic-Afenegus6..60375Tigrinya_Tigrigna-VG2MainBurmese_Myanmar-WinResearcherNavaho_Dine-Navajo-Navaho-font(Azeri_Azerbaijani_Latin-Az.Times.Lat01172Azeri_Azerbaijani_Cyrillic-Az.Times.Cyr.Normal0117r   r   r   udhrc                    s0   t |d}t j| fdd|D  jd d S )Nz(?!README|\.).*c                    s   g | ]	}| j vr|qS  )SKIP).0fileidselfr-   R/var/www/edux/Edux_v2/venv/lib/python3.10/site-packages/nltk/corpus/reader/udhr.py
<listcomp>H   s    z-UdhrCorpusReader.__init__.<locals>.<listcomp>)encoding)r   super__init__	ENCODINGS)r2   rootfileids	__class__r1   r3   r7   D   s   

zUdhrCorpusReader.__init__)r,   )__name__
__module____qualname__r8   r.   r7   __classcell__r-   r-   r;   r3   r   	   s    #r   N)__doc__nltk.corpus.reader.plaintextr   nltk.corpus.reader.utilr   r   r-   r-   r-   r3   <module>   s    