
    dh                     >    S SK Jr  S SKJr  S SKJr   " S S\5      rg)    )List)Document)
BaseLoaderc                   :    \ rS rSrSrS\4S jrS\\   4S jr	Sr
g)	GutenbergLoader   zLoad from `Gutenberg.org`.	file_pathc                     UR                  S5      (       d  [        S5      eUR                  S5      (       d  [        S5      eXl        g)zInitialize with a file path.zhttps://www.gutenberg.orgz5file path must start with 'https://www.gutenberg.org'z.txtzfile path must end with '.txt'N)
startswith
ValueErrorendswithr	   )selfr	   s     f/var/www/html/shao/venv/lib/python3.13/site-packages/langchain_community/document_loaders/gutenberg.py__init__GutenbergLoader.__init__   sB    ##$?@@TUU!!&))=>>"    returnc           
          SSK Jn  U" U R                  5      nSR                  U Vs/ sH  n[	        UR                  S5      5      PM     sn5      nSU R                  0n[        XES9/$ s  snf )z
Load file.r   )urlopenz

z	utf-8-sigsource)page_contentmetadata)urllib.requestr   r	   joinstrdecoder   )r   r   elementseltextr   s         r   loadGutenbergLoader.load   s`    *4>>*{{(K(BC		+ 67(KLdnn-d>?? Ls   #A*)r	   N)__name__
__module____qualname____firstlineno____doc__r   r   r   r   r    __static_attributes__ r   r   r   r      s#    $## #@d8n @r   r   N)typingr   langchain_core.documentsr   )langchain_community.document_loaders.baser   r   r(   r   r   <module>r,      s     - @@j @r   