3 \X@sdZddgZddlZddlmZddlmZddlmZddl m Z ej d Z ej d Z ej d Zej d Zej d Zd ZdZeZGdddeZGdddZGdddeZdS)aFeedParser - An email feed parser. The feed parser implements an interface for incrementally parsing an email message, line by line. This has advantages for certain applications, such as those reading email messages off a socket. FeedParser.feed() is the primary interface for pushing new data into the parser. It returns when there's nothing more it can do with the available data. When you have no more data to push into the parser, call .close(). This completes the parsing and returns the root message object. The other advantage of this parser is that it will never raise a parsing exception. Instead, when it finds something unexpected, it adds a 'defect' to the current message. Defects are just instances that live on the message object's .defects attribute. FeedParserBytesFeedParserN)errors)compat32)deque)StringIOz \r\n|\r|\nz (\r\n|\r|\n)z(\r\n|\r|\n)\Zz%^(From |[\041-\071\073-\176]*:|[\t ]) c@s`eZdZdZddZddZddZdd Zd d Zd d Z ddZ ddZ ddZ ddZ dS)BufferedSubFileakA file-ish object that can have new data loaded into it. You can also push and pop line-matching predicates onto a stack. When the current predicate matches the current line, a false EOF response (i.e. empty string) is returned instead. This lets the parser adhere to a simple abstraction -- it parses until EOF closes the current message. cCs$tdd|_t|_g|_d|_dS)Nr)newlineF)r_partialr_lines _eofstack_closed)selfr"/usr/lib64/python3.6/feedparser.py__init__5s zBufferedSubFile.__init__cCs|jj|dS)N)rappend)rZpredrrrpush_eof_matcher@sz BufferedSubFile.push_eof_matchercCs |jjS)N)rpop)rrrrpop_eof_matcherCszBufferedSubFile.pop_eof_matchercCs<|jjd|j|jj|jjd|jjd|_dS)NrT)r seek pushlines readlinestruncater)rrrrcloseFs    zBufferedSubFile.closecCsN|js|jrdStS|jj}x*t|jD]}||r*|jj|dSq*W|S)Nr)r r NeedMoreDatapopleftreversedr appendleft)rlineZateofrrrreadlineNs  zBufferedSubFile.readlinecCs|jj|dS)N)r r )rr!rrr unreadline`szBufferedSubFile.unreadlinecCsx|jj|d|kr d|kr dS|jjd|jj}|jjd|jj|djdsj|jj|j|j|dS)z$Push some new data into this object.r  Nr)r writerrrendswithrr)rdatapartsrrrpushes     zBufferedSubFile.pushcCs|jj|dS)N)r extend)rlinesrrrrzszBufferedSubFile.pushlinescCs|S)Nr)rrrr__iter__}szBufferedSubFile.__iter__cCs|j}|dkrt|S)Nr)r" StopIteration)rr!rrr__next__szBufferedSubFile.__next__N)__name__ __module__ __qualname____doc__rrrrr"r#r+rr.r0rrrrr -s r c@s`eZdZdZdedddZddZdd Zd d Zd d Z ddZ ddZ ddZ ddZ dS)rzA feed-style parser of email.N)policyc Cs||_d|_|dkr<|jdkr2ddlm}||_qn|j|_n2||_y||jdWntk rld|_YnXt|_g|_ |j j |_ d|_ d|_d|_dS)a_factory is called with no arguments to create a new message obj The policy keyword specifies a policy object that controls a number of aspects of the parser's operation. The default policy maintains backward compatibility. FNr)Message)r5T)r5_old_style_factoryZmessage_factoryZ email.messager6_factory TypeErrorr _input _msgstack _parsegenr0_parse_cur_last _headersonly)rr8r5r6rrrrs$     zFeedParser.__init__cCs d|_dS)NT)r@)rrrr_set_headersonlyszFeedParser._set_headersonlycCs|jj||jdS)zPush more data into the parser.N)r:r+ _call_parse)rr)rrrfeeds zFeedParser.feedc Cs&y |jWntk r YnXdS)N)r=r/)rrrrrBs zFeedParser._call_parsecCsJ|jj|j|j}|jdkrF|j rFtj}|jj |||S)zget_content_typeZset_default_typer;Zattachrr?)rmsgrrr _new_messages   zFeedParser._new_messagecCs(|jj}|jr|jd|_nd|_|S)Nr%r&)r;rr>)rretvalrrrrEs  zFeedParser._pop_messageccs6|jg}xb|jD]X}|tkr(tVqtj|sbtj|s`tj}|jj |j ||jj |P|j |qW|j ||jrg}x2|jj}|tkrtVq|dkrP|j |qW|j jtj|dS|j jdkrx|jjtjx$|jD]}|tkrtVqPqW|j}|jjx&|jj}|tkrFtVq(Pq(Wx&|jj}|tkrntVqPPqPW|dkrP|jj |qWdS|j jdkrx(|jD]}|tkrtVqPqW|jdS|j jdkr|j j}|dkrbtj}|jj |j |g}x.|jD]$}|tkrtj+}|jj |j ||j jtj| g}x$|jD]}|tkrtVqqWtj||j _'dS| s`tj,}|jj |j |dS| rndg}ng}x.|jD]$}|tkrtVqz|j |qzW|r|d}t-j|}|r|t$|j!dd|d<tj||j _'dSg}x.|jD]$}|tkrtVq|j |qW|j jtj|dS)Nrzmessage/delivery-statusmessagerDzcontent-transfer-encoding8bit7bitbinaryz--z(?Pz4)(?P--)?(?P[ \t]*)(?P\r\n|\r|\n)?$TFendlinesepr%r)rPrOrQr&r&).rLr:rheaderREmatchNLCRErZ MissingHeaderBodySeparatorDefectr5rGr>r#r_parse_headersr@r"Z set_payload EMPTYSTRINGjoinrJrr<rErrFZ get_boundaryZNoBoundaryInMultipartDefectgetlowerZ-InvalidMultipartContentTransferEncodingDefectrecompileescapegroup NLCRE_eolsearchlenpreambler?epilogueZ_payload isinstancestrZStartBoundaryNotFoundDefectZCloseBoundaryNotFoundDefect NLCRE_bol)rZheadersr!rIr-rMrKboundaryZ separatorZ boundaryreZcapturing_preamblercrSZclose_boundary_seenmoZlastlineZeolmordrRZpayload firstlineZbolmorrrr<sf                                                zFeedParser._parsegenc Cs^d}g}x4t|D]&\}}|ddkrV|sJtj|}|jj|j|q|j|q|rx|jj|jj|dg}}|j dr|dkrt j |}|r|dt |j d }|jj|qn:|t |dkr|jj|dStj|}|jjj|q|jd}|dkr*tjd}|jjj|q|d|}|g}qW|rZ|jj|jj|dS)Nrrz zFrom r%:zMissing header name.) enumeraterZ#FirstHeaderLineIsContinuationDefectr5rGr>rZset_rawZheader_source_parse startswithr`rarbr_Z set_unixfromr:r#ZMisplacedEnvelopeHeaderDefectZdefectsfindZInvalidHeaderDefect) rr-Z lastheaderZ lastvaluelinenor!rIriirrrrWsF              zFeedParser._parse_headers)N)r1r2r3r4rrrArCrBrrLrEr<rWrrrrrs  ~cs eZdZdZfddZZS)rz(Like FeedParser, but feed accepts bytes.cstj|jdddS)Nasciisurrogateescape)superrCdecode)rr)) __class__rrrCszBytesFeedParser.feed)r1r2r3r4rC __classcell__rr)rurrs)r4__all__r\ZemailrZemail._policybaser collectionsriorr]rVrgr`Z NLCRE_crackrTrXNLobjectrr rrrrrrs(         [