Coverage Report

Coverage Report - org.apache.commons.feedparser.AtomFeedParser

Classes in this File

Line Coverage

Branch Coverage

Complexity

AtomFeedParser

0/136

0/40

3.3

 /*
  * Copyright 1999,2004 The Apache Software Foundation.
  * 
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  * 
  *      http://www.apache.org/licenses/LICENSE-2.0
  * 
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
 
 package org.apache.commons.feedparser;
 
 import java.util.Iterator;
 import java.util.List;
 
 import org.apache.commons.feedparser.locate.EntityDecoder;
 import org.jaxen.jdom.JDOMXPath;
 import org.jdom.Attribute;
 import org.jdom.CDATA;
 import org.jdom.Comment;
 import org.jdom.Element;
 import org.jdom.Text;
 import org.jdom.output.XMLOutputter;
 
 /**
  * http://www.intertwingly.net/wiki/pie/FrontPage
  *  
  * http://www.ietf.org/internet-drafts/draft-ietf-atompub-format-05.txt
  * 
  * http://www.ietf.org/internet-drafts/draft-ietf-atompub-format-04.txt
  * 
  * http://www.mnot.net/drafts/draft-nottingham-atom-format-02.html
  * 
  * http://www.ietf.org/html.charters/atompub-charter.html
  * 
  * http://www.ietf.org/internet-drafts/draft-ietf-atompub-format-01.txt
  * 
  * @author <a href="mailto:burton@apache.org">Kevin A. Burton (burtonator)</a>
  * @version $Id: AtomFeedParser.java 373614 2006-01-30 22:31:21Z mvdb $
  */
 public class AtomFeedParser extends BaseParser {
 
     /**
      * Parse this feed.
      *
      * 
      */
     public static void parse( FeedParserListener listener,
                               org.jdom.Document doc ) throws Exception {
 
         FeedParserState state = new FeedParserState( listener );
 
         FeedVersion v = new FeedVersion();
         v.isAtom = true;
         listener.onFeedVersion( v );
 
         listener.init();
 
         Element root = doc.getRootElement();
 
         doLocale( state, listener, root );
         
         doChannel( state, listener, doc );
         doEntry( state, listener, doc );
 
         doLocaleEnd( state, listener, root );
 
         listener.finished();
 
     }
 
     private static void doChannel( FeedParserState state,
                                    FeedParserListener listener,
                                    org.jdom.Document doc ) throws Exception {
 
         Element root = doc.getRootElement();
 
         //perform onChannel method...  (title, link, description)
         String title = selectText( "/atom:feed/atom:title", root );
 
         //xpath = new XPath( "/atom:feed/atom:link[atom:rel='alternate']" );
         
         //perform onChannel method...  (title, link, description)
         String link = selectSingleAttribute( "/atom:feed/atom:link[@rel='alternate'][@type='text/html']/@href", root );
 
         //String description = selectText( "/atom:feed/atom:summary[@rel='text/plain']", doc );
 
         String tagline = selectText( "/atom:feed/atom:tagline", root );
         
         //state.current = title;
         listener.onChannel( state, title, link, tagline );
 
         listener.onChannelEnd();
 
     }
 
     private static void doEntry( FeedParserState state,
                                  FeedParserListener listener,
                                  org.jdom.Document doc ) throws Exception {
 
         JDOMXPath xpath = new JDOMXPath( "/atom:feed/atom:entry" );
         xpath.setNamespaceContext( NS.context );
 
         List items = xpath.selectNodes( doc );
 
         Iterator i = items.iterator();
             
         //update items.
         while ( i.hasNext() ) {
 
             Element child = (Element)i.next();
 
             doLocale( state, listener, child );
             
             String title = selectText( "atom:title", child );
 
             // The "atom:link" element is a Link construct that conveys a URI
             // associated with the entry. The nature of the relationship as well
             // as the link itself is determined by the element's content.
 
             // atom:entry elements MUST contain at least one atom:link element
             // with a rel attribute value of "alternate".
 
             // atom:entry elements MUST NOT contain more than one atom:link
             // element with a rel attribute value of "alternate" that has the
             // same type attribute value.
 
             // atom:entry elements MAY contain additional atom:link elements
             // beyond those described above.
             
             String link = selectSingleAttribute( "atom:link[@rel='alternate'][@type='text/html']/@href",
                                                  child );
 
             // The "atom:summary" element is a Content construct that conveys a
             // short summary, abstract or excerpt of the entry. atom:entry
             // elements MAY contain an atom:created element, but MUST NOT
             // contain more than one.
 
             //FIXME: what if there is no type attribute specified?  Whats the default?
 
             // Content constructs MAY have a "type" attribute, whose value
             // indicates the media type of the content.  When present, this
             // attribute's value MUST be a media type [RFC2045].  If this
             // attribute is not present, processors MUST behave as if it were
             // present with a value of "text/ plain".
 
             String description = null;
 
             Element summary = child.getChild( "summary", NS.ATOM );
 
             if ( summary != null ) {
 
                 String type = summary.getAttributeValue( "type", NS.ATOM );
                 
                 if ( type == null || "text/plain".equals( type ) )
                     description = summary.getText();
                 
             }
 
             state.current = child;
             
             listener.onItem( state, title, link, description, link );
             
             doLink( state, listener, child );
             
             doMeta( state, listener, child );
 
             doContent( state, listener, child );
 
             MetaFeedParser.parse( listener, state );
             TagFeedParser.parse( listener, state );
             
             listener.onItemEnd();
             doLocale( state, listener, child );
 
         }
 
     }
 
     private static void doLink( FeedParserState state,
                                 FeedParserListener listener,
                                 Element current ) throws Exception {
 
         if ( listener instanceof LinkFeedParserListener == false )
             return;
 
         LinkFeedParserListener lfpl = (LinkFeedParserListener)listener;
         
         JDOMXPath xpath = new JDOMXPath( "atom:link" );
         xpath.setNamespaceContext( NS.context );
 
         List items = xpath.selectNodes( current );
 
         Iterator it = items.iterator();
             
         //update items.
         while ( it.hasNext() ) {
 
             Element link = (Element)it.next();
             
             String href = link.getAttributeValue( "href" );
             String rel = link.getAttributeValue( "rel" );
             String type = link.getAttributeValue( "type" );
 
             String title = null;
             long length = -1;
 
             lfpl.onLink( state, rel, type, href, title, length );
             
         }
         
     }
     
     private static void doContent( FeedParserState state,
                                    FeedParserListener listener,
                                    Element current ) throws Exception {
 
         if ( ! (listener instanceof ContentFeedParserListener) )
             return;
         
         ContentFeedParserListener clistener = (ContentFeedParserListener)listener;
 
         JDOMXPath xpath = new JDOMXPath( "atom:content" );
         xpath.setNamespaceContext( NS.context );
 
         List items = xpath.selectNodes( current );
 
         Iterator i = items.iterator();
             
         //update items.
         while ( i.hasNext() ) {
 
             Element content = (Element)i.next();
 
             doLocale( state, listener, content );
 
             String type = content.getAttributeValue( "type", "text/plain" );
             String mode = content.getAttributeValue( "mode" );
 
             String format = null;
             String encoding = null;
 
             String value = null;
 
             //
             if ( "xml".equals( mode ) ) {
                 value = content.getText();
             } else if ( "escaped".equals( mode ) ) {
 
                 //need to decode the content here &lt; -> < etc.
                 value = getXMLOfContent( content.getContent() );
                 value = EntityDecoder.decode( value );
             } else {
                 mode = "xml";
                 value = getXMLOfContent( content.getContent() );
             }
 
             boolean isSummary = false;
             
             clistener.onContent( state, type, format, encoding, mode, value, isSummary );
 
             doLocaleEnd( state, listener, content );
             
         }
 
         xpath = new JDOMXPath( "atom:summary[@type='application/xhtml+xml']" );
         xpath.setNamespaceContext( NS.context );
         Element e = (Element)xpath.selectSingleNode( current );
 
         if ( e != null ) {
 
             String type = "text/html";
             String format = "application/xhtml+xml";
             String encoding = null;
             String mode = "xml";
 
             //FIXME: get xml:base to expand the URIs.
             
             String value = getXMLOfContent( e );
             boolean isSummary = true;
             
             clistener.onContent( state, type, format, encoding, mode, value, isSummary );
 
         }
         
     }
 
     private static String getXMLOfContent( Element element ) {
         return getXMLOfContent( element.getContent() );
     }
     
     /**
      * Get the content of the given element.
      *
      * 
      */
     private static String getXMLOfContent( List content ) {
 
         //NOTE: Fri Mar 04 2005 03:59 PM (burton1@rojo.com): in my profiling I
         //found that this is a BIG memory allocater.  FIXME: We SHOULD be able
         //to do the same thing we do for xhtml:body RIGHT?
         
         StringBuffer buff = new StringBuffer( 10000 ); 
 
         // NOTE: Changed this constructor to use the default Format. Since the
         // constructor used no longer exists in jdom 1.0.
         XMLOutputter outputter = new XMLOutputter();
 
         Iterator it = content.iterator();
         
         while ( it.hasNext() ) {
 
             Object next = it.next();
             
             if ( next instanceof String ) {
                 buff.append( (String)next );
             } else if ( next instanceof Element ) {
                 buff.append( outputter.outputString( (Element)next ) );
             } else if ( next instanceof CDATA ) {
                 buff.append( ((CDATA)next).getText() );
             } else if ( next instanceof Comment ) {
                 buff.append( outputter.outputString( (Comment)next ) );
             } else if ( next instanceof Text ) {
                 buff.append( outputter.outputString( (Text)next ) );
             } 
 
         } 
 
         return buff.toString();
         
     }
 
     private static void doMeta( FeedParserState state,
                                 FeedParserListener listener,
                                 Element element ) throws Exception {
 
         //FIXME: move this code to MetaFeedParser...
         
         if ( ! (listener instanceof MetaFeedParserListener) ) 
             return;
 
         MetaFeedParserListener mlistener = (MetaFeedParserListener)listener;
 
         //handle issued, created, and then dublin core..
         String subject = selectText( "dc:subject", element);
 
         if ( subject != null ) {
             mlistener.onSubject( state, subject );
             mlistener.onSubjectEnd();
         } 
 
     }
 
     private static Element selectSingleElement( String query, org.jdom.Document doc ) throws Exception {
 
         JDOMXPath xpath = new JDOMXPath( query );
         xpath.setNamespaceContext( NS.context );
         
         //perform onChannel method...  (title, link, description)
         return (Element)xpath.selectSingleNode( doc );
 
     }
 
     private static String selectSingleAttribute( String query, Element element ) throws Exception {
 
         JDOMXPath xpath = new JDOMXPath( query );
         xpath.setNamespaceContext( NS.context );
         
         //perform onChannel method...  (title, link, description)
         Attribute a = (Attribute)xpath.selectSingleNode( element );
         if ( a == null )
             return null;
         
         return a.getValue();
 
     }
 
 }
 

1		/*
2		* Copyright 1999,2004 The Apache Software Foundation.
3		*
4		* Licensed under the Apache License, Version 2.0 (the "License");
5		* you may not use this file except in compliance with the License.
6		* You may obtain a copy of the License at
7		*
8		* http://www.apache.org/licenses/LICENSE-2.0
9		*
10		* Unless required by applicable law or agreed to in writing, software
11		* distributed under the License is distributed on an "AS IS" BASIS,
12		* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13		* See the License for the specific language governing permissions and
14		* limitations under the License.
15		*/
16
17		package org.apache.commons.feedparser;
18
19		import java.util.Iterator;
20		import java.util.List;
21
22		import org.apache.commons.feedparser.locate.EntityDecoder;
23		import org.jaxen.jdom.JDOMXPath;
24		import org.jdom.Attribute;
25		import org.jdom.CDATA;
26		import org.jdom.Comment;
27		import org.jdom.Element;
28		import org.jdom.Text;
29		import org.jdom.output.XMLOutputter;
30
31		/**
32		* http://www.intertwingly.net/wiki/pie/FrontPage
33		*
34		* http://www.ietf.org/internet-drafts/draft-ietf-atompub-format-05.txt
35		*
36		* http://www.ietf.org/internet-drafts/draft-ietf-atompub-format-04.txt
37		*
38		* http://www.mnot.net/drafts/draft-nottingham-atom-format-02.html
39		*
40		* http://www.ietf.org/html.charters/atompub-charter.html
41		*
42		* http://www.ietf.org/internet-drafts/draft-ietf-atompub-format-01.txt
43		*
44		* @author <a href="mailto:burton@apache.org">Kevin A. Burton (burtonator)</a>
45		* @version $Id: AtomFeedParser.java 373614 2006-01-30 22:31:21Z mvdb $
46		*/
47	0	public class AtomFeedParser extends BaseParser {
48
49		/**
50		* Parse this feed.
51		*
52		*
53		*/
54		public static void parse( FeedParserListener listener,
55		org.jdom.Document doc ) throws Exception {
56
57	0	FeedParserState state = new FeedParserState( listener );
58
59	0	FeedVersion v = new FeedVersion();
60	0	v.isAtom = true;
61	0	listener.onFeedVersion( v );
62
63	0	listener.init();
64
65	0	Element root = doc.getRootElement();
66
67	0	doLocale( state, listener, root );
68
69	0	doChannel( state, listener, doc );
70	0	doEntry( state, listener, doc );
71
72	0	doLocaleEnd( state, listener, root );
73
74	0	listener.finished();
75
76	0	}
77
78		private static void doChannel( FeedParserState state,
79		FeedParserListener listener,
80		org.jdom.Document doc ) throws Exception {
81
82	0	Element root = doc.getRootElement();
83
84		//perform onChannel method... (title, link, description)
85	0	String title = selectText( "/atom:feed/atom:title", root );
86
87		//xpath = new XPath( "/atom:feed/atom:link[atom:rel='alternate']" );
88
89		//perform onChannel method... (title, link, description)
90	0	String link = selectSingleAttribute( "/atom:feed/atom:link[@rel='alternate'][@type='text/html']/@href", root );
91
92		//String description = selectText( "/atom:feed/atom:summary[@rel='text/plain']", doc );
93
94	0	String tagline = selectText( "/atom:feed/atom:tagline", root );
95
96		//state.current = title;
97	0	listener.onChannel( state, title, link, tagline );
98
99	0	listener.onChannelEnd();
100
101	0	}
102
103		private static void doEntry( FeedParserState state,
104		FeedParserListener listener,
105		org.jdom.Document doc ) throws Exception {
106
107	0	JDOMXPath xpath = new JDOMXPath( "/atom:feed/atom:entry" );
108	0	xpath.setNamespaceContext( NS.context );
109
110	0	List items = xpath.selectNodes( doc );
111
112	0	Iterator i = items.iterator();
113
114		//update items.
115	0	while ( i.hasNext() ) {
116
117	0	Element child = (Element)i.next();
118
119	0	doLocale( state, listener, child );
120
121	0	String title = selectText( "atom:title", child );
122
123		// The "atom:link" element is a Link construct that conveys a URI
124		// associated with the entry. The nature of the relationship as well
125		// as the link itself is determined by the element's content.
126
127		// atom:entry elements MUST contain at least one atom:link element
128		// with a rel attribute value of "alternate".
129
130		// atom:entry elements MUST NOT contain more than one atom:link
131		// element with a rel attribute value of "alternate" that has the
132		// same type attribute value.
133
134		// atom:entry elements MAY contain additional atom:link elements
135		// beyond those described above.
136
137	0	String link = selectSingleAttribute( "atom:link[@rel='alternate'][@type='text/html']/@href",
138		child );
139
140		// The "atom:summary" element is a Content construct that conveys a
141		// short summary, abstract or excerpt of the entry. atom:entry
142		// elements MAY contain an atom:created element, but MUST NOT
143		// contain more than one.
144
145		//FIXME: what if there is no type attribute specified? Whats the default?
146
147		// Content constructs MAY have a "type" attribute, whose value
148		// indicates the media type of the content. When present, this
149		// attribute's value MUST be a media type [RFC2045]. If this
150		// attribute is not present, processors MUST behave as if it were
151		// present with a value of "text/ plain".
152
153	0	String description = null;
154
155	0	Element summary = child.getChild( "summary", NS.ATOM );
156
157	0	if ( summary != null ) {
158
159	0	String type = summary.getAttributeValue( "type", NS.ATOM );
160
161	0	if ( type == null \|\| "text/plain".equals( type ) )
162	0	description = summary.getText();
163
164		}
165
166	0	state.current = child;
167
168	0	listener.onItem( state, title, link, description, link );
169
170	0	doLink( state, listener, child );
171
172	0	doMeta( state, listener, child );
173
174	0	doContent( state, listener, child );
175
176	0	MetaFeedParser.parse( listener, state );
177	0	TagFeedParser.parse( listener, state );
178
179	0	listener.onItemEnd();
180	0	doLocale( state, listener, child );
181
182	0	}
183
184	0	}
185
186		private static void doLink( FeedParserState state,
187		FeedParserListener listener,
188		Element current ) throws Exception {
189
190	0	if ( listener instanceof LinkFeedParserListener == false )
191	0	return;
192
193	0	LinkFeedParserListener lfpl = (LinkFeedParserListener)listener;
194
195	0	JDOMXPath xpath = new JDOMXPath( "atom:link" );
196	0	xpath.setNamespaceContext( NS.context );
197
198	0	List items = xpath.selectNodes( current );
199
200	0	Iterator it = items.iterator();
201
202		//update items.
203	0	while ( it.hasNext() ) {
204
205	0	Element link = (Element)it.next();
206
207	0	String href = link.getAttributeValue( "href" );
208	0	String rel = link.getAttributeValue( "rel" );
209	0	String type = link.getAttributeValue( "type" );
210
211	0	String title = null;
212	0	long length = -1;
213
214	0	lfpl.onLink( state, rel, type, href, title, length );
215
216	0	}
217
218	0	}
219
220		private static void doContent( FeedParserState state,
221		FeedParserListener listener,
222		Element current ) throws Exception {
223
224	0	if ( ! (listener instanceof ContentFeedParserListener) )
225	0	return;
226
227	0	ContentFeedParserListener clistener = (ContentFeedParserListener)listener;
228
229	0	JDOMXPath xpath = new JDOMXPath( "atom:content" );
230	0	xpath.setNamespaceContext( NS.context );
231
232	0	List items = xpath.selectNodes( current );
233
234	0	Iterator i = items.iterator();
235
236		//update items.
237	0	while ( i.hasNext() ) {
238
239	0	Element content = (Element)i.next();
240
241	0	doLocale( state, listener, content );
242
243	0	String type = content.getAttributeValue( "type", "text/plain" );
244	0	String mode = content.getAttributeValue( "mode" );
245
246	0	String format = null;
247	0	String encoding = null;
248
249	0	String value = null;
250
251		//
252	0	if ( "xml".equals( mode ) ) {
253	0	value = content.getText();
254	0	} else if ( "escaped".equals( mode ) ) {
255
256		//need to decode the content here &lt; -> < etc.
257	0	value = getXMLOfContent( content.getContent() );
258	0	value = EntityDecoder.decode( value );
259		} else {
260	0	mode = "xml";
261	0	value = getXMLOfContent( content.getContent() );
262		}
263
264	0	boolean isSummary = false;
265
266	0	clistener.onContent( state, type, format, encoding, mode, value, isSummary );
267
268	0	doLocaleEnd( state, listener, content );
269
270	0	}
271
272	0	xpath = new JDOMXPath( "atom:summary[@type='application/xhtml+xml']" );
273	0	xpath.setNamespaceContext( NS.context );
274	0	Element e = (Element)xpath.selectSingleNode( current );
275
276	0	if ( e != null ) {
277
278	0	String type = "text/html";
279	0	String format = "application/xhtml+xml";
280	0	String encoding = null;
281	0	String mode = "xml";
282
283		//FIXME: get xml:base to expand the URIs.
284
285	0	String value = getXMLOfContent( e );
286	0	boolean isSummary = true;
287
288	0	clistener.onContent( state, type, format, encoding, mode, value, isSummary );
289
290		}
291
292	0	}
293
294		private static String getXMLOfContent( Element element ) {
295	0	return getXMLOfContent( element.getContent() );
296		}
297
298		/**
299		* Get the content of the given element.
300		*
301		*
302		*/
303		private static String getXMLOfContent( List content ) {
304
305		//NOTE: Fri Mar 04 2005 03:59 PM (burton1@rojo.com): in my profiling I
306		//found that this is a BIG memory allocater. FIXME: We SHOULD be able
307		//to do the same thing we do for xhtml:body RIGHT?
308
309	0	StringBuffer buff = new StringBuffer( 10000 );
310
311		// NOTE: Changed this constructor to use the default Format. Since the
312		// constructor used no longer exists in jdom 1.0.
313	0	XMLOutputter outputter = new XMLOutputter();
314
315	0	Iterator it = content.iterator();
316
317	0	while ( it.hasNext() ) {
318
319	0	Object next = it.next();
320
321	0	if ( next instanceof String ) {
322	0	buff.append( (String)next );
323	0	} else if ( next instanceof Element ) {
324	0	buff.append( outputter.outputString( (Element)next ) );
325	0	} else if ( next instanceof CDATA ) {
326	0	buff.append( ((CDATA)next).getText() );
327	0	} else if ( next instanceof Comment ) {
328	0	buff.append( outputter.outputString( (Comment)next ) );
329	0	} else if ( next instanceof Text ) {
330	0	buff.append( outputter.outputString( (Text)next ) );
331		}
332
333	0	}
334
335	0	return buff.toString();
336
337		}
338
339		private static void doMeta( FeedParserState state,
340		FeedParserListener listener,
341		Element element ) throws Exception {
342
343		//FIXME: move this code to MetaFeedParser...
344
345	0	if ( ! (listener instanceof MetaFeedParserListener) )
346	0	return;
347
348	0	MetaFeedParserListener mlistener = (MetaFeedParserListener)listener;
349
350		//handle issued, created, and then dublin core..
351	0	String subject = selectText( "dc:subject", element);
352
353	0	if ( subject != null ) {
354	0	mlistener.onSubject( state, subject );
355	0	mlistener.onSubjectEnd();
356		}
357
358	0	}
359
360		private static Element selectSingleElement( String query, org.jdom.Document doc ) throws Exception {
361
362	0	JDOMXPath xpath = new JDOMXPath( query );
363	0	xpath.setNamespaceContext( NS.context );
364
365		//perform onChannel method... (title, link, description)
366	0	return (Element)xpath.selectSingleNode( doc );
367
368		}
369
370		private static String selectSingleAttribute( String query, Element element ) throws Exception {
371
372	0	JDOMXPath xpath = new JDOMXPath( query );
373	0	xpath.setNamespaceContext( NS.context );
374
375		//perform onChannel method... (title, link, description)
376	0	Attribute a = (Attribute)xpath.selectSingleNode( element );
377	0	if ( a == null )
378	0	return null;
379
380	0	return a.getValue();
381
382		}
383
384		}
385