-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathRssReader.java
More file actions
154 lines (140 loc) · 6.08 KB
/
RssReader.java
File metadata and controls
154 lines (140 loc) · 6.08 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
/**
* (c) 2020 Wolfgang Hauptfleisch <dev@augmentedlogic.com>
* This file is part of simplefeedreader
* Licence: Apache v2
**/
package com.augmentedlogic.simplefeedreader;
import java.io.IOException;
import java.io.InputStream;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.regex.Pattern;
import javax.xml.namespace.QName;
import javax.xml.stream.XMLEventReader;
import javax.xml.stream.XMLInputFactory;
import javax.xml.stream.XMLStreamException;
import javax.xml.stream.events.*;
/**
 * Streaming (StAX) reader that converts an RSS document into a {@link Feed}
 * holding one {@link FeedItem} per {@code <item>} element.
 *
 * <p>Elements are matched by local name only (namespace and prefix are ignored).
 * NOTE(review): this means namespaced elements such as {@code atom:link} or
 * {@code itunes:author} are treated like their plain RSS counterparts; confirm
 * whether that is intended before tightening the match.
 */
public class RssReader {

    static final String RSS_TITLE = "title";
    static final String RSS_DESCRIPTION = "description";
    static final String RSS_CHANNEL = "channel";
    static final String RSS_LANGUAGE = "language";
    static final String RSS_COPYRIGHT = "copyright";
    static final String RSS_LINK = "link";
    static final String RSS_AUTHOR = "author";
    static final String RSS_ITEM = "item";
    static final String RSS_PUB_DATE = "pubDate";
    static final String RSS_GUID = "guid";
    static final String RSS_ENCLOSURE = "enclosure";

    /** Matches anything that looks like a markup tag, including tags that span several lines. */
    private static final Pattern HTML_TAG = Pattern.compile("<[^>]*>");

    private static final QName ATTR_URL = new QName("url");
    private static final QName ATTR_TYPE = new QName("type");

    /** When true, item descriptions are stripped of markup tags before being stored. */
    private boolean plainText = false;

    /**
     * Optionally strips markup tags from a description.
     *
     * @param html the raw description text, may be {@code null}
     * @return the input unchanged when plain-text mode is off or the input is {@code null};
     *         otherwise the input with all tags removed and surrounding whitespace trimmed
     */
    private String process(String html) {
        if (!plainText || html == null) {
            return html;
        }
        return HTML_TAG.matcher(html).replaceAll("").trim();
    }

    /**
     * Parses an RSS document from the given stream.
     *
     * <p>Channel-level values seen before the first {@code <item>} become the feed
     * header. Each item starts from empty values, so a field missing from one item
     * is reported as an empty string rather than inheriting an earlier value.
     *
     * @param in stream positioned at the start of the XML document; it is not closed by this method
     * @return the parsed feed; a feed without items when a {@code <channel>} was present
     *         but contained no {@code <item>}; {@code null} when the document contains
     *         neither a {@code <channel>} nor an {@code <item>} element
     * @throws RuntimeException wrapping the {@link XMLStreamException} when the document cannot be parsed
     */
    protected Feed readFeed(InputStream in) {
        Feed feed = null;
        boolean sawChannel = false;

        String description = "";
        String title = "";
        String link = "";
        String language = "";
        String copyright = "";
        String author = "";
        String pubdate = "";
        String guid = "";
        String mediafile = "";
        String mediatype = "";

        XMLEventReader eventReader = null;
        try {
            XMLInputFactory inputFactory = XMLInputFactory.newInstance();
            inputFactory.setProperty(XMLInputFactory.IS_COALESCING, true);
            // Feeds are untrusted input: do not process DTDs or resolve external entities (XXE).
            inputFactory.setProperty(XMLInputFactory.SUPPORT_DTD, false);
            inputFactory.setProperty(XMLInputFactory.IS_SUPPORTING_EXTERNAL_ENTITIES, false);
            eventReader = inputFactory.createXMLEventReader(in);

            // iterate over the document
            while (eventReader.hasNext()) {
                XMLEvent event = eventReader.nextEvent();

                if (event.isStartElement()) {
                    StartElement start = event.asStartElement();
                    switch (start.getName().getLocalPart()) {
                        case RSS_CHANNEL:
                            sawChannel = true;
                            break;
                        case RSS_ITEM:
                            if (feed == null) {
                                // Everything collected so far belongs to the channel header.
                                feed = new Feed(title, link, description, language, copyright, pubdate);
                            }
                            // Start every item from a clean slate so values do not leak
                            // from the channel or from the previous item.
                            title = "";
                            link = "";
                            description = "";
                            author = "";
                            pubdate = "";
                            guid = "";
                            mediafile = "";
                            mediatype = "";
                            break;
                        case RSS_TITLE:
                            title = getCharacterData(eventReader);
                            break;
                        case RSS_DESCRIPTION:
                            description = getCharacterData(eventReader);
                            break;
                        case RSS_LINK:
                            link = getCharacterData(eventReader);
                            break;
                        case RSS_GUID:
                            guid = getCharacterData(eventReader);
                            break;
                        case RSS_LANGUAGE:
                            language = getCharacterData(eventReader);
                            break;
                        case RSS_AUTHOR:
                            author = getCharacterData(eventReader);
                            break;
                        case RSS_PUB_DATE:
                            pubdate = getCharacterData(eventReader);
                            break;
                        case RSS_COPYRIGHT:
                            copyright = getCharacterData(eventReader);
                            break;
                        case RSS_ENCLOSURE: {
                            Attribute url = start.getAttributeByName(ATTR_URL);
                            if (url != null) {
                                mediafile = url.getValue();
                            }
                            Attribute type = start.getAttributeByName(ATTR_TYPE);
                            if (type != null) {
                                mediatype = type.getValue();
                            }
                            break;
                        }
                        default:
                            break;
                    }
                } else if (event.isEndElement()
                        && RSS_ITEM.equals(event.asEndElement().getName().getLocalPart())) {
                    // A closing </item> implies a preceding <item>, so feed is non-null here.
                    FeedItem message = new FeedItem();
                    message.setAuthor(author);
                    message.setDescription(this.process(description));
                    message.setGuid(guid);
                    message.setLink(link);
                    message.setTitle(title);
                    message.setPubDate(pubdate);
                    message.setMediaFile(mediafile);
                    message.setMediaType(mediatype);
                    feed.getFeedItems().add(message);
                }
            }

            if (feed == null && sawChannel) {
                // Valid channel without any items: still expose the channel metadata.
                feed = new Feed(title, link, description, language, copyright, pubdate);
            }
        } catch (XMLStreamException e) {
            throw new RuntimeException(e);
        } finally {
            if (eventReader != null) {
                try {
                    // Releases parser resources only; the underlying stream stays open for the caller.
                    eventReader.close();
                } catch (XMLStreamException ignored) {
                    // Best-effort cleanup; a failure here must not mask the parse result or error.
                }
            }
        }
        return feed;
    }

    /**
     * Returns the text content that immediately follows the current start element.
     *
     * <p>The next event is only consumed when it is character data, so an empty
     * element or a nested child element is left in the stream for the main loop.
     *
     * @param eventReader reader positioned just after a start element
     * @return the character data, or an empty string when the next event is not text
     * @throws XMLStreamException if the underlying parser fails
     */
    private String getCharacterData(XMLEventReader eventReader) throws XMLStreamException {
        XMLEvent next = eventReader.peek();
        if (next != null && next.isCharacters()) {
            return eventReader.nextEvent().asCharacters().getData();
        }
        return "";
    }

    /**
     * Enables or disables stripping of markup tags from item descriptions.
     *
     * @param plain_text {@code true} to strip tags; {@code false} or {@code null} to keep descriptions as-is
     */
    protected void setPlainText(Boolean plain_text) {
        this.plainText = Boolean.TRUE.equals(plain_text);
    }
}