/**
 * Sends one formatted announcement per feed entry to every destination in {@code subscribers}.
 *
 * <p>Each message carries, in order: the {@code title} field of this object, the entry's
 * publication date, the entry's author, the entry's title and the entry's link, decorated with
 * the formatting codes from {@code Colors}.
 *
 * @param entries the feed entries to announce; one message is sent per entry and subscriber
 */
public void notifySubscribers(SyndEntry[] entries) {
  // The template does not depend on the entry or the subscriber, so it is assembled once.
  final String template =
      "["
          + Colors.BOLD
          + "RSS - %s"
          + Colors.NORMAL
          + "]"
          + " ["
          + Colors.BOLD
          + "%s"
          + Colors.NORMAL
          + "]"
          + Colors.BLUE
          + Colors.BOLD
          + " %s"
          + Colors.NORMAL
          + ": "
          + Colors.DARK_GREEN
          + "%s"
          + Colors.NORMAL
          + " ("
          + Colors.OLIVE
          + Colors.BOLD
          + "%s"
          + Colors.NORMAL
          + ")";

  for (SyndEntry entry : entries) {
    // An entry may carry no publication date; calling toString() on it unconditionally would
    // throw a NullPointerException and abort the notification of all remaining entries.
    String published =
        entry.getPublishedDate() == null ? "unknown date" : entry.getPublishedDate().toString();

    // The text is identical for every subscriber, so format it once per entry.
    String message =
        String.format(
            template, title, published, entry.getAuthor(), entry.getTitle(), entry.getLink());

    for (String destination : subscribers) {
      Main.getBot().sendMessage(destination, message);
    }
  }
}
public void setEpisodeAttributes(Episode episode, Podcast podcast, SyndEntry entry) { // set DESCRIPTION for episode - used in search if (null != entry.getDescription()) { String episodeDesc = entry.getDescription().getValue(); // tags are removed from description String descWithoutTabs = episodeDesc.replaceAll("\\<[^>]*>", ""); // carriage returns are removed from description - for player String descWithoutEndOfLine = descWithoutTabs.replaceAll("\\n", ""); if (descWithoutEndOfLine.length() > MAX_LENGTH_DESCRIPTION) { episode.setDescription(descWithoutEndOfLine.substring(0, MAX_LENGTH_DESCRIPTION)); } else { episode.setDescription(descWithoutEndOfLine); } } // set author episode.setAuthor(entry.getAuthor()); // set title for episode - used in search String episodeTitle = entry.getTitle(); if (episodeTitle != null) { // removes quotes to display properly in player episodeTitle = episodeTitle.replaceAll("\"", ""); if (episodeTitle.length() > MAX_PERMITTED_TITLE_LENGTH) { episodeTitle = episodeTitle.substring(0, MAX_PERMITTED_TITLE_LENGTH); } episode.setTitle(episodeTitle); String titleInUrl = episodeTitle.trim().replaceAll("[^a-zA-Z0-9\\-\\s\\.]", ""); titleInUrl = titleInUrl.replaceAll("[\\-| |\\.]+", "-"); if (titleInUrl.length() > TITLE_IN_URL_MAX_LENGTH) { episode.setTitleInUrl(titleInUrl.substring(0, TITLE_IN_URL_MAX_LENGTH)); } else { episode.setTitleInUrl(titleInUrl); } } episode.setLink(entry.getLink()); // in the beginning inherit the media type from the podcast episode.setMediaType(podcast.getMediaType()); // get the list of enclosures @SuppressWarnings("unchecked") List<SyndEnclosure> enclosures = (List<SyndEnclosure>) entry.getEnclosures(); List<String> audioMimeTypesList = Arrays.asList(audioMimeTypesArray); List<String> videoMimeTypesList = Arrays.asList(videoMimeTypesArray); // set media url for the episode - this will be played in the player if (null != enclosures) { // if in the enclosure list is a media type (either audio or video), // this will set 
as the link of the episode for (SyndEnclosure enclosure : enclosures) { if (null != enclosure) { episode.setMediaUrl(enclosure.getUrl()); if (enclosure.getLength() >= 0) episode.setLength(enclosure.getLength()); // when adding a new podcast media type is selected for the // podcast based on an initial view, but it can be that is a // mixed podcast so both audio // and video should be considered and in that case PRIORITY // has the type of the episode if any... if (null != enclosure.getType()) { episode.setEnclosureType(enclosure.getType().trim()); if (audioMimeTypesList.contains(enclosure.getType().trim())) { episode.setMediaType(MediaType.Audio); break; } if (videoMimeTypesList.contains(enclosure.getType().trim())) { episode.setMediaType(MediaType.Video); break; } } } } } else { episode.setMediaUrl("noMediaUrl"); } if (episode.getMediaUrl() == null) { episode.setMediaUrl("noMediaUrl"); } if (episode.getMediaUrl() == null || episode.getMediaUrl().equals("noMediaUrl")) { LOG.warn( "PodcastId[" + podcast.getPodcastId() + "] - " + "COULD NOT SET MEDIA URL - " + "epTitle[" + entry.getTitle() + "]" + "feed[" + podcast.getUrl() + "]"); } // set link attribute episode.setLink(entry.getLink()); episode.setPublicationDate(entry.getPublishedDate()); updatePodcastPublicationDateAndLastMediaUrl(episode, podcast); if (episode.getPublicationDate() == null) { LOG.warn( "PodcastId[" + podcast.getPodcastId() + "] - " + "COULD NOT SET publication date " + "epTitle[" + entry.getTitle() + "]" + "feed[" + podcast.getUrl() + "]"); } }
@SuppressWarnings("unchecked") public void setPodcastFeedAttributes(Podcast podcast, boolean feedPropertyHasBeenSet) throws IllegalArgumentException, FeedException, IOException { SyndFeed syndFeed = null; if (!feedPropertyHasBeenSet) { syndFeed = syndFeedService.getSyndFeedForUrl(podcast.getUrl()); podcast.setPodcastFeed(syndFeed); } if (syndFeed != null) { // set DESCRIPTION for podcast - used in search if (syndFeed.getDescription() != null && !syndFeed.getDescription().equals("")) { String description = syndFeed.getDescription(); // out of description remove tags if any exist and store also // short description String descWithoutTabs = description.replaceAll("\\<[^>]*>", ""); if (descWithoutTabs.length() > MAX_LENGTH_DESCRIPTION) { podcast.setDescription(descWithoutTabs.substring(0, MAX_LENGTH_DESCRIPTION)); } else { podcast.setDescription(descWithoutTabs); } } // set TITLE - used in search String podcastTitle = syndFeed.getTitle(); podcast.setTitle(podcastTitle); // build the title that will appear in the URL when accessing a // podcast from the main application String titleInUrl = podcastTitle.trim().replaceAll("[^a-zA-Z0-9\\-\\s\\.]", ""); titleInUrl = titleInUrl.replaceAll("[\\-| |\\.]+", "-"); if (titleInUrl.length() > TITLE_IN_URL_MAX_LENGTH) { podcast.setTitleInUrl(titleInUrl.substring(0, TITLE_IN_URL_MAX_LENGTH)); } else { podcast.setTitleInUrl(titleInUrl); } // set author podcast.setAuthor(syndFeed.getAuthor()); // set COPYRIGHT podcast.setCopyright(syndFeed.getCopyright()); // set LINK podcast.setLink(syndFeed.getLink()); // set url link of the podcast's image when selecting the podcast in // the main application - mostly used through <a // href="urlOfImageToDisplay".... 
SyndImage podcastImage = syndFeed.getImage(); if (null != podcastImage) { if (podcastImage.getUrl() != null) { podcast.setUrlOfImageToDisplay(podcastImage.getUrl()); } else if (podcastImage.getLink() != null) { podcast.setUrlOfImageToDisplay(podcastImage.getLink()); } else { podcast.setUrlOfImageToDisplay(configBean.get("NO_IMAGE_LOCAL_URL")); } } else { podcast.setUrlOfImageToDisplay(configBean.get("NO_IMAGE_LOCAL_URL")); } podcast.setPublicationDate(null); // default value is null, if cannot // be set // set url media link of the last episode - this is used when // generating the ATOM and RSS feeds from the Start page for example for (SyndEntry entry : (List<SyndEntry>) syndFeed.getEntries()) { // get the list of enclosures List<SyndEnclosure> enclosures = (List<SyndEnclosure>) entry.getEnclosures(); if (null != enclosures) { // if in the enclosure list is a media type (either audio or // video), this will set as the link of the episode for (SyndEnclosure enclosure : enclosures) { if (null != enclosure) { podcast.setLastEpisodeMediaUrl(enclosure.getUrl()); break; } } } if (entry.getPublishedDate() == null) { LOG.warn( "PodURL[" + podcast.getUrl() + "] - " + "COULD NOT SET publication date for podcast, default date 08.01.1983 will be used "); } else { podcast.setPublicationDate(entry.getPublishedDate()); } // first episode in the list is last episode - normally (are // there any exceptions?? TODO -investigate) break; } } }
private List<Outlink> parseFeed(String url, byte[] content, Metadata parentMetadata) throws MalformedURLException { List<Outlink> links = new ArrayList<>(); SyndFeed feed = null; try (ByteArrayInputStream is = new ByteArrayInputStream(content)) { SyndFeedInput input = new SyndFeedInput(); feed = input.build(new InputSource(is)); } catch (Exception e) { LOG.error("Exception parsing feed from DOM {}", url); return links; } URL sURL = new URL(url); List<SyndEntry> entries = feed.getEntries(); for (SyndEntry entry : entries) { String targetURL = entry.getLink(); // build an absolute URL try { targetURL = URLUtil.resolveURL(sURL, targetURL).toExternalForm(); } catch (MalformedURLException e) { LOG.debug("MalformedURLException on {}", targetURL); continue; } targetURL = urlFilters.filter(sURL, parentMetadata, targetURL); if (StringUtils.isBlank(targetURL)) continue; Outlink newLink = new Outlink(targetURL); Metadata targetMD = metadataTransfer.getMetaForOutlink(targetURL, url, parentMetadata); newLink.setMetadata(targetMD); String title = entry.getTitle(); if (StringUtils.isNotBlank(title)) { targetMD.setValue("feed.title", title.trim()); } Date publishedDate = entry.getPublishedDate(); if (publishedDate != null) { // filter based on the published date if (filterHoursSincePub != -1) { Calendar rightNow = Calendar.getInstance(); rightNow.add(Calendar.HOUR, -filterHoursSincePub); if (publishedDate.before(rightNow.getTime())) { LOG.info( "{} has a published date {} which is more than {} hours old", targetURL, publishedDate.toString(), filterHoursSincePub); continue; } } targetMD.setValue("feed.publishedDate", publishedDate.toString()); } SyndContent description = entry.getDescription(); if (description != null && StringUtils.isNotBlank(description.getValue())) { targetMD.setValue("feed.description", description.getValue()); } links.add(newLink); } return links; }