Skip to content

Commit 7b2199e

Browse files
committed
update ard crawler
1 parent 75f36a5 commit 7b2199e

3 files changed

Lines changed: 10 additions & 10 deletions

File tree

src/main/java/de/mediathekview/mserver/crawler/ard/ArdCrawler.java

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@
1313
import org.apache.logging.log4j.LogManager;
1414
import org.apache.logging.log4j.Logger;
1515

16+
import java.util.Arrays;
1617
import java.util.Collection;
1718
import java.util.HashSet;
1819
import java.util.List;
@@ -40,8 +41,13 @@ public Sender getSender() {
4041
private Queue<CrawlerUrlDTO> createDayUrlsToCrawl() {
4142
final Queue<CrawlerUrlDTO> dayUrlsToCrawl = new ConcurrentLinkedQueue<>();
4243
final List<String> days = DateUtils.generateDaysToCrawl(crawlerConfig);
44+
// funk hat keine program übersicht
45+
final String[] CLIENTS_WITHOUT_FUNK =
46+
Arrays.stream(ArdConstants.CLIENTS)
47+
.filter(c -> !"funk".equals(c))
48+
.toArray(String[]::new);
4349
days.forEach( dateString -> {
44-
for (final String client : ArdConstants.CLIENTS) {
50+
for (final String client : CLIENTS_WITHOUT_FUNK) {
4551
final String url = String.format(ArdConstants.DAY_PAGE_URL, dateString, client);
4652
dayUrlsToCrawl.offer(new CrawlerUrlDTO(url));
4753
}
@@ -57,7 +63,6 @@ protected RecursiveTask<Set<Film>> createCrawlerTask() {
5763
forkJoinPool.submit(new ArdDayPageTask(this, createDayUrlsToCrawl()));
5864

5965
final Set<ArdFilmInfoDto> shows = dayTask.get();
60-
shows.clear();
6166
printMessage(
6267
ServerMessages.DEBUG_ALL_SENDUNG_FOLGEN_COUNT, getSender().getName(), shows.size());
6368

@@ -74,12 +79,8 @@ protected RecursiveTask<Set<Film>> createCrawlerTask() {
7479
assitUrls.addAll(forkJoinPool.submit(groupsToAsset).get());
7580
LOG.debug("sender group assit tasks: {}", assitUrls.size());
7681

77-
//test.add(new CrawlerUrlDTO("https://api.ardmediathek.de/page-gateway/widgets/swr/asset/Y3JpZDovL3N3ci5kZS8yNDEwMzY1MA?pageNumber=0&pageSize=48&embedded=true&seasoned=false&seasonNumber=&withAudiodescription=false&withOriginalWithSubtitle=false&withOriginalversion=false&single=false"));
78-
test.add(new CrawlerUrlDTO("https://api.ardmediathek.de/page-gateway/widgets/wdr/asset/Y3JpZDovL3dkci5kZS93ZXN0cG9s?pageNumber=0&pageSize=48&embedded=true&seasoned=false&seasonNumber=&withAudiodescription=false&withOriginalWithSubtitle=false&withOriginalversion=false&single=false"));
79-
8082
final ArdTopicPageTask topicTask =
8183
new ArdTopicPageTask(this, new ConcurrentLinkedQueue<>(assitUrls));
82-
//new ArdTopicPageTask(this, new ConcurrentLinkedQueue<>(test));
8384

8485
final int showsCountBefore = shows.size();
8586
shows.addAll(forkJoinPool.submit(topicTask).get());

src/main/java/de/mediathekview/mserver/crawler/ard/json/ArdFilmDeserializer.java

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -210,9 +210,9 @@ public List<ArdFilmDto> deserialize(
210210
date.orElse(null),
211211
duration.orElse(null),
212212
videoInfo.get()));
213-
if (widgets.size() > 1) {
214-
parseRelatedFilms(filmDto, widgets.get(1).getAsJsonObject());
215-
}
213+
//if (widgets.size() > 1) {
214+
//parseRelatedFilms(filmDto, widgets.get(1).getAsJsonObject());
215+
//}
216216
films.add(filmDto);
217217
}
218218
// OV - long term this should go into Film as "OV"

src/main/java/de/mediathekview/mserver/crawler/ard/tasks/ArdTaskBase.java

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -101,7 +101,6 @@ private Response executeRequest(final WebTarget aTarget) {
101101
}
102102

103103
return request
104-
.header("Accept-Encoding", "br, gzip, deflate, zstd")
105104
.header(HEADER_ACCEPT, APPLICATION_JSON)
106105
.header(HEADER_CONTENT_TYPE, APPLICATION_JSON)
107106
.get();

0 commit comments

Comments
 (0)