package eu.kanade.mangafeed.sources; import com.squareup.okhttp.Headers; import org.jsoup.Jsoup; import org.jsoup.nodes.Document; import org.jsoup.nodes.Element; import org.jsoup.select.Elements; import java.text.ParseException; import java.text.SimpleDateFormat; import java.util.ArrayList; import java.util.Date; import java.util.List; import java.util.Locale; import eu.kanade.mangafeed.data.caches.CacheManager; import eu.kanade.mangafeed.data.helpers.NetworkHelper; import eu.kanade.mangafeed.data.helpers.SourceManager; import eu.kanade.mangafeed.data.models.Chapter; import eu.kanade.mangafeed.data.models.Manga; import rx.Observable; public class Batoto extends Source { public static final String NAME = "Batoto (EN)"; public static final String BASE_URL = "www.bato.to"; public static final String INITIAL_UPDATE_URL = "http://bato.to/search_ajax?order_cond=views&order=desc&p="; public static final String INITIAL_SEARCH_URL = "http://bato.to/search_ajax?"; public Batoto(NetworkHelper networkService, CacheManager cacheManager) { super(networkService, cacheManager); } @Override public String getName() { return NAME; } @Override protected Headers.Builder headersBuilder() { Headers.Builder builder = super.headersBuilder(); builder.add("Cookie", "lang_option=English"); return builder; } public Observable> getGenres() { List genres = new ArrayList<>(38); genres.add("4-Koma"); genres.add("Action"); genres.add("Adventure"); genres.add("Award Winning"); genres.add("Comedy"); genres.add("Cooking"); genres.add("Doujinshi"); genres.add("Drama"); genres.add("Ecchi"); genres.add("Fantasy"); genres.add("Gender Bender"); genres.add("Harem"); genres.add("Historical"); genres.add("Horror"); genres.add("Josei"); genres.add("Martial Arts"); genres.add("Mecha"); genres.add("Medical"); genres.add("Music"); genres.add("Mystery"); genres.add("One Shot"); genres.add("Psychological"); genres.add("Romance"); genres.add("School Life"); genres.add("Sci-fi"); genres.add("Seinen"); genres.add("Shoujo"); genres.add("Shoujo Ai"); genres.add("Shounen"); genres.add("Shounen Ai"); genres.add("Slice of Life"); genres.add("Smut"); genres.add("Sports"); genres.add("Supernatural"); genres.add("Tragedy"); genres.add("Webtoon"); genres.add("Yaoi"); genres.add("Yuri"); return Observable.just(genres); } @Override public int getSource() { return SourceManager.BATOTO; } @Override protected String getUrlFromPageNumber(int page) { return INITIAL_UPDATE_URL + page; } @Override protected String getSearchUrl(String query, int page) { return INITIAL_SEARCH_URL + "name=" + query + "&p=" + page; } @Override protected String getMangaUrl(String defaultMangaUrl) { String mangaId = defaultMangaUrl.substring(defaultMangaUrl.lastIndexOf("r") + 1); return "http://bato.to/comic_pop?id=" + mangaId; } private List parseMangasFromHtml(String unparsedHtml) { if (unparsedHtml.contains("No (more) comics found!")) { return new ArrayList<>(); } Document parsedDocument = Jsoup.parse(unparsedHtml); List updatedMangaList = new ArrayList<>(); Elements updatedHtmlBlocks = parsedDocument.select("tr:not([id]):not([class])"); for (Element currentHtmlBlock : updatedHtmlBlocks) { Manga currentlyUpdatedManga = constructMangaFromHtmlBlock(currentHtmlBlock); updatedMangaList.add(currentlyUpdatedManga); } return updatedMangaList; } @Override public List parsePopularMangasFromHtml(String unparsedHtml) { return parseMangasFromHtml(unparsedHtml); } @Override protected List parseSearchFromHtml(String unparsedHtml) { return parseMangasFromHtml(unparsedHtml); } private Manga constructMangaFromHtmlBlock(Element htmlBlock) { Manga mangaFromHtmlBlock = new Manga(); Element urlElement = htmlBlock.select("a[href^=http://bato.to]").first(); Element nameElement = urlElement; Element updateElement = htmlBlock.select("td").get(5); mangaFromHtmlBlock.source = getSource(); if (urlElement != null) { String fieldUrl = urlElement.attr("href"); mangaFromHtmlBlock.url = fieldUrl; } if (nameElement != null) { String fieldName = nameElement.text().trim(); mangaFromHtmlBlock.title = fieldName; } if (updateElement != null) { long fieldUpdate = parseUpdateFromElement(updateElement); mangaFromHtmlBlock.last_update = fieldUpdate; } return mangaFromHtmlBlock; } private long parseUpdateFromElement(Element updateElement) { String updatedDateAsString = updateElement.text(); try { Date specificDate = new SimpleDateFormat("dd MMMMM yyyy - hh:mm a", Locale.ENGLISH).parse(updatedDateAsString); return specificDate.getTime(); } catch (ParseException e) { // Do Nothing. } return 0; } @Override protected Manga parseHtmlToManga(String mangaUrl, String unparsedHtml) { Document parsedDocument = Jsoup.parse(unparsedHtml); Elements artistElements = parsedDocument.select("a[href^=http://bato.to/search?artist_name]"); Element descriptionElement = parsedDocument.select("tr").get(5); Elements genreElements = parsedDocument.select("img[src=http://bato.to/forums/public/style_images/master/bullet_black.png]"); Element thumbnailUrlElement = parsedDocument.select("img[src^=http://img.bato.to/forums/uploads/]").first(); Manga newManga = new Manga(); newManga.url = mangaUrl; if (artistElements != null) { newManga.author = artistElements.get(0).text(); if (artistElements.size() > 1) { newManga.artist = artistElements.get(1).text(); } else { newManga.artist = newManga.author; } } if (descriptionElement != null) { String fieldDescription = descriptionElement.text().substring("Description:".length()).trim(); newManga.description = fieldDescription; } if (genreElements != null) { String fieldGenres = ""; for (int index = 0; index < genreElements.size(); index++) { String currentGenre = genreElements.get(index).attr("alt"); if (index < genreElements.size() - 1) { fieldGenres += currentGenre + ", "; } else { fieldGenres += currentGenre; } } newManga.genre = fieldGenres; } if (thumbnailUrlElement != null) { String fieldThumbnailUrl = thumbnailUrlElement.attr("src"); newManga.thumbnail_url = fieldThumbnailUrl; } boolean fieldCompleted = unparsedHtml.contains("Complete"); //TODO fix newManga.status = fieldCompleted + ""; newManga.initialized = true; return newManga; } @Override protected List parseHtmlToChapters(String unparsedHtml) { Document parsedDocument = Jsoup.parse(unparsedHtml); List chapterList = new ArrayList<>(); Elements chapterElements = parsedDocument.select("tr.row.lang_English.chapter_row"); for (Element chapterElement : chapterElements) { Chapter currentChapter = constructChapterFromHtmlBlock(chapterElement); chapterList.add(currentChapter); } //saveChaptersToDatabase(chapterList, mangaUrl); return chapterList; } private Chapter constructChapterFromHtmlBlock(Element chapterElement) { Chapter newChapter = Chapter.newChapter(); Element urlElement = chapterElement.select("a[href^=http://bato.to/read/").first(); Element nameElement = urlElement; Element dateElement = chapterElement.select("td").get(4); if (urlElement != null) { String fieldUrl = urlElement.attr("href"); newChapter.url = fieldUrl; } if (nameElement != null) { String fieldName = nameElement.text().trim(); newChapter.name = fieldName; } if (dateElement != null) { long fieldDate = parseDateFromElement(dateElement); newChapter.date_upload = fieldDate; } newChapter.date_fetch = new Date().getTime(); return newChapter; } private long parseDateFromElement(Element dateElement) { String dateAsString = dateElement.text(); try { Date specificDate = new SimpleDateFormat("dd MMMMM yyyy - hh:mm a", Locale.ENGLISH).parse(dateAsString); return specificDate.getTime(); } catch (ParseException e) { // Do Nothing. } return 0; } @Override protected List parseHtmlToPageUrls(String unparsedHtml) { Document parsedDocument = Jsoup.parse(unparsedHtml); List pageUrlList = new ArrayList<>(); Elements pageUrlElements = parsedDocument.getElementById("page_select").getElementsByTag("option"); for (Element pageUrlElement : pageUrlElements) { pageUrlList.add(pageUrlElement.attr("value")); } return pageUrlList; } @Override protected String parseHtmlToImageUrl(String unparsedHtml) { int beginIndex = unparsedHtml.indexOf("", beginIndex); String trimmedHtml = unparsedHtml.substring(beginIndex, endIndex); Document parsedDocument = Jsoup.parse(trimmedHtml); Element imageElement = parsedDocument.getElementById("comic_page"); return imageElement.attr("src"); } }