2015-10-05 18:24:29 -04:00
|
|
|
package eu.kanade.mangafeed.sources;
|
|
|
|
|
|
|
|
import com.squareup.okhttp.Headers;
|
|
|
|
|
|
|
|
import org.jsoup.Jsoup;
|
|
|
|
import org.jsoup.nodes.Document;
|
|
|
|
import org.jsoup.nodes.Element;
|
|
|
|
import org.jsoup.select.Elements;
|
|
|
|
|
2015-10-06 13:44:30 -04:00
|
|
|
import java.text.ParseException;
|
|
|
|
import java.text.SimpleDateFormat;
|
2015-10-05 18:24:29 -04:00
|
|
|
import java.util.ArrayList;
|
2015-10-06 13:44:30 -04:00
|
|
|
import java.util.Date;
|
2015-10-05 18:24:29 -04:00
|
|
|
import java.util.List;
|
2015-10-06 13:44:30 -04:00
|
|
|
import java.util.Locale;
|
2015-10-05 18:24:29 -04:00
|
|
|
import java.util.concurrent.atomic.AtomicInteger;
|
|
|
|
|
|
|
|
import eu.kanade.mangafeed.data.caches.CacheManager;
|
|
|
|
import eu.kanade.mangafeed.data.helpers.NetworkHelper;
|
2015-10-08 07:15:29 -04:00
|
|
|
import eu.kanade.mangafeed.data.helpers.SourceManager;
|
2015-10-06 13:44:30 -04:00
|
|
|
import eu.kanade.mangafeed.data.models.Chapter;
|
|
|
|
import eu.kanade.mangafeed.data.models.Manga;
|
2015-10-05 18:24:29 -04:00
|
|
|
import rx.Observable;
|
|
|
|
import rx.schedulers.Schedulers;
|
|
|
|
|
2015-10-08 07:15:29 -04:00
|
|
|
public class Batoto extends Source {
|
2015-10-05 18:24:29 -04:00
|
|
|
|
|
|
|
public static final String NAME = "Batoto (EN)";
|
|
|
|
public static final String BASE_URL = "www.bato.to";
|
2015-10-08 07:15:29 -04:00
|
|
|
public static final String INITIAL_UPDATE_URL = "http://bato.to/search_ajax?order_cond=views&order=desc&p=1";
|
2015-10-05 18:24:29 -04:00
|
|
|
|
|
|
|
private static final Headers REQUEST_HEADERS = constructRequestHeaders();
|
|
|
|
private static Headers constructRequestHeaders() {
|
|
|
|
Headers.Builder headerBuilder = new Headers.Builder();
|
|
|
|
headerBuilder.add("User-Agent", "Mozilla/5.0 (Windows NT 6.3; WOW64)");
|
|
|
|
headerBuilder.add("Cookie", "lang_option=English");
|
|
|
|
|
|
|
|
return headerBuilder.build();
|
|
|
|
}
|
|
|
|
|
|
|
|
private NetworkHelper mNetworkService;
|
|
|
|
private CacheManager mCacheManager;
|
|
|
|
|
|
|
|
public Batoto(NetworkHelper networkService, CacheManager cacheManager) {
|
|
|
|
mNetworkService = networkService;
|
|
|
|
mCacheManager = cacheManager;
|
|
|
|
}
|
|
|
|
|
|
|
|
public Observable<String> getName() {
|
|
|
|
return Observable.just(NAME);
|
|
|
|
}
|
|
|
|
|
|
|
|
public Observable<String> getBaseUrl() {
|
|
|
|
return Observable.just(BASE_URL);
|
|
|
|
}
|
|
|
|
|
|
|
|
public Observable<String> getInitialUpdateUrl() {
|
|
|
|
return Observable.just(INITIAL_UPDATE_URL);
|
|
|
|
}
|
|
|
|
|
|
|
|
public Observable<List<String>> getGenres() {
|
|
|
|
List<String> genres = new ArrayList<String>(38);
|
|
|
|
|
|
|
|
genres.add("4-Koma");
|
|
|
|
genres.add("Action");
|
|
|
|
genres.add("Adventure");
|
|
|
|
genres.add("Award Winning");
|
|
|
|
genres.add("Comedy");
|
|
|
|
genres.add("Cooking");
|
|
|
|
genres.add("Doujinshi");
|
|
|
|
genres.add("Drama");
|
|
|
|
genres.add("Ecchi");
|
|
|
|
genres.add("Fantasy");
|
|
|
|
genres.add("Gender Bender");
|
|
|
|
genres.add("Harem");
|
|
|
|
genres.add("Historical");
|
|
|
|
genres.add("Horror");
|
|
|
|
genres.add("Josei");
|
|
|
|
genres.add("Martial Arts");
|
|
|
|
genres.add("Mecha");
|
|
|
|
genres.add("Medical");
|
|
|
|
genres.add("Music");
|
|
|
|
genres.add("Mystery");
|
|
|
|
genres.add("One Shot");
|
|
|
|
genres.add("Psychological");
|
|
|
|
genres.add("Romance");
|
|
|
|
genres.add("School Life");
|
|
|
|
genres.add("Sci-fi");
|
|
|
|
genres.add("Seinen");
|
|
|
|
genres.add("Shoujo");
|
|
|
|
genres.add("Shoujo Ai");
|
|
|
|
genres.add("Shounen");
|
|
|
|
genres.add("Shounen Ai");
|
|
|
|
genres.add("Slice of Life");
|
|
|
|
genres.add("Smut");
|
|
|
|
genres.add("Sports");
|
|
|
|
genres.add("Supernatural");
|
|
|
|
genres.add("Tragedy");
|
|
|
|
genres.add("Webtoon");
|
|
|
|
genres.add("Yaoi");
|
|
|
|
genres.add("Yuri");
|
|
|
|
|
|
|
|
return Observable.just(genres);
|
|
|
|
}
|
|
|
|
|
2015-10-08 07:15:29 -04:00
|
|
|
public String getUrlFromPageNumber(int page) {
|
|
|
|
if (page == 1)
|
|
|
|
return INITIAL_UPDATE_URL;
|
|
|
|
|
|
|
|
return INITIAL_UPDATE_URL.substring(0, INITIAL_UPDATE_URL.length() - 1) + page;
|
|
|
|
}
|
|
|
|
|
|
|
|
public Observable<List<Manga>> pullPopularMangasFromNetwork(int page) {
|
|
|
|
String url = getUrlFromPageNumber(page);
|
2015-10-05 18:24:29 -04:00
|
|
|
return mNetworkService
|
2015-10-08 07:15:29 -04:00
|
|
|
.getStringResponse(url, mNetworkService.NULL_CACHE_CONTROL, REQUEST_HEADERS)
|
2015-10-09 07:38:28 -04:00
|
|
|
.flatMap(response -> Observable.just(parsePopularMangasFromHtml(response)));
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
|
2015-10-09 07:38:28 -04:00
|
|
|
private List<Manga> parsePopularMangasFromHtml(String unparsedHtml) {
|
2015-10-05 18:24:29 -04:00
|
|
|
Document parsedDocument = Jsoup.parse(unparsedHtml);
|
|
|
|
|
2015-10-08 07:15:29 -04:00
|
|
|
List<Manga> updatedMangaList = new ArrayList<>();
|
2015-10-05 18:24:29 -04:00
|
|
|
|
|
|
|
Elements updatedHtmlBlocks = parsedDocument.select("tr:not([id]):not([class])");
|
|
|
|
for (Element currentHtmlBlock : updatedHtmlBlocks) {
|
|
|
|
Manga currentlyUpdatedManga = constructMangaFromHtmlBlock(currentHtmlBlock);
|
|
|
|
|
|
|
|
updatedMangaList.add(currentlyUpdatedManga);
|
|
|
|
}
|
|
|
|
|
|
|
|
return updatedMangaList;
|
|
|
|
}
|
|
|
|
|
|
|
|
private Manga constructMangaFromHtmlBlock(Element htmlBlock) {
|
2015-10-08 07:15:29 -04:00
|
|
|
Manga mangaFromHtmlBlock = new Manga();
|
2015-10-05 18:24:29 -04:00
|
|
|
|
|
|
|
Element urlElement = htmlBlock.select("a[href^=http://bato.to]").first();
|
|
|
|
Element nameElement = urlElement;
|
|
|
|
Element updateElement = htmlBlock.select("td").get(5);
|
|
|
|
|
2015-10-08 07:15:29 -04:00
|
|
|
mangaFromHtmlBlock.source = SourceManager.BATOTO;
|
|
|
|
|
2015-10-05 18:24:29 -04:00
|
|
|
if (urlElement != null) {
|
|
|
|
String fieldUrl = urlElement.attr("href");
|
2015-10-08 07:15:29 -04:00
|
|
|
mangaFromHtmlBlock.url = fieldUrl;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
if (nameElement != null) {
|
|
|
|
String fieldName = nameElement.text().trim();
|
2015-10-08 07:15:29 -04:00
|
|
|
mangaFromHtmlBlock.title = fieldName;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
if (updateElement != null) {
|
|
|
|
long fieldUpdate = parseUpdateFromElement(updateElement);
|
2015-10-08 07:15:29 -04:00
|
|
|
mangaFromHtmlBlock.last_update = fieldUpdate;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
return mangaFromHtmlBlock;
|
|
|
|
}
|
|
|
|
|
|
|
|
private long parseUpdateFromElement(Element updateElement) {
|
|
|
|
String updatedDateAsString = updateElement.text();
|
|
|
|
|
|
|
|
try {
|
|
|
|
Date specificDate = new SimpleDateFormat("dd MMMMM yyyy - hh:mm a", Locale.ENGLISH).parse(updatedDateAsString);
|
|
|
|
|
|
|
|
return specificDate.getTime();
|
|
|
|
} catch (ParseException e) {
|
|
|
|
// Do Nothing.
|
|
|
|
}
|
|
|
|
|
2015-10-08 07:15:29 -04:00
|
|
|
return 0;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
|
2015-10-08 07:15:29 -04:00
|
|
|
/*
|
|
|
|
|
2015-10-05 18:24:29 -04:00
|
|
|
private void updateLibraryInDatabase(List<Manga> mangaList) {
|
|
|
|
mQueryManager.beginLibraryTransaction();
|
|
|
|
try {
|
|
|
|
List<Manga> mangaToRemove = new ArrayList<>();
|
|
|
|
for (Manga currentManga : mangaList) {
|
|
|
|
Manga existingManga = mQueryManager.retrieveManga(NAME, currentManga.getName())
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
|
|
|
|
if (existingManga != null) {
|
|
|
|
existingManga.setUpdated(currentManga.getUpdated());
|
|
|
|
existingManga.setUpdateCount(currentManga.getUpdateCount());
|
|
|
|
|
|
|
|
|
|
|
|
mQueryManager.createManga(existingManga)
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
} else {
|
|
|
|
mangaToRemove.add(currentManga);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
mangaList.removeAll(mangaToRemove);
|
|
|
|
|
|
|
|
mQueryManager.setLibraryTransactionSuccessful();
|
|
|
|
} finally {
|
|
|
|
mQueryManager.endLibraryTransaction();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private String findNextUrlFromParsedDocument(String requestUrl, String unparsedHtml) {
|
|
|
|
if (!unparsedHtml.contains("No (more) comics found!")) {
|
|
|
|
requestUrl = requestUrl.replace("http://bato.to/search_ajax?order_cond=update&order=desc&p=", "");
|
|
|
|
|
|
|
|
return "http://bato.to/search_ajax?order_cond=update&order=desc&p=" + (Integer.valueOf(requestUrl) + 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
return DefaultFactory.UpdatePageMarker.DEFAULT_NEXT_PAGE_URL;
|
|
|
|
}
|
|
|
|
|
|
|
|
public Observable<Manga> pullMangaFromNetwork(final String mangaUrl) {
|
|
|
|
String mangaId = mangaUrl.substring(mangaUrl.lastIndexOf("r") + 1);
|
|
|
|
|
|
|
|
return mNetworkService
|
|
|
|
.getResponse("http://bato.to/comic_pop?id=" + mangaId, NetworkModule.NULL_CACHE_CONTROL, REQUEST_HEADERS)
|
|
|
|
.flatMap(new Func1<Response, Observable<String>>() {
|
|
|
|
@Override
|
|
|
|
public Observable<String> call(Response response) {
|
|
|
|
return mNetworkService.mapResponseToString(response);
|
|
|
|
}
|
|
|
|
})
|
|
|
|
.flatMap(new Func1<String, Observable<Manga>>() {
|
|
|
|
@Override
|
|
|
|
public Observable<Manga> call(String unparsedHtml) {
|
|
|
|
return Observable.just(parseHtmlToManga(mangaUrl, unparsedHtml));
|
|
|
|
}
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
private Manga parseHtmlToManga(String mangaUrl, String unparsedHtml) {
|
|
|
|
Document parsedDocument = Jsoup.parse(unparsedHtml);
|
|
|
|
|
|
|
|
Element artistElement = parsedDocument.select("a[href^=http://bato.to/search?artist_name]").first();
|
|
|
|
Element descriptionElement = parsedDocument.select("tr").get(5);
|
|
|
|
Elements genreElements = parsedDocument.select("img[src=http://bato.to/forums/public/style_images/master/bullet_black.png]");
|
|
|
|
Element thumbnailUrlElement = parsedDocument.select("img[src^=http://img.batoto.net/forums/uploads/]").first();
|
|
|
|
|
|
|
|
StringBuilder selection = new StringBuilder();
|
|
|
|
List<String> selectionArgs = new ArrayList<String>();
|
|
|
|
|
|
|
|
selection.append(LibraryContract.Manga.COLUMN_SOURCE + " = ?");
|
|
|
|
selectionArgs.add(NAME);
|
|
|
|
selection.append(" AND ").append(LibraryContract.Manga.COLUMN_URL + " = ?");
|
|
|
|
selectionArgs.add(mangaUrl);
|
|
|
|
|
|
|
|
Manga newManga = mQueryManager.retrieveMangaAsCursor(
|
|
|
|
null,
|
|
|
|
selection.toString(),
|
|
|
|
selectionArgs.toArray(new String[selectionArgs.size()]),
|
|
|
|
null,
|
|
|
|
null,
|
|
|
|
null,
|
|
|
|
"1"
|
|
|
|
)
|
|
|
|
.map(new Func1<Cursor, Manga>() {
|
|
|
|
@Override
|
|
|
|
public Manga call(Cursor cursor) {
|
|
|
|
return DatabaseUtils.toObject(cursor, Manga.class);
|
|
|
|
}
|
|
|
|
})
|
|
|
|
.filter(new Func1<Manga, Boolean>() {
|
|
|
|
@Override
|
|
|
|
public Boolean call(Manga manga) {
|
|
|
|
return manga != null;
|
|
|
|
}
|
|
|
|
})
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
|
|
|
|
if (artistElement != null) {
|
|
|
|
String fieldArtist = artistElement.text();
|
|
|
|
newManga.setArtist(fieldArtist);
|
|
|
|
newManga.setAuthor(fieldArtist);
|
|
|
|
}
|
|
|
|
if (descriptionElement != null) {
|
|
|
|
String fieldDescription = descriptionElement.text().substring("Description:".length()).trim();
|
|
|
|
newManga.setDescription(fieldDescription);
|
|
|
|
}
|
|
|
|
if (genreElements != null) {
|
|
|
|
String fieldGenres = "";
|
|
|
|
for (int index = 0; index < genreElements.size(); index++) {
|
|
|
|
String currentGenre = genreElements.get(index).attr("alt");
|
|
|
|
|
|
|
|
if (index < genreElements.size() - 1) {
|
|
|
|
fieldGenres += currentGenre + ", ";
|
|
|
|
} else {
|
|
|
|
fieldGenres += currentGenre;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
newManga.setGenre(fieldGenres);
|
|
|
|
}
|
|
|
|
if (thumbnailUrlElement != null) {
|
|
|
|
String fieldThumbnailUrl = thumbnailUrlElement.attr("src");
|
|
|
|
newManga.setThumbnailUrl(fieldThumbnailUrl);
|
|
|
|
}
|
|
|
|
|
|
|
|
boolean fieldCompleted = unparsedHtml.contains("<td>Complete</td>");
|
|
|
|
newManga.setCompleted(fieldCompleted);
|
|
|
|
|
|
|
|
|
|
|
|
newManga.setInitialized(true);
|
|
|
|
|
|
|
|
mQueryManager.createManga(newManga)
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
|
|
|
|
return newManga;
|
|
|
|
}
|
2015-10-06 13:44:30 -04:00
|
|
|
*/
|
2015-10-05 18:24:29 -04:00
|
|
|
|
2015-10-06 13:44:30 -04:00
|
|
|
public Observable<List<Chapter>> pullChaptersFromNetwork(String mangaUrl) {
|
2015-10-05 18:24:29 -04:00
|
|
|
return mNetworkService
|
2015-10-06 13:44:30 -04:00
|
|
|
.getStringResponse(mangaUrl, mNetworkService.NULL_CACHE_CONTROL, REQUEST_HEADERS)
|
|
|
|
.flatMap(unparsedHtml ->
|
|
|
|
Observable.just(parseHtmlToChapters(unparsedHtml)));
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
|
2015-10-06 13:44:30 -04:00
|
|
|
private List<Chapter> parseHtmlToChapters(String unparsedHtml) {
|
2015-10-05 18:24:29 -04:00
|
|
|
Document parsedDocument = Jsoup.parse(unparsedHtml);
|
|
|
|
|
|
|
|
List<Chapter> chapterList = new ArrayList<Chapter>();
|
|
|
|
|
|
|
|
Elements chapterElements = parsedDocument.select("tr.row.lang_English.chapter_row");
|
|
|
|
for (Element chapterElement : chapterElements) {
|
|
|
|
Chapter currentChapter = constructChapterFromHtmlBlock(chapterElement);
|
2015-10-06 13:44:30 -04:00
|
|
|
System.out.println(currentChapter.name);
|
2015-10-05 18:24:29 -04:00
|
|
|
chapterList.add(currentChapter);
|
|
|
|
}
|
|
|
|
|
2015-10-06 13:44:30 -04:00
|
|
|
//saveChaptersToDatabase(chapterList, mangaUrl);
|
|
|
|
|
2015-10-05 18:24:29 -04:00
|
|
|
return chapterList;
|
2015-10-06 13:44:30 -04:00
|
|
|
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
private Chapter constructChapterFromHtmlBlock(Element chapterElement) {
|
2015-10-06 13:44:30 -04:00
|
|
|
Chapter newChapter = Chapter.newChapter();
|
2015-10-05 18:24:29 -04:00
|
|
|
|
|
|
|
Element urlElement = chapterElement.select("a[href^=http://bato.to/read/").first();
|
|
|
|
Element nameElement = urlElement;
|
|
|
|
Element dateElement = chapterElement.select("td").get(4);
|
|
|
|
|
|
|
|
if (urlElement != null) {
|
|
|
|
String fieldUrl = urlElement.attr("href");
|
2015-10-06 13:44:30 -04:00
|
|
|
newChapter.url = fieldUrl;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
if (nameElement != null) {
|
|
|
|
String fieldName = nameElement.text().trim();
|
2015-10-06 13:44:30 -04:00
|
|
|
newChapter.name = fieldName;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
if (dateElement != null) {
|
|
|
|
long fieldDate = parseDateFromElement(dateElement);
|
2015-10-06 13:44:30 -04:00
|
|
|
newChapter.date_upload = fieldDate;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
2015-10-06 13:44:30 -04:00
|
|
|
newChapter.date_fetch = new Date().getTime();
|
2015-10-05 18:24:29 -04:00
|
|
|
|
|
|
|
return newChapter;
|
|
|
|
}
|
|
|
|
|
|
|
|
private long parseDateFromElement(Element dateElement) {
|
|
|
|
String dateAsString = dateElement.text();
|
|
|
|
|
|
|
|
try {
|
|
|
|
Date specificDate = new SimpleDateFormat("dd MMMMM yyyy - hh:mm a", Locale.ENGLISH).parse(dateAsString);
|
|
|
|
|
|
|
|
return specificDate.getTime();
|
|
|
|
} catch (ParseException e) {
|
|
|
|
// Do Nothing.
|
|
|
|
}
|
|
|
|
|
2015-10-06 13:44:30 -04:00
|
|
|
return 0;
|
2015-10-05 18:24:29 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
public Observable<String> pullImageUrlsFromNetwork(final String chapterUrl) {
|
|
|
|
final List<String> temporaryCachedImageUrls = new ArrayList<>();
|
|
|
|
|
|
|
|
return mCacheManager.getImageUrlsFromDiskCache(chapterUrl)
|
|
|
|
.onErrorResumeNext(throwable -> {
|
2015-10-09 07:38:28 -04:00
|
|
|
return getImageUrlsFromNetwork(chapterUrl)
|
2015-10-05 18:24:29 -04:00
|
|
|
.doOnNext(imageUrl -> temporaryCachedImageUrls.add(imageUrl))
|
|
|
|
.doOnCompleted(mCacheManager.putImageUrlsToDiskCache(chapterUrl, temporaryCachedImageUrls));
|
|
|
|
})
|
|
|
|
.onBackpressureBuffer();
|
|
|
|
}
|
|
|
|
|
2015-10-09 07:38:28 -04:00
|
|
|
public Observable<String> getImageUrlsFromNetwork(final String chapterUrl) {
|
|
|
|
return mNetworkService
|
|
|
|
.getStringResponse(chapterUrl, mNetworkService.NULL_CACHE_CONTROL, REQUEST_HEADERS)
|
|
|
|
.flatMap(unparsedHtml -> Observable.from(parseHtmlToPageUrls(unparsedHtml)))
|
|
|
|
.buffer(3)
|
|
|
|
.concatMap(batchedPageUrls -> {
|
|
|
|
List<Observable<String>> imageUrlObservables = new ArrayList<>();
|
|
|
|
for (String pageUrl : batchedPageUrls) {
|
|
|
|
Observable<String> temporaryObservable = mNetworkService
|
|
|
|
.getStringResponse(pageUrl, mNetworkService.NULL_CACHE_CONTROL, REQUEST_HEADERS)
|
|
|
|
.flatMap(unparsedHtml -> Observable.just(parseHtmlToImageUrl(unparsedHtml)))
|
|
|
|
.subscribeOn(Schedulers.io());
|
|
|
|
|
|
|
|
imageUrlObservables.add(temporaryObservable);
|
|
|
|
}
|
|
|
|
|
|
|
|
return Observable.merge(imageUrlObservables);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2015-10-05 18:24:29 -04:00
|
|
|
private List<String> parseHtmlToPageUrls(String unparsedHtml) {
|
|
|
|
Document parsedDocument = Jsoup.parse(unparsedHtml);
|
|
|
|
|
|
|
|
List<String> pageUrlList = new ArrayList<String>();
|
|
|
|
|
|
|
|
Elements pageUrlElements = parsedDocument.getElementById("page_select").getElementsByTag("option");
|
|
|
|
for (Element pageUrlElement : pageUrlElements) {
|
|
|
|
pageUrlList.add(pageUrlElement.attr("value"));
|
|
|
|
}
|
|
|
|
|
|
|
|
return pageUrlList;
|
|
|
|
}
|
|
|
|
|
|
|
|
private String parseHtmlToImageUrl(String unparsedHtml) {
|
|
|
|
int beginIndex = unparsedHtml.indexOf("<img id=\"comic_page\"");
|
|
|
|
int endIndex = unparsedHtml.indexOf("</a>", beginIndex);
|
|
|
|
String trimmedHtml = unparsedHtml.substring(beginIndex, endIndex);
|
|
|
|
|
|
|
|
Document parsedDocument = Jsoup.parse(trimmedHtml);
|
|
|
|
|
|
|
|
Element imageElement = parsedDocument.getElementById("comic_page");
|
|
|
|
|
|
|
|
return imageElement.attr("src");
|
|
|
|
}
|
|
|
|
|
|
|
|
private static String INITIAL_DATABASE_URL_1 = "http://bato.to/comic_pop?id=1";
|
|
|
|
private static String INITIAL_DATABASE_URL_2 = "http://bato.to/search_ajax?order_cond=views&order=desc&p=1";
|
|
|
|
|
|
|
|
private static AtomicInteger mCounter = new AtomicInteger(1);
|
|
|
|
|
|
|
|
/*
|
|
|
|
public Observable<String> recursivelyConstructDatabase(final String url) {
|
|
|
|
return mNetworkService
|
|
|
|
.getResponse(url, NetworkUtil.NULL_CACHE_CONTROL, REQUEST_HEADERS)
|
|
|
|
.flatMap(new Func1<Response, Observable<String>>() {
|
|
|
|
@Override
|
|
|
|
public Observable<String> call(Response response) {
|
|
|
|
return mNetworkService.mapResponseToString(response);
|
|
|
|
}
|
|
|
|
})
|
|
|
|
.flatMap(new Func1<String, Observable<String>>() {
|
|
|
|
@Override
|
|
|
|
public Observable<String> call(String unparsedHtml) {
|
|
|
|
return Observable.just(parseEnglish_Batoto(unparsedHtml));
|
|
|
|
}
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
private String parseEnglish_Batoto(String unparsedHtml) {
|
|
|
|
if (!unparsedHtml.equals("wtf?")) {
|
|
|
|
Document parsedDocument = Jsoup.parse(unparsedHtml);
|
|
|
|
|
|
|
|
Manga newManga = new Manga();
|
|
|
|
|
|
|
|
Element temporaryElementOne = parsedDocument.getElementsByTag("a").first();
|
|
|
|
Element temporaryElementTwo = parsedDocument.select("a[href^=http://bato.to/forums/forum/]").first();
|
|
|
|
Element temporaryElementThree = parsedDocument.select("img[src^=http://img.batoto.net/forums/uploads/]").first();
|
|
|
|
Elements temporaryElementsFour = parsedDocument.select("img[src=http://bato.to/forums/public/style_images/master/bullet_black.png]");
|
|
|
|
|
|
|
|
String fieldSource = English_Batoto.NAME;
|
|
|
|
newManga.setSource(fieldSource);
|
|
|
|
|
|
|
|
String fieldUrl = "http://bato.to" + temporaryElementOne.attr("href");
|
|
|
|
newManga.setUrl(fieldUrl);
|
|
|
|
|
|
|
|
String fieldName = temporaryElementTwo.text();
|
|
|
|
int startIndex = "Go to ".length();
|
|
|
|
int endIndex = fieldName.lastIndexOf(" Forums!");
|
|
|
|
newManga.setName(fieldName.substring(startIndex, endIndex));
|
|
|
|
|
|
|
|
String fieldThumbnailUrl = temporaryElementThree.attr("src");
|
|
|
|
newManga.setThumbnailUrl(fieldThumbnailUrl);
|
|
|
|
|
|
|
|
String fieldGenres = "";
|
|
|
|
for (int index = 0; index < temporaryElementsFour.size(); index++) {
|
|
|
|
String currentGenre = temporaryElementsFour.get(index).attr("alt");
|
|
|
|
|
|
|
|
if (index < temporaryElementsFour.size() - 1) {
|
|
|
|
fieldGenres += currentGenre + ", ";
|
|
|
|
} else {
|
|
|
|
fieldGenres += currentGenre;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
newManga.setGenre(fieldGenres);
|
|
|
|
|
|
|
|
boolean fieldIsCompleted = unparsedHtml.contains("<td>Complete</td>");
|
|
|
|
newManga.setCompleted(fieldIsCompleted);
|
|
|
|
|
|
|
|
mQueryManager.createManga(newManga)
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
}
|
|
|
|
|
|
|
|
return "http://bato.to/comic_pop?id=" + mCounter.incrementAndGet();
|
|
|
|
}
|
|
|
|
|
|
|
|
private String parseEnglish_Batoto_Views(String unparsedHtml) {
|
|
|
|
if (!unparsedHtml.contains("No (more) comics found!")) {
|
|
|
|
Document parsedDocument = Jsoup.parse(unparsedHtml);
|
|
|
|
|
|
|
|
List<Pair<String, ContentValues>> updateList = new ArrayList<Pair<String, ContentValues>>();
|
|
|
|
Elements mangaElements = parsedDocument.select("tr:not([id]):not([class])");
|
|
|
|
for (Element mangaElement : mangaElements) {
|
|
|
|
Element temporaryElementOne = mangaElement.select("a[href^=http://bato.to]").first();
|
|
|
|
Element temporaryElementTwo = mangaElement.select("td").get(3);
|
|
|
|
String temporaryString = temporaryElementTwo.text();
|
|
|
|
|
|
|
|
String fieldUrl = temporaryElementOne.attr("href");
|
|
|
|
|
|
|
|
String fieldView = null;
|
|
|
|
if (temporaryString.contains("m")) {
|
|
|
|
temporaryString = temporaryString.replace("m", "");
|
|
|
|
|
|
|
|
int viewsAsNumber = (int)(Double.valueOf(temporaryString) * 1000000);
|
|
|
|
fieldView = String.valueOf(viewsAsNumber);
|
|
|
|
} else if (temporaryString.contains("k")) {
|
|
|
|
temporaryString = temporaryString.replace("k", "");
|
|
|
|
|
|
|
|
int viewsAsNumber = (int)(Double.valueOf(temporaryString) * 1000);
|
|
|
|
fieldView = String.valueOf(viewsAsNumber);
|
|
|
|
} else {
|
|
|
|
int viewsAsNumber = (int)(Double.valueOf(temporaryString) * 1);
|
|
|
|
fieldView = String.valueOf(viewsAsNumber);
|
|
|
|
}
|
|
|
|
|
|
|
|
ContentValues fieldRanking = new ContentValues(1);
|
|
|
|
fieldRanking.put(LibraryContract.Manga.COLUMN_RANK, fieldView);
|
|
|
|
|
|
|
|
updateList.add(Pair.create(fieldUrl, fieldRanking));
|
|
|
|
}
|
|
|
|
|
|
|
|
mQueryManager.beginLibraryTransaction();
|
|
|
|
try {
|
|
|
|
for (Pair<String, ContentValues> currentUpdate : updateList) {
|
|
|
|
mQueryManager.updateManga(currentUpdate.second, LibraryContract.Manga.COLUMN_URL + " = ?", new String[]{currentUpdate.first})
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
}
|
|
|
|
|
|
|
|
mQueryManager.setLibraryTransactionSuccessful();
|
|
|
|
} finally {
|
|
|
|
mQueryManager.endLibraryTransaction();
|
|
|
|
}
|
|
|
|
|
|
|
|
return "http://bato.to/search_ajax?order_cond=views&order=desc&p=" + mCounter.incrementAndGet();
|
|
|
|
}
|
|
|
|
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
|
|
|
public void reorderEnglish_Batoto_Rankings() {
|
|
|
|
List<Manga> mangaList = mQueryManager.retrieveAllMangaAsStream(
|
|
|
|
null,
|
|
|
|
LibraryContract.Manga.COLUMN_SOURCE + " = ?",
|
|
|
|
new String[]{NAME},
|
|
|
|
null,
|
|
|
|
null,
|
|
|
|
LibraryContract.Manga.COLUMN_RANK + " DESC",
|
|
|
|
null
|
|
|
|
)
|
|
|
|
.toList()
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
|
|
|
|
for (int index = 0; index < mangaList.size(); index++) {
|
|
|
|
mangaList.get(index).setRank(index + 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
mQueryManager.beginLibraryTransaction();
|
|
|
|
try {
|
|
|
|
for (Manga currentManga : mangaList) {
|
|
|
|
mQueryManager.createManga(currentManga)
|
|
|
|
.toBlocking()
|
|
|
|
.single();
|
|
|
|
}
|
|
|
|
mQueryManager.setLibraryTransactionSuccessful();
|
|
|
|
} finally {
|
|
|
|
mQueryManager.endLibraryTransaction();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
*/
|
|
|
|
}
|
|
|
|
|