package eu.kanade.mangafeed.util;

import java.util.ArrayList;
import java.util.List;
import java.util.Locale;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import eu.kanade.mangafeed.data.database.models.Chapter;
import eu.kanade.mangafeed.data.database.models.Manga;

/**
 * Heuristics for deriving a chapter number from a chapter's display name.
 */
public class ChapterRecognition {

    /**
     * A number preceded by "ch" and at most one arbitrary character,
     * e.g. "ch12", "ch.12" or "ch-12,5". The number is captured in group 1.
     */
    private static final Pattern p1 = Pattern.compile("ch.?(\\d+[\\.,]?\\d*)");

    /** Any run of digits, optionally containing a single '.' or ',' separator. */
    private static final Pattern p2 = Pattern.compile("(\\d+[\\.,]?\\d*)");

    /**
     * Tries to fill in {@code chapter.chapter_number} from the chapter's name.
     *
     * <p>Does nothing when the chapter number is already non-zero. Otherwise the
     * following strategies are tried in order, stopping at the first that succeeds:
     * <ol>
     *   <li>a number introduced by a "ch" token;</li>
     *   <li>the only distinct number found in the name;</li>
     *   <li>the only distinct number found in the name once the leading part it
     *       shares with the manga title has been removed.</li>
     * </ol>
     * If none of them succeeds the chapter number is left untouched.
     *
     * @param chapter the chapter to update; its {@code name} is read and its
     *                {@code chapter_number} may be written
     * @param manga   the manga the chapter belongs to; its {@code title} is read
     */
    public static void parseChapterNumber(Chapter chapter, Manga manga) {
        if (chapter.chapter_number != 0) {
            return;
        }

        // Remove spaces and convert to lower case
        String name = replaceIrrelevantCharacters(chapter.name);

        // Safest option, the chapter has a token prepended
        Matcher matcher = p1.matcher(name);
        if (matcher.find()) {
            // The pattern accepts ',' as a separator, which Float.parseFloat rejects,
            // so the captured text has to be normalised before parsing.
            chapter.chapter_number = parseNumber(matcher.group(1));
            return;
        }

        // If there's only one number, use it
        List<Float> occurrences = getAllOccurrences(p2.matcher(name));
        if (occurrences.size() == 1) {
            chapter.chapter_number = occurrences.get(0);
            return;
        }

        // Try to remove the manga name from the chapter, and try again
        String mangaName = replaceIrrelevantCharacters(manga.title);
        String nameWithoutManga = difference(mangaName, name);
        if (!nameWithoutManga.isEmpty()) {
            occurrences = getAllOccurrences(p2.matcher(nameWithoutManga));
            if (occurrences.size() == 1) {
                chapter.chapter_number = occurrences.get(0);
                return;
            }
        }

        // TODO more checks (maybe levenshtein?)
    }

    /**
     * Collects the distinct numeric values of every match produced by the matcher.
     *
     * <p>A ',' in the matched text is treated as a decimal separator. Matches that
     * still cannot be parsed as a float are skipped.
     *
     * @param matcher the matcher to exhaust; its whole match (group 0) is parsed
     * @return the distinct values in order of first appearance, possibly empty
     */
    public static List<Float> getAllOccurrences(Matcher matcher) {
        List<Float> occurrences = new ArrayList<>();
        while (matcher.find()) {
            try {
                float value = parseNumber(matcher.group());
                if (!occurrences.contains(value)) {
                    occurrences.add(value);
                }
            } catch (NumberFormatException ignored) {
                // The matched text is not a number (the matcher may come from any
                // pattern); skipping it is the intended best-effort behaviour.
            }
        }
        return occurrences;
    }

    /**
     * Removes all whitespace from the string and converts it to lower case.
     *
     * <p>{@link Locale#ROOT} is used so that the result does not depend on the
     * default locale of the device.
     *
     * @param str the string to normalise
     * @return the normalised string
     */
    public static String replaceIrrelevantCharacters(String str) {
        return str.replaceAll("\\s+", "").toLowerCase(Locale.ROOT);
    }

    /**
     * Returns the part of {@code str2} that starts where it first differs from
     * {@code str1}.
     *
     * @param str1 the reference string, may be null
     * @param str2 the string whose remainder is returned, may be null
     * @return {@code str2} if {@code str1} is null, {@code str1} if {@code str2} is
     *         null, an empty string if no difference is found, otherwise the
     *         substring of {@code str2} starting at the first differing index
     */
    public static String difference(String str1, String str2) {
        if (str1 == null) {
            return str2;
        }
        if (str2 == null) {
            return str1;
        }
        int at = indexOfDifference(str1, str2);
        if (at == -1) {
            return "";
        }
        return str2.substring(at);
    }

    /**
     * Finds the first index at which the two strings differ.
     *
     * @param str1 the first string, may be null
     * @param str2 the second string, may be null
     * @return -1 if both are the same reference (including both null) or have equal
     *         content, 0 if exactly one of them is null, otherwise the index of the
     *         first differing character (the length of the shorter string when one
     *         is a prefix of the other)
     */
    public static int indexOfDifference(String str1, String str2) {
        // Identity check on purpose: a cheap shortcut that also covers the
        // both-null case. Equal content is detected by the loop below.
        if (str1 == str2) {
            return -1;
        }
        if (str1 == null || str2 == null) {
            return 0;
        }
        int i;
        for (i = 0; i < str1.length() && i < str2.length(); ++i) {
            if (str1.charAt(i) != str2.charAt(i)) {
                break;
            }
        }
        if (i < str2.length() || i < str1.length()) {
            return i;
        }
        return -1;
    }

    /** Parses a number that may use either '.' or ',' as its decimal separator. */
    private static float parseNumber(String number) {
        return Float.parseFloat(number.replace(',', '.'));
    }
}