refactor(chapter): Improve chapter recognition

This commit is contained in:
stevenyomi 2024-08-16 08:11:15 +07:00 committed by Ahmad Ansori Palembani
parent 842ca9ec4a
commit 1cd40907ef
Signed by: null2264
GPG key ID: BA64F8B60AF3EFB6
2 changed files with 29 additions and 56 deletions

View file

@ -17,7 +17,7 @@ plugins {
alias(libs.plugins.google.services) apply false alias(libs.plugins.google.services) apply false
} }
if (gradle.startParameter.taskRequests.toString().contains("Standard")) { if (gradle.startParameter.taskRequests.toString().contains("standard", true)) {
apply<CrashlyticsPlugin>() apply<CrashlyticsPlugin>()
apply<GoogleServicesPlugin>() apply<GoogleServicesPlugin>()
} }

View file

@ -2,41 +2,36 @@ package eu.kanade.tachiyomi.util.chapter
import eu.kanade.tachiyomi.source.model.SChapter import eu.kanade.tachiyomi.source.model.SChapter
import eu.kanade.tachiyomi.source.model.SManga import eu.kanade.tachiyomi.source.model.SManga
import eu.kanade.tachiyomi.source.models.originalTitle
/** /**
* -R> = regex conversion. * -R> = regex conversion.
*/ */
object ChapterRecognition { object ChapterRecognition {
private const val NUMBER_PATTERN = """([0-9]+)(\.[0-9]+)?(\.?[a-z]+)?"""
/** /**
* All cases with Ch.xx * All cases with Ch.xx
* Mokushiroku Alice Vol.1 Ch. 4: Misrepresentation -R> 4 * Mokushiroku Alice Vol.1 Ch. 4: Misrepresentation -R> 4
*/ */
private val basic = Regex("""(?<=ch\.) *([0-9]+)(\.[0-9]+)?(\.?[a-z]+)?""") private val basic = Regex("""(?<=ch\.) *$NUMBER_PATTERN""")
/** /**
* Regex used when only one number occurrence
* Example: Bleach 567: Down With Snowwhite -R> 567 * Example: Bleach 567: Down With Snowwhite -R> 567
*/ */
private val occurrence = Regex("""([0-9]+)(\.[0-9]+)?(\.?[a-z]+)?""") private val number = Regex(NUMBER_PATTERN)
/**
* Regex used when manga title removed
* Example: Solanin 028 Vol. 2 -> 028 Vol.2 -> 028Vol.2 -R> 028
*/
private val withoutManga = Regex("""^([0-9]+)(\.[0-9]+)?(\.?[a-z]+)?""")
/** /**
* Regex used to remove unwanted tags * Regex used to remove unwanted tags
* Example Prison School 12 v.1 vol004 version1243 volume64 -R> Prison School 12 * Example Prison School 12 v.1 vol004 version1243 volume64 -R> Prison School 12
*/ */
private val unwanted = Regex("""(?<![a-z])(v|ver|vol|version|volume|season|s).?[0-9]+""") private val unwanted = Regex("""\b(?:v|ver|vol|version|volume|season|s)[^a-z]?[0-9]+""")
/** /**
* Regex used to remove unwanted whitespace * Regex used to remove unwanted whitespace
* Example One Piece 12 special -R> One Piece 12special * Example One Piece 12 special -R> One Piece 12special
*/ */
private val unwantedWhiteSpace = Regex("""(\s)(extra|special|omake)""") private val unwantedWhiteSpace = Regex("""\s(?=extra|special|omake)""")
fun parseChapterNumber(chapter: SChapter, manga: SManga) { fun parseChapterNumber(chapter: SChapter, manga: SManga) {
// If chapter number is known return. // If chapter number is known return.
@ -47,66 +42,44 @@ object ChapterRecognition {
// Get chapter title with lower case // Get chapter title with lower case
var name = chapter.name.lowercase() var name = chapter.name.lowercase()
// Remove manga title from chapter title.
name = name.replace(manga.title.lowercase(), "").trim()
// Remove comma's or hyphens. // Remove comma's or hyphens.
name = name.replace(',', '.').replace('-', '.') name = name.replace(',', '.').replace('-', '.')
// Remove unwanted white spaces. // Remove unwanted white spaces.
unwantedWhiteSpace.findAll(name).let { name = unwantedWhiteSpace.replace(name, "")
it.forEach { occurrence -> name = name.replace(occurrence.value, occurrence.value.trim()) }
}
// Remove unwanted tags. // Remove unwanted tags.
unwanted.findAll(name).let { name = unwanted.replace(name, "")
it.forEach { occurrence -> name = name.replace(occurrence.value, "") }
}
// Check base case ch.xx basic.find(name)?.let {
if (updateChapter(basic.find(name), chapter)) { chapter.chapter_number = getChapterNumberFromMatch(it)
return return
} }
// Check one number occurrence. number.find(name)?.let {
val occurrences: MutableList<MatchResult> = arrayListOf() chapter.chapter_number = getChapterNumberFromMatch(it)
occurrence.findAll(name).let {
it.forEach { occurrence -> occurrences.add(occurrence) }
}
if (occurrences.size == 1) {
if (updateChapter(occurrences[0], chapter)) {
return
}
}
// Remove manga title from chapter title.
val nameWithoutManga = name.replace(manga.originalTitle.lowercase(), "").trim()
// Check if first value is number after title remove.
if (updateChapter(withoutManga.find(nameWithoutManga), chapter)) {
return return
} }
// Take the first number encountered. // if (chapter.chapter_number == null) chapter.chapter_number = -1f
if (updateChapter(occurrence.find(nameWithoutManga), chapter)) {
return
}
} }
/**
 * Converts a match of one of the chapter-number patterns into a chapter number.
 *
 * The match is expected to expose three groups: group 1 is the integer part,
 * group 2 the optional decimal part (e.g. ".5") and group 3 the optional
 * alphabetic suffix (e.g. "a" or ".extra"). Groups 2 and 3 are handed to
 * checkForDecimal, whose result is added to the integer part.
 *
 * @param match result of regex
 * @return the integer part of the chapter number plus the fractional addition
 * @throws IllegalArgumentException if the match has no value for group 1
 */
private fun getChapterNumberFromMatch(match: MatchResult): Float {
    // Group 1 is mandatory in the number pattern, so a missing value means the
    // match came from a regex this function was not written for.
    val initial = requireNotNull(match.groups[1]) { "match has no chapter number group" }
        .value
        .toFloat()
    val subChapterDecimal = match.groups[2]?.value
    val subChapterAlpha = match.groups[3]?.value
    return initial + checkForDecimal(subChapterDecimal, subChapterAlpha)
}
/** /**
@ -133,11 +106,9 @@ object ChapterRecognition {
return .97f return .97f
} }
return if (alpha[0] == '.') { val trimmedAlpha = alpha.trimStart('.')
// Take value after (.) if (trimmedAlpha.length == 1) {
parseAlphaPostFix(alpha[1]) return parseAlphaPostFix(trimmedAlpha[0])
} else {
parseAlphaPostFix(alpha[0])
} }
} }
@ -148,6 +119,8 @@ object ChapterRecognition {
* x.a -> x.1, x.b -> x.2, etc * x.a -> x.1, x.b -> x.2, etc
*/ */
private fun parseAlphaPostFix(alpha: Char): Float {
    // Position of the letter in the alphabet: 'a' -> 1, 'b' -> 2, ... 'i' -> 9.
    val number = alpha - 'a' + 1
    // Only a..i fit into a single decimal digit (x.1 .. x.9). Later letters would
    // wrap around or exceed one digit, and characters below 'a' would produce a
    // negative fraction, so all of those contribute nothing.
    if (number !in 1..9) return 0f
    return number / 10f
}
} }