mirror of
https://github.com/mitb-archive/filebot
synced 2024-11-02 08:25:02 -04:00
* make sure longest OR expressions is captured
This commit is contained in:
parent
8a885ff1fe
commit
af8e8c185a
@ -229,21 +229,19 @@ public class ReleaseInfo {
|
||||
folders.add(it);
|
||||
}
|
||||
}
|
||||
structureRootFolderPattern = compile(join(folders, "|"), CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
structureRootFolderPattern = compile(or(folders.toArray()), CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
}
|
||||
return structureRootFolderPattern;
|
||||
}
|
||||
|
||||
public Pattern getLanguageTagPattern(Collection<String> languages) {
|
||||
// [en]
|
||||
return compile("(?<=[-\\[{(])(" + join(quoteAll(languages), "|") + ")(?=\\p{Punct})", CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
return compile("(?<=[-\\[{(])" + or(quoteAll(languages)) + "(?=\\p{Punct})", CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
}
|
||||
|
||||
public Pattern getLanguageSuffixPattern(Collection<String> languages, boolean strict) {
|
||||
// e.g. ".en.srt" or ".en.forced.srt"
|
||||
String language = join(quoteAll(languages), "|");
|
||||
String tag = getProperty("pattern.subtitle.tags");
|
||||
return compile("(?<=[.-])(" + language + ")(?=([.-](" + tag + "))?$)", strict ? 0 : CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
return compile("(?<=[.-])" + or(quoteAll(languages)) + "(?=([.-](" + getProperty("pattern.subtitle.tags") + "))?$)", strict ? 0 : CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
}
|
||||
|
||||
public Pattern getResolutionPattern() {
|
||||
@ -277,21 +275,21 @@ public class ReleaseInfo {
|
||||
|
||||
public Pattern getReleaseGroupPattern(boolean strict) throws IOException {
|
||||
// pattern matching any release group name enclosed in separators
|
||||
return compile("(?<!\\p{Alnum})(" + join(releaseGroupResource.get(), "|") + ")(?!\\p{Alnum}|[^\\p{Alnum}](19|20)\\d{2})", strict ? 0 : CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
return compile("(?<!\\p{Alnum})" + or(releaseGroupResource.get()) + "(?!\\p{Alnum}|[^\\p{Alnum}](19|20)\\d{2})", strict ? 0 : CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
}
|
||||
|
||||
public Pattern getBlacklistPattern() throws IOException {
|
||||
// pattern matching any release group name enclosed in separators
|
||||
return compile("(?<!\\p{Alnum})(" + join(queryBlacklistResource.get(), "|") + ")(?!\\p{Alnum})", CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
return compile("(?<!\\p{Alnum})" + or(queryBlacklistResource.get()) + "(?!\\p{Alnum})", CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
}
|
||||
|
||||
public Pattern getExcludePattern() throws IOException {
|
||||
// pattern matching any release group name enclosed in separators
|
||||
return compile(join(excludeBlacklistResource.get(), "|"), CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
return compile(or(excludeBlacklistResource.get()), CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
}
|
||||
|
||||
public Pattern getCustomRemovePattern(Collection<String> terms) throws IOException {
|
||||
return compile("(?<!\\p{Alnum})(" + join(quoteAll(terms), "|") + ")(?!\\p{Alnum})", CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
return compile("(?<!\\p{Alnum})" + or(quoteAll(terms)) + "(?!\\p{Alnum})", CASE_INSENSITIVE | UNICODE_CHARACTER_CLASS);
|
||||
}
|
||||
|
||||
public Movie[] getMovieList() throws IOException {
|
||||
@ -515,12 +513,12 @@ public class ReleaseInfo {
|
||||
}
|
||||
}
|
||||
|
||||
private Collection<String> quoteAll(Collection<String> strings) {
|
||||
List<String> patterns = new ArrayList<String>(strings.size());
|
||||
for (String it : strings) {
|
||||
patterns.add(Pattern.quote(it));
|
||||
}
|
||||
return patterns;
|
||||
private String or(Object[] terms) {
|
||||
return joinSorted(terms, "|", reverseOrder(), "(", ")"); // non-capturing group that matches the longest occurrence
|
||||
}
|
||||
|
||||
private String[] quoteAll(Collection<String> values) {
|
||||
return values.stream().map((s) -> Pattern.quote(s)).toArray(String[]::new);
|
||||
}
|
||||
|
||||
public Map<String, Locale> getLanguageMap(Locale... supportedDisplayLocale) {
|
||||
|
@ -2,6 +2,8 @@ package net.filebot.util;
|
||||
|
||||
import static java.util.Arrays.*;
|
||||
|
||||
import java.util.Arrays;
|
||||
import java.util.Comparator;
|
||||
import java.util.Iterator;
|
||||
|
||||
public final class StringUtilities {
|
||||
@ -10,33 +12,32 @@ public final class StringUtilities {
|
||||
return object == null ? null : object.toString();
|
||||
}
|
||||
|
||||
public static boolean isEmptyValue(Object object) {
|
||||
public static boolean isEmpty(Object object) {
|
||||
return object == null || object.toString().length() == 0;
|
||||
}
|
||||
|
||||
public static String joinBy(CharSequence delimiter, Object... values) {
|
||||
return join(asList(values), delimiter);
|
||||
}
|
||||
|
||||
public static String join(Object[] values, CharSequence delimiter) {
|
||||
return join(asList(values), delimiter);
|
||||
return join(asList(values), delimiter, "", "");
|
||||
}
|
||||
|
||||
public static String join(Iterable<?> values, CharSequence delimiter) {
|
||||
StringBuilder sb = new StringBuilder();
|
||||
public static String joinSorted(Object[] values, CharSequence delimiter, Comparator<Object> sort, CharSequence start, CharSequence end) {
|
||||
return join(Arrays.stream(values).sorted(sort)::iterator, delimiter, start, end);
|
||||
}
|
||||
|
||||
public static String join(Iterable<?> values, CharSequence delimiter, CharSequence start, CharSequence end) {
|
||||
StringBuilder sb = new StringBuilder().append(start);
|
||||
|
||||
for (Iterator<?> iterator = values.iterator(); iterator.hasNext();) {
|
||||
Object value = iterator.next();
|
||||
if (!isEmptyValue(value)) {
|
||||
if (!isEmpty(value)) {
|
||||
if (sb.length() > 0) {
|
||||
sb.append(delimiter);
|
||||
}
|
||||
|
||||
sb.append(value);
|
||||
}
|
||||
}
|
||||
|
||||
return sb.toString();
|
||||
return sb.append(end).toString();
|
||||
}
|
||||
|
||||
/**
|
||||
|
Loading…
Reference in New Issue
Block a user