filebot/source/net/filebot/format/ExpressionFormatMethods.java

package net.filebot.format;

import static java.util.regex.Pattern.*;

import java.io.File;
import java.util.ArrayList;
import java.util.List;
import java.util.regex.Matcher;

import net.filebot.util.FileUtilities;

import com.ibm.icu.text.Transliterator;

public class ExpressionFormatMethods {

	/**
	 * Convenience shortcut for String.toLowerCase() (the upper-case counterpart is upper).
	 * 
	 * The no-argument String.toLowerCase() is used, so the casing rules of the default locale apply.
	 */
	public static String lower(String self) {
		String lowered = self.toLowerCase();
		return lowered;
	}

	/**
	 * Convenience shortcut for String.toUpperCase().
	 * 
	 * The no-argument String.toUpperCase() is used, so the casing rules of the default locale apply.
	 */
	public static String upper(String self) {
		String raised = self.toUpperCase();
		return raised;
	}

	/**
	 * Pad strings or numbers with given characters ('0' by default).
	 * 
	 * The padding is prepended as a whole unit until the value is at least {@code length} characters long, so a padding of more than one character may overshoot the requested length.
	 * 
	 * e.g. "1" -> "01"
	 * 
	 * @param self
	 *            value to pad
	 * @param length
	 *            minimum length of the result
	 * @param padding
	 *            text to prepend; an empty padding leaves the value unchanged
	 * @return the padded value, or the value itself if it is already long enough
	 */
	public static String pad(String self, int length, String padding) {
		// an empty padding can never make the value any longer, so bail out instead of looping forever
		if ("".equals(padding)) {
			return self;
		}

		StringBuilder prefix = new StringBuilder();
		while (prefix.length() + self.length() < length) {
			prefix.append(padding);
		}
		return prefix.append(self).toString();
	}

	/**
	 * Pad the given value with leading '0' characters.
	 */
	public static String pad(String self, int length) {
		return pad(self, length, "0");
	}

	/**
	 * Pad the string representation of the given number with leading '0' characters.
	 */
	public static String pad(Number self, int length) {
		return pad(self.toString(), length, "0");
	}

	/**
	 * Return a substring matching the given pattern or break.
	 * 
	 * Matching is case-insensitive. If the pattern declares capturing groups, the first group that took part in the match is returned, otherwise the entire match.
	 * 
	 * @throws IllegalArgumentException
	 *             if the pattern is not found
	 */
	public static String match(String self, String pattern) {
		return match(self, pattern, -1);
	}

	/**
	 * Return the given capturing group of the first match of the given pattern or break.
	 * 
	 * @param matchGroup
	 *            index of the capturing group to return (0 for the entire match); a negative value selects the first capturing group that took part in the match, or the entire match if there is none
	 * @return the trimmed group value
	 * @throws IllegalArgumentException
	 *             if the pattern is not found, or if the explicitly requested group did not take part in the match
	 */
	public static String match(String self, String pattern, int matchGroup) {
		Matcher matcher = compile(pattern, CASE_INSENSITIVE | UNICODE_CASE | MULTILINE).matcher(self);
		if (!matcher.find()) {
			throw new IllegalArgumentException("Pattern not found");
		}

		if (matchGroup >= 0) {
			// Matcher.group(int) yields null for a group that did not take part in the match
			String group = matcher.group(matchGroup);
			if (group == null) {
				throw new IllegalArgumentException("Pattern group " + matchGroup + " not found");
			}
			return group.trim();
		}

		// default: prefer the first capturing group that actually matched something
		for (int i = 1; i <= matcher.groupCount(); i++) {
			String group = matcher.group(i);
			if (group != null) {
				return group.trim();
			}
		}

		// no (participating) capturing group, fall back to the entire match
		return matcher.group().trim();
	}

	/**
	 * Return a list of all matching patterns or break.
	 * 
	 * Matching is case-insensitive and each entry is the trimmed entire match.
	 * 
	 * @throws IllegalArgumentException
	 *             if the pattern is not found
	 */
	public static List<String> matchAll(String self, String pattern) {
		return matchAll(self, pattern, 0);
	}

	/**
	 * Return the given capturing group of every match of the given pattern or break.
	 * 
	 * @param matchGroup
	 *            index of the capturing group to collect (0 for the entire match)
	 * @return the trimmed group values in order of occurrence; matches in which the group did not take part are skipped
	 * @throws IllegalArgumentException
	 *             if no value could be collected
	 */
	public static List<String> matchAll(String self, String pattern, int matchGroup) {
		List<String> matches = new ArrayList<String>();
		Matcher matcher = compile(pattern, CASE_INSENSITIVE | UNICODE_CASE | MULTILINE).matcher(self);
		while (matcher.find()) {
			// Matcher.group(int) yields null for an optional group that did not take part in this particular match
			String group = matcher.group(matchGroup);
			if (group != null) {
				matches.add(group.trim());
			}
		}

		if (matches.isEmpty()) {
			throw new IllegalArgumentException("Pattern not found");
		}
		return matches;
	}

	/**
	 * Remove every match of the given regular expression, i.e. replace it with the empty string.
	 * 
	 * Unlike removeAll, the pattern is compiled without any flags and the result is not trimmed.
	 */
	public static String replaceAll(String self, String pattern) {
		return compile(pattern).matcher(self).replaceAll("");
	}

	/**
	 * Remove every case-insensitive match of the given pattern and trim the remainder.
	 */
	public static String removeAll(String self, String pattern) {
		Matcher matcher = compile(pattern, CASE_INSENSITIVE | UNICODE_CASE | MULTILINE).matcher(self);
		String remainder = matcher.replaceAll("");
		return remainder.trim();
	}

	/**
	 * Replace space characters with a given characters.
	 * 
	 * The characters ':', '?', '.' and '_' are treated like spaces, leading and trailing spaces are dropped, and each remaining run of whitespace is replaced with the given replacement.
	 * 
	 * e.g. "Doctor Who" -> "Doctor_Who"
	 * 
	 * @param replacement
	 *            text to insert literally in place of each run of whitespace
	 */
	public static String space(String self, String replacement) {
		String spaced = self.replaceAll("[:?._]", " ").trim();

		// quote the replacement so that '$' and '\' are inserted as-is instead of being parsed as group references / escapes
		return spaced.replaceAll("\\s+", Matcher.quoteReplacement(replacement));
	}

	/**
	 * Upper-case all initials.
	 * 
	 * An initial is a letter a-z at the very beginning of the value or directly after one of the separator characters listed in the pattern below.
	 * 
	 * e.g. "The Day a new Demon was born" -> "The Day A New Demon Was Born"
	 */
	public static String upperInitial(String self) {
		// NOTE: inside the character class ",-;" is a range from ',' to ';', so '/', ':' and the digits 0-9 count as separators as well
		Matcher initial = compile("(?<=[&()+.,-;<=>?\\[\\]_{|}~ ]|^)[a-z]").matcher(self);

		StringBuilder result = new StringBuilder(self.length());
		int tail = 0;
		while (initial.find()) {
			// copy everything since the previous initial, then the upper-cased initial itself
			result.append(self, tail, initial.start());
			result.append(initial.group().toUpperCase());
			tail = initial.end();
		}
		result.append(self, tail, self.length());

		return result.toString();
	}

	/**
	 * Move a leading article ("The", "A" or "An", in any case) behind the rest of the name.
	 * 
	 * e.g. "The Walking Dead" -> "Walking Dead, The"
	 */
	public static String sortName(String self) {
		return sortName(self, "$2, $1");
	}

	/**
	 * Rewrite a name that starts with an article ("The", "A" or "An", in any case) using the given replacement.
	 * 
	 * @param replacement
	 *            regex replacement template; $1 refers to the article and $2 to the rest of the name
	 * @return the trimmed result; names without a leading article are only trimmed
	 */
	public static String sortName(String self, String replacement) {
		Matcher article = compile("^(The|A|An)\\s(.+)", CASE_INSENSITIVE).matcher(self);
		String rearranged = article.replaceFirst(replacement);
		return rearranged.trim();
	}

	/**
	 * Get acronym, i.e. first letter of each word.
	 * 
	 * A leading article is dropped first (see sortName), then every letter or digit at the beginning of the name or directly after one of the separator characters listed in the pattern below is collected and upper-cased.
	 * 
	 * e.g. "Deep Space 9" -> "DS9"
	 */
	public static String acronym(String self) {
		StringBuilder initials = new StringBuilder();

		// NOTE: inside the character class ",-;" is a range from ',' to ';', so '/', ':' and the digits 0-9 count as separators as well
		Matcher initial = compile("(?<=[&()+.,-;<=>?\\[\\]_{|}~ ]|^)[\\p{Alnum}]").matcher(sortName(self, "$2"));
		while (initial.find()) {
			String character = initial.group();
			initials.append(character.toUpperCase());
		}

		return initials.toString();
	}

	/**
	 * Lower-case all letters that are not initials.
	 * 
	 * Only words that consist of two or more letters are touched; the first letter of each such word is kept as it is.
	 * 
	 * e.g. "Gundam SEED" -> "Gundam Seed"
	 */
	public static String lowerTrail(String self) {
		Matcher word = compile("\\b(\\p{Alpha})(\\p{Alpha}+)\\b").matcher(self);

		StringBuilder result = new StringBuilder(self.length());
		int tail = 0;
		while (word.find()) {
			// copy everything since the previous word, then the untouched initial followed by the lower-cased rest
			result.append(self, tail, word.start());
			result.append(word.group(1));
			result.append(word.group(2).toLowerCase());
			tail = word.end();
		}
		result.append(self, tail, self.length());

		return result.toString();
	}

	/**
	 * Return substring before the given pattern.
	 * 
	 * @return the trimmed text in front of the first case-insensitive match, or the original value if the pattern is not found
	 */
	public static String before(String self, String pattern) {
		Matcher matcher = compile(pattern, CASE_INSENSITIVE | UNICODE_CASE).matcher(self);

		// pattern was not found, keep the original value
		if (!matcher.find()) {
			return self;
		}

		String head = self.substring(0, matcher.start());
		return head.trim();
	}

	/**
	 * Return substring after the given pattern.
	 * 
	 * @return the trimmed text behind the first case-insensitive match, or the original value if the pattern is not found
	 */
	public static String after(String self, String pattern) {
		Matcher matcher = compile(pattern, CASE_INSENSITIVE | UNICODE_CASE).matcher(self);

		// pattern was not found, keep the original value
		if (!matcher.find()) {
			return self;
		}

		String rest = self.substring(matcher.end());
		return rest.trim();
	}

	/**
	 * Remove trailing parenthesis including any leading whitespace.
	 * 
	 * e.g. "The IT Crowd (UK)" -> "The IT Crowd"
	 */
	public static String replaceTrailingBrackets(String self) {
		return replaceTrailingBrackets(self, "");
	}

	/**
	 * Replace trailing parenthesis including any leading whitespace.
	 * 
	 * @param replacement
	 *            regex replacement template; $1 refers to the text between the parenthesis
	 * @return the trimmed result
	 */
	public static String replaceTrailingBrackets(String self, String replacement) {
		Matcher trailing = compile("\\s*[(]([^)]*)[)]$").matcher(self);
		String replaced = trailing.replaceAll(replacement);
		return replaced.trim();
	}

	/**
	 * Remove 'part identifier'.
	 * 
	 * e.g. "Today Is the Day: Part 1" -> "Today Is the Day" or "Today Is the Day (1)" -> "Today Is the Day"
	 */
	public static String replacePart(String self) {
		return replacePart(self, "");
	}

	/**
	 * Replace 'part identifier'.
	 * 
	 * e.g. with the replacement ", Part $1": "Today Is the Day: Part 1" -> "Today Is the Day, Part 1" or "Today Is the Day (1)" -> "Today Is the Day, Part 1"
	 * 
	 * @param replacement
	 *            regex replacement template; $1 refers to the part number
	 * @return the trimmed result, or the original value if no part identifier is found
	 */
	public static String replacePart(String self, String replacement) {
		// syntaxes are tried in this order: '(n)' first, then '(Part n)' and ': Part n'
		String[] syntaxes = { "\\s*[(](\\w+)[)]$", "\\W+Part (\\w+)\\W*$" };

		for (int i = 0; i < syntaxes.length; i++) {
			Matcher part = compile(syntaxes[i], CASE_INSENSITIVE).matcher(self);
			if (!part.find()) {
				continue;
			}

			// only the first syntax that matches is applied
			String replaced = part.replaceAll(replacement);
			return replaced.trim();
		}

		// no pattern matches, nothing to replace
		return self;
	}

	/**
	 * Apply ICU transliteration
	 * 
	 * @param transformIdentifier
	 *            identifier passed to Transliterator.getInstance
	 * @see http://userguide.icu-project.org/transforms/general
	 */
	public static String transliterate(String self, String transformIdentifier) {
		Transliterator transliterator = Transliterator.getInstance(transformIdentifier);
		return transliterator.transform(self);
	}

	/**
	 * Convert Unicode to ASCII as best as possible. Works with most alphabets/scripts used in the world.
	 * 
	 * Anything that is still not ASCII after transliteration is replaced with a single space.
	 * 
	 * e.g. "Österreich" -> "Osterreich" "カタカナ" -> "katakana"
	 */
	public static String ascii(String self) {
		return ascii(self, " ");
	}

	/**
	 * Convert Unicode to ASCII as best as possible.
	 * 
	 * @param fallback
	 *            regex replacement used for each run of characters that is still not ASCII after transliteration
	 * @return the trimmed result
	 */
	public static String ascii(String self, String fallback) {
		Transliterator toAscii = Transliterator.getInstance("Any-Latin;Latin-ASCII;[:Diacritic:]remove");
		String latin = toAscii.transform(self);

		// whatever could not be transliterated is substituted by the fallback
		return latin.replaceAll("[^\\p{ASCII}]+", fallback).trim();
	}

	/**
	 * Replace multiple replacement pairs
	 * 
	 * The pairs are applied one after another as literal (non-regex) replacements, so a later pair also sees the output of the earlier ones.
	 * 
	 * e.g. replace('ä', 'ae', 'ö', 'oe', 'ü', 'ue')
	 */
	public static String replace(String self, String tr0, String tr1, String... tr) {
		// the first pair is mandatory
		String result = self.replace(tr0, tr1);

		// the remaining arguments are consumed pairwise, a trailing argument without a partner is ignored
		int pairs = tr.length / 2;
		for (int pair = 0; pair < pairs; pair++) {
			String target = tr[2 * pair];
			String substitute = tr[2 * pair + 1];
			result = result.replace(target, substitute);
		}

		return result;
	}

	/**
	 * File utilities
	 * 
	 * Return the first element of FileUtilities.listPath for the given file (presumably the root of the path; verify against FileUtilities.listPath).
	 */
	public static File getRoot(File self) {
		List<File> path = FileUtilities.listPath(self);
		return path.get(0);
	}

	/**
	 * Delegate to FileUtilities.listPath for the given file.
	 */
	public static List<File> listPath(File self) {
		List<File> path = FileUtilities.listPath(self);
		return path;
	}

	/**
	 * Delegate to FileUtilities.listPath for the relative path tail of the given file.
	 * 
	 * @param tailSize
	 *            passed on to FileUtilities.getRelativePathTail
	 */
	public static List<File> listPath(File self, int tailSize) {
		File tail = FileUtilities.getRelativePathTail(self, tailSize);
		return FileUtilities.listPath(tail);
	}

	/**
	 * Delegate to FileUtilities.getRelativePathTail for the given file.
	 * 
	 * @param tailSize
	 *            passed on to FileUtilities.getRelativePathTail
	 */
	public static File getRelativePathTail(File self, int tailSize) {
		File tail = FileUtilities.getRelativePathTail(self, tailSize);
		return tail;
	}

	/**
	 * Return the usable space reported for the given file or one of the other elements of its path.
	 * 
	 * The path elements returned by FileUtilities.listPath are checked from the last one to the first one, and the first positive File.getUsableSpace() value of an existing element wins.
	 * 
	 * @return usable space in bytes, or 0 if no existing path element reports any usable space
	 */
	public static long getDiskSpace(File self) {
		List<File> path = FileUtilities.listPath(self);

		int index = path.size();
		while (--index >= 0) {
			File candidate = path.get(index);

			// elements that do not exist cannot report any usable space
			if (!candidate.exists()) {
				continue;
			}

			long usable = candidate.getUsableSpace();
			if (usable > 0) {
				return usable;
			}
		}

		return 0;
	}

}
* fix package and import declarations 2014-04-19 02:30:29 -04:00			`package net.filebot.format;`
* inject methods using the Groovy Extension Module system (and slowly phase out the *.lib.groovy code) 2014-04-13 15:37:11 -04:00
* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00			`import static java.util.regex.Pattern.*;`

			`import java.io.File;`
			`import java.util.ArrayList;`
			`import java.util.List;`
			`import java.util.regex.Matcher;`

* fix package and import declarations 2014-04-19 02:30:29 -04:00			`import net.filebot.util.FileUtilities;`
* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00
			`import com.ibm.icu.text.Transliterator;`

* inject methods using the Groovy Extension Module system (and slowly phase out the *.lib.groovy code) 2014-04-13 15:37:11 -04:00			`public class ExpressionFormatMethods {`

* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00			`/**`
			`* Convenience methods for String.toLowerCase() and String.toUpperCase()`
			`*/`
* inject methods using the Groovy Extension Module system (and slowly phase out the *.lib.groovy code) 2014-04-13 15:37:11 -04:00			`public static String lower(String self) {`
			`return self.toLowerCase();`
			`}`

			`public static String upper(String self) {`
			`return self.toUpperCase();`
			`}`

* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00			`/**`
			`* Pad strings or numbers with given characters ('0' by default).`
			`*`
			`* e.g. "1" -> "01"`
			`*/`
* inject methods using the Groovy Extension Module system (and slowly phase out the *.lib.groovy code) 2014-04-13 15:37:11 -04:00			`public static String pad(String self, int length, String padding) {`
			`while (self.length() < length) {`
			`self = padding + self;`
			`}`
			`return self;`
			`}`

			`public static String pad(String self, int length) {`
			`return pad(self, length, "0");`
			`}`

			`public static String pad(Number self, int length) {`
* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00			`return pad(self.toString(), length, "0");`
			`}`

			`/**`
			`* Return a substring matching the given pattern or break.`
			`*/`
			`public static String match(String self, String pattern) {`
			`return match(self, pattern, -1);`
			`}`

			`public static String match(String self, String pattern, int matchGroup) {`
			`Matcher matcher = compile(pattern, CASE_INSENSITIVE \| UNICODE_CASE \| MULTILINE).matcher(self);`
			`if (matcher.find()) {`
			`return (matcher.groupCount() > 0 && matchGroup < 0 ? matcher.group(1) : matcher.group(matchGroup < 0 ? 0 : matchGroup)).trim();`
			`} else {`
			`throw new IllegalArgumentException("Pattern not found");`
			`}`
			`}`

			`/**`
			`* Return a list of all matching patterns or break.`
			`*/`
			`public static List<String> matchAll(String self, String pattern) {`
			`return matchAll(self, pattern, 0);`
			`}`

			`public static List<String> matchAll(String self, String pattern, int matchGroup) {`
			`List<String> matches = new ArrayList<String>();`
			`Matcher matcher = compile(pattern, CASE_INSENSITIVE \| UNICODE_CASE \| MULTILINE).matcher(self);`
			`while (matcher.find()) {`
			`matches.add(matcher.group(matchGroup).trim());`
			`}`

			`if (matches.size() > 0) {`
			`return matches;`
			`} else {`
			`throw new IllegalArgumentException("Pattern not found");`
			`}`
			`}`

* compatibility fixes 2014-04-19 01:55:23 -04:00			`public static String replaceAll(String self, String pattern) {`
			`return self.replaceAll(pattern, "");`
			`}`

* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00			`public static String removeAll(String self, String pattern) {`
			`return compile(pattern, CASE_INSENSITIVE \| UNICODE_CASE \| MULTILINE).matcher(self).replaceAll("").trim();`
			`}`

			`/**`
			`* Replace space characters with a given characters.`
			`*`
			`* e.g. "Doctor Who" -> "Doctor_Who"`
			`*/`
			`public static String space(String self, String replacement) {`
			`return self.replaceAll("[:?._]", " ").trim().replaceAll("\\s+", replacement);`
* inject methods using the Groovy Extension Module system (and slowly phase out the *.lib.groovy code) 2014-04-13 15:37:11 -04:00			`}`
* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00
			`/**`
			`* Upper-case all initials.`
			`*`
			`* e.g. "The Day a new Demon was born" -> "The Day A New Demon Was Born"`
			`*/`
			`public static String upperInitial(String self) {`
			`Matcher matcher = compile("(?<=[&()+.,-;<=>?\\[\\]_{\|}~ ]\|^)[a-z]").matcher(self);`

			`StringBuffer buffer = new StringBuffer();`
			`while (matcher.find()) {`
			`matcher.appendReplacement(buffer, matcher.group().toUpperCase());`
			`}`
			`matcher.appendTail(buffer);`

			`return buffer.toString();`
			`}`

			`public static String sortName(String self) {`
			`return sortName(self, "$2, $1");`
			`}`

			`public static String sortName(String self, String replacement) {`
			`return compile("^(The\|A\|An)\\s(.+)", CASE_INSENSITIVE).matcher(self).replaceFirst(replacement).trim();`
			`}`

			`/**`
			`* Get acronym, i.e. first letter of each word.`
			`*`
			`* e.g. "Deep Space 9" -> "DS9"`
			`*/`
			`public static String acronym(String self) {`
			`String name = sortName(self, "$2");`
			`Matcher matcher = compile("(?<=[&()+.,-;<=>?\\[\\]_{\|}~ ]\|^)[\\p{Alnum}]").matcher(name);`

			`StringBuilder buffer = new StringBuilder();`
			`while (matcher.find()) {`
			`buffer.append(matcher.group().toUpperCase());`
			`}`

			`return buffer.toString();`
			`}`

			`/**`
			`* Lower-case all letters that are not initials.`
			`*`
			`* e.g. "Gundam SEED" -> "Gundam Seed"`
			`*/`
			`public static String lowerTrail(String self) {`
			`Matcher matcher = compile("\\b(\\p{Alpha})(\\p{Alpha}+)\\b").matcher(self);`

			`StringBuffer buffer = new StringBuffer();`
			`while (matcher.find()) {`
			`matcher.appendReplacement(buffer, matcher.group(1) + matcher.group(2).toLowerCase());`
			`}`
			`matcher.appendTail(buffer);`

			`return buffer.toString();`
			`}`

			`/**`
			`* Return substring before the given pattern.`
			`*/`
			`public static String before(String self, String pattern) {`
			`Matcher matcher = compile(pattern, CASE_INSENSITIVE \| UNICODE_CASE).matcher(self);`

			`// pattern was found, return leading substring, else return original value`
			`return matcher.find() ? self.substring(0, matcher.start()).trim() : self;`
			`}`

			`/**`
			`* Return substring after the given pattern.`
			`*/`
			`public static String after(String self, String pattern) {`
			`Matcher matcher = compile(pattern, CASE_INSENSITIVE \| UNICODE_CASE).matcher(self);`

			`// pattern was found, return trailing substring, else return original value`
			`return matcher.find() ? self.substring(matcher.end(), self.length()).trim() : self;`
			`}`

			`/**`
			`* Replace trailing parenthesis including any leading whitespace.`
			`*`
			`* e.g. "The IT Crowd (UK)" -> "The IT Crowd"`
			`*/`
			`public static String replaceTrailingBrackets(String self) {`
			`return replaceTrailingBrackets(self, "");`
			`}`

			`public static String replaceTrailingBrackets(String self, String replacement) {`
			`return self.replaceAll("\\s*[(]([^)]*)[)]$", replacement).trim();`
			`}`

			`/**`
			`* Replace 'part identifier'.`
			`*`
			`* e.g. "Today Is the Day: Part 1" -> "Today Is the Day, Part 1" or "Today Is the Day (1)" -> "Today Is the Day, Part 1"`
			`*/`
			`public static String replacePart(String self) {`
			`return replacePart(self, "");`
			`}`

			`public static String replacePart(String self, String replacement) {`
			`// handle '(n)', '(Part n)' and ': Part n' like syntax`
			`String[] patterns = new String[] { "\\s*[(](\\w+)[)]$", "\\W+Part (\\w+)\\W*$" };`

			`for (String pattern : patterns) {`
			`Matcher matcher = compile(pattern, CASE_INSENSITIVE).matcher(self);`
			`if (matcher.find()) {`
			`return matcher.replaceAll(replacement).trim();`
			`}`
			`}`

			`// no pattern matches, nothing to replace`
			`return self;`
			`}`

			`/**`
			`* Apply ICU transliteration`
			`*`
			`* @see http://userguide.icu-project.org/transforms/general`
			`*/`
			`public static String transliterate(String self, String transformIdentifier) {`
			`return Transliterator.getInstance(transformIdentifier).transform(self);`
			`}`

			`/**`
			`* Convert Unicode to ASCII as best as possible. Works with most alphabets/scripts used in the world.`
			`*`
			`* e.g. "Österreich" -> "Osterreich" "カタカナ" -> "katakana"`
			`*/`
			`public static String ascii(String self) {`
			`return ascii(self, " ");`
			`}`

			`public static String ascii(String self, String fallback) {`
			`return Transliterator.getInstance("Any-Latin;Latin-ASCII;[:Diacritic:]remove").transform(self).replaceAll("[^\\p{ASCII}]+", fallback).trim();`
			`}`

			`/**`
			`* Replace multiple replacement pairs`
			`*`
			`* e.g. replace('ä', 'ae', 'ö', 'oe', 'ü', 'ue')`
			`*/`
			`public static String replace(String self, String tr0, String tr1, String... tr) {`
			`// the first two parameters are required, the rest of the parameter sequence is optional`
			`self = self.replace(tr0, tr1);`

			`for (int i = 0; i < tr.length - 1; i += 2) {`
			`String t = tr[i];`
			`String r = tr[i + 1];`
			`self = self.replace(t, r);`
			`}`

			`return self;`
			`}`

			`/**`
			`* File utilities`
			`*/`
			`public static File getRoot(File self) {`
			`return FileUtilities.listPath(self).get(0);`
			`}`

* temporary compatibility fix 2014-04-15 13:55:34 -04:00			`public static List<File> listPath(File self) {`
* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00			`return FileUtilities.listPath(self);`
			`}`

* temporary compatibility fix 2014-04-15 13:55:34 -04:00			`public static List<File> listPath(File self, int tailSize) {`
			`return FileUtilities.listPath(FileUtilities.getRelativePathTail(self, tailSize));`
			`}`

* finish rewrite of ExpressionFormat customizations 2014-04-15 08:23:58 -04:00			`public static File getRelativePathTail(File self, int tailSize) {`
			`return FileUtilities.getRelativePathTail(self, tailSize);`
			`}`

			`public static long getDiskSpace(File self) {`
			`List<File> list = FileUtilities.listPath(self);`
			`for (int i = list.size() - 1; i >= 0; i--) {`
			`if (list.get(i).exists()) {`
			`long usableSpace = list.get(i).getUsableSpace();`
			`if (usableSpace > 0) {`
			`return usableSpace;`
			`}`
			`}`
			`}`
			`return 0;`
			`}`

* inject methods using the Groovy Extension Module system (and slowly phase out the *.lib.groovy code) 2014-04-13 15:37:11 -04:00			`}`