mirror of
https://github.com/corda/corda.git
synced 2025-01-09 06:23:04 +00:00
e6ad10de04
Based on the just-implemented PikeVM, let's test it with a specific regular expression. At this point, no parsing is implemented but instead an explicit program executing a(bb)?a is hardcoded. Signed-off-by: Johannes Schindelin <johannes.schindelin@gmx.de>
107 lines
2.8 KiB
Java
107 lines
2.8 KiB
Java
/* Copyright (c) 2008-2013, Avian Contributors
|
|
|
|
Permission to use, copy, modify, and/or distribute this software
|
|
for any purpose with or without fee is hereby granted, provided
|
|
that the above copyright notice and this permission notice appear
|
|
in all copies.
|
|
|
|
There is NO WARRANTY for this software. See license.txt for
|
|
details. */
|
|
|
|
package regex;
|
|
|
|
import java.util.ArrayList;
|
|
import java.util.List;
|
|
|
|
/**
|
|
* This is a work in progress.
|
|
*
|
|
* @author zsombor and others
|
|
*
|
|
*/
|
|
public abstract class Pattern implements PikeVMOpcodes {
|
|
|
|
public static final int UNIX_LINES = 1;
|
|
public static final int CASE_INSENSITIVE = 2;
|
|
public static final int COMMENTS = 4;
|
|
public static final int MULTILINE = 8;
|
|
public static final int LITERAL = 16;
|
|
public static final int DOTALL = 32;
|
|
public static final int UNICODE_CASE = 64;
|
|
public static final int CANON_EQ = 128;
|
|
|
|
private final int patternFlags;
|
|
private final String pattern;
|
|
|
|
protected Pattern(String pattern, int flags) {
|
|
this.pattern = pattern;
|
|
this.patternFlags = flags;
|
|
}
|
|
|
|
public static Pattern compile(String regex) {
|
|
return compile(regex, 0);
|
|
}
|
|
|
|
public static Pattern compile(String regex, int flags) {
|
|
try {
|
|
return new TrivialPattern(regex, flags);
|
|
} catch (UnsupportedOperationException handledBelow) { }
|
|
if (flags != 0) {
|
|
throw new UnsupportedOperationException("TODO");
|
|
}
|
|
if ("a(bb)?a".equals(regex)) {
|
|
int[] program = new int[] {
|
|
SAVE_OFFSET, 0,
|
|
CHAR, 'a',
|
|
SPLIT, 14,
|
|
SAVE_OFFSET, 2,
|
|
CHAR, 'b',
|
|
CHAR, 'b',
|
|
SAVE_OFFSET, 3,
|
|
/* 14 */ CHAR, 'a',
|
|
SAVE_OFFSET, 1
|
|
};
|
|
return new RegexPattern(regex, flags, new PikeVM(program, 1));
|
|
}
|
|
throw new UnsupportedOperationException("Cannot handle regex " + regex);
|
|
}
|
|
|
|
public int flags() {
|
|
return patternFlags;
|
|
}
|
|
|
|
public abstract Matcher matcher(CharSequence input);
|
|
|
|
public static boolean matches(String regex, CharSequence input) {
|
|
return Pattern.compile(regex).matcher(input).matches();
|
|
}
|
|
|
|
public String pattern() {
|
|
return pattern;
|
|
}
|
|
|
|
public String[] split(CharSequence input) {
|
|
return split(input, 0);
|
|
}
|
|
|
|
public String[] split(CharSequence input, int limit) {
|
|
if (limit <= 0) {
|
|
limit = Integer.MAX_VALUE;
|
|
}
|
|
Matcher matcher = matcher(input);
|
|
List<String> result = new ArrayList<String>();
|
|
int offset = 0;
|
|
for (;;) {
|
|
if (result.size() >= limit || !matcher.find()) {
|
|
break;
|
|
}
|
|
result.add(input.subSequence(offset, matcher.start()).toString());
|
|
offset = matcher.end();
|
|
}
|
|
if (offset == 0 || offset < input.length()) {
|
|
result.add(input.subSequence(offset, input.length()).toString());
|
|
}
|
|
return result.toArray(new String[result.size()]);
|
|
}
|
|
}
|