package com.jayway.jsonpath.internal; import com.jayway.jsonpath.Criteria; import com.jayway.jsonpath.Filter; import com.jayway.jsonpath.InvalidPathException; import com.jayway.jsonpath.Predicate; import com.jayway.jsonpath.internal.compiler.ArrayPathToken; import com.jayway.jsonpath.internal.compiler.PathToken; import com.jayway.jsonpath.internal.compiler.PredicatePathToken; import com.jayway.jsonpath.internal.compiler.PropertyPathToken; import com.jayway.jsonpath.internal.compiler.RootPathToken; import com.jayway.jsonpath.internal.compiler.ScanPathToken; import com.jayway.jsonpath.internal.compiler.WildcardPathToken; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import java.util.ArrayList; import java.util.LinkedList; import java.util.List; import java.util.regex.Pattern; import static com.jayway.jsonpath.internal.Utils.notEmpty; import static java.util.Arrays.asList; public class PathCompiler { private static final Logger logger = LoggerFactory.getLogger(PathCompiler.class); private static final String PROPERTY_OPEN = "['"; private static final String PROPERTY_CLOSE = "']"; private static final char DOCUMENT = '$'; private static final char ANY = '*'; private static final char PERIOD = '.'; private static final char BRACKET_OPEN = '['; private static final char BRACKET_CLOSE = ']'; private static final char SPACE = ' '; private static final Cache cache = new Cache(200); private static final String[] OPERATORS = {"==", ">=", "<=", "!=", "<", ">",}; public static Path compile(String path, Predicate... filters) { notEmpty(path, "Path may not be null empty"); path = path.trim(); LinkedList filterList = new LinkedList(asList(filters)); if (path.charAt(0) != '$' && path.charAt(0) != '@') { path = "$." + path; } boolean isRootPath = (path.charAt(0) == '$'); if(path.charAt(0) == '@'){ path = "$" + path.substring(1); } String cacheKey = path + isRootPath + filterList.toString(); Path p = cache.get(cacheKey); if (p != null) { logger.debug("Using cached path"); return p; } RootPathToken root = null; int i = 0; int positions; String fragment = ""; do { char current = path.charAt(i); switch (current) { case SPACE: throw new InvalidPathException("Space not allowed in path"); case DOCUMENT: fragment = "$"; i++; break; case BRACKET_OPEN: positions = fastForwardUntilClosed(path, i); fragment = path.substring(i, i + positions); i += positions; break; case PERIOD: i++; if (path.charAt(i) == PERIOD) { //This is a deep scan fragment = ".."; i++; } else { positions = fastForward(path, i); if (positions == 0) { continue; } else if (positions == 1 && path.charAt(i) == '*') { fragment = new String("[*]"); } else { assertValidFieldChars(path, i, positions); fragment = PROPERTY_OPEN + path.substring(i, i + positions) + PROPERTY_CLOSE; } i += positions; } break; case ANY: fragment = new String("[*]"); i++; break; default: positions = fastForward(path, i); fragment = PROPERTY_OPEN + path.substring(i, i + positions) + PROPERTY_CLOSE; i += positions; break; } if (root == null) { root = (RootPathToken) PathComponentAnalyzer.analyze(fragment, filterList); } else { root.append(PathComponentAnalyzer.analyze(fragment, filterList)); } } while (i < path.length()); Path pa = new CompiledPath(root, isRootPath); cache.put(cacheKey, pa); return pa; } private static void assertValidFieldChars(String s, int start, int positions) { int i = start; while (i < start + positions) { char c = s.charAt(i); if (!Character.isLetterOrDigit(c) && c != '-' && c != '_' && c != '$' && c != '@') { throw new InvalidPathException("Invalid field name! Use bracket notation if your filed names does not match pattern: ([a-zA-Z@][a-zA-Z0-9@\\$_\\-]*)$"); } i++; } } private static int fastForward(String s, int index) { int skipCount = 0; while (index < s.length()) { char current = s.charAt(index); if (current == PERIOD || current == BRACKET_OPEN || current == SPACE) { break; } index++; skipCount++; } return skipCount; } private static int fastForwardUntilClosed(String s, int index) { int skipCount = 0; int nestedBrackets = 0; //First char is always '[' no need to check it index++; skipCount++; while (index < s.length()) { char current = s.charAt(index); index++; skipCount++; if (current == BRACKET_CLOSE && nestedBrackets == 0) { break; } if (current == BRACKET_OPEN) { nestedBrackets++; } if (current == BRACKET_CLOSE) { nestedBrackets--; } } return skipCount; } //--------------------------------------------- // // // //--------------------------------------------- static class PathComponentAnalyzer { private static final Pattern FILTER_PATTERN = Pattern.compile("^\\[\\s*\\?\\s*[,\\s*\\?]*?\\s*]$"); //[?] or [?, ?, ...] private int i; private char current; private final LinkedList filterList; private final String pathFragment; PathComponentAnalyzer(String pathFragment, LinkedList filterList) { this.pathFragment = pathFragment; this.filterList = filterList; } static PathToken analyze(String pathFragment, LinkedList filterList) { return new PathComponentAnalyzer(pathFragment, filterList).analyze(); } public PathToken analyze() { if ("$".equals(pathFragment)) return new RootPathToken(); else if ("..".equals(pathFragment)) return new ScanPathToken(); else if ("[*]".equals(pathFragment)) return new WildcardPathToken(); else if (".*".equals(pathFragment)) return new WildcardPathToken(); else if ("[?]".equals(pathFragment)) return new PredicatePathToken(filterList.poll()); else if (FILTER_PATTERN.matcher(pathFragment).matches()) { final int criteriaCount = Utils.countMatches(pathFragment, "?"); List filters = new ArrayList(criteriaCount); for (int i = 0; i < criteriaCount; i++) { filters.add(filterList.poll()); } return new PredicatePathToken(filters); } this.i = 0; do { current = pathFragment.charAt(i); switch (current) { case '?': return analyzeCriteriaSequence2(); case '\'': return analyzeProperty(); default: if (Character.isDigit(current) || current == ':' || current == '-' || current == '@') { return analyzeArraySequence(); } i++; break; } } while (i < pathFragment.length()); throw new InvalidPathException("Could not analyze path component: " + pathFragment); } private int findNext(char charToFind, boolean disregardStringContent) { int x = i; boolean inProperty = false; char analyzing; boolean found = false; while(!found){ analyzing = pathFragment.charAt(x); if(analyzing == '\'' && disregardStringContent){ inProperty = !inProperty; } if(!inProperty){ found = (analyzing == charToFind); } x++; } return x-1; } //[?(@.foo)] //[?(@['foo'])] //[?(@.foo == 'bar')] //[?(@['foo']['bar'] == 'bar')] //[?(@ == 'bar')] //[?(@.category == $.store.book[0].category)] //[?(@.category == @['category'])] private PathToken analyzeCriteriaSequence2() { List predicates = new ArrayList(); int startPos = findNext('(', true) + 1; int stopPos = findNext(')', true); String[] split = pathFragment.substring(startPos, stopPos).split("&&"); for (String criteria : split) { int operatorIndex = -1; String left = ""; String operator = ""; String right = ""; for (int y = 0; y < OPERATORS.length; y++) { operatorIndex = criteria.indexOf(OPERATORS[y]); if (operatorIndex != -1) { operator = OPERATORS[y]; break; } } if (!operator.isEmpty()) { left = criteria.substring(0, operatorIndex).trim(); right = criteria.substring(operatorIndex + operator.length()).trim(); } else { left = criteria.trim(); } predicates.add(Criteria.create(left, operator, right)); } i = stopPos; return new PredicatePathToken(Filter.filter(predicates)); } /* //[?(@.foo)] //[?(@['foo'])] //[?(@.foo == 'bar')] //[?(@['foo']['bar'] == 'bar')] //[?(@ == 'bar')] private PathToken analyzeCriteriaSequence() { StringBuilder pathBuffer = new StringBuilder(); StringBuilder operatorBuffer = new StringBuilder(); StringBuilder valueBuffer = new StringBuilder(); List criteria = new ArrayList(); int bracketCount = 0; boolean functionBracketOpened = false; boolean functionBracketClosed = false; boolean propertyOpen = false; current = pathFragment.charAt(++i); //skip the '?' while (current != ']' || bracketCount != 0) { switch (current) { case '[': bracketCount++; pathBuffer.append(current); break; case ']': bracketCount--; pathBuffer.append(current); break; case '@': pathBuffer.append('$'); break; case '(': if (!propertyOpen) { functionBracketOpened = true; break; } case ')': if (!propertyOpen) { functionBracketClosed = true; break; } default: if ('\'' == current) { if (propertyOpen) { propertyOpen = false; } else { propertyOpen = true; } } if (bracketCount == 0 && isOperatorChar(current)) { operatorBuffer.append(current); } else if (bracketCount == 0 && isLogicOperatorChar(current)) { if (isLogicOperatorChar(pathFragment.charAt(i + 1))) { ++i; } criteria.add(Criteria.create(pathBuffer.toString().trim(), operatorBuffer.toString().trim(), valueBuffer.toString().trim())); pathBuffer.setLength(0); operatorBuffer.setLength(0); valueBuffer.setLength(0); } else if (operatorBuffer.length() > 0) { valueBuffer.append(current); } else { pathBuffer.append(current); } break; } current = pathFragment.charAt(++i); } if (!functionBracketOpened || !functionBracketClosed) { throw new InvalidPathException("Function wrapping brackets are not matching. A filter function must match [?()]"); } criteria.add(Criteria.create(pathBuffer.toString().trim(), operatorBuffer.toString().trim(), valueBuffer.toString().trim())); Filter filter2 = Filter.filter(criteria); return new PredicatePathToken(filter2); } */ private static boolean isAnd(char c) { return c == '&'; } private static boolean isOr(char c) { if (c == '|') { throw new UnsupportedOperationException("OR operator is not supported."); } return false; } private static boolean isLogicOperatorChar(char c) { return isAnd(c) || isOr(c); } private static boolean isOperatorChar(char c) { return c == '=' || c == '!' || c == '<' || c == '>'; } //"['foo']" private PathToken analyzeProperty() { List properties = new ArrayList(); StringBuilder buffer = new StringBuilder(); boolean propertyIsOpen = false; while (current != ']') { switch (current) { case '\'': if (propertyIsOpen) { properties.add(buffer.toString()); buffer.setLength(0); propertyIsOpen = false; } else { propertyIsOpen = true; } break; default: if (propertyIsOpen) { buffer.append(current); } break; } current = pathFragment.charAt(++i); } return new PropertyPathToken(properties); } //"[-1:]" sliceFrom //"[:1]" sliceTo //"[0:5]" sliceBetween //"[1]" //"[1,2,3]" //"[(@.length - 1)]" private PathToken analyzeArraySequence() { StringBuilder buffer = new StringBuilder(); List numbers = new ArrayList(); boolean contextSize = (current == '@'); boolean sliceTo = false; boolean sliceFrom = false; boolean sliceBetween = false; boolean indexSequence = false; boolean singleIndex = false; if (contextSize) { current = pathFragment.charAt(++i); current = pathFragment.charAt(++i); while (current != '-') { if (current == ' ' || current == '(' || current == ')') { current = pathFragment.charAt(++i); continue; } buffer.append(current); current = pathFragment.charAt(++i); } String function = buffer.toString(); buffer.setLength(0); if (!function.equals("size") && !function.equals("length")) { throw new InvalidPathException("Invalid function: @." + function + ". Supported functions are: [(@.length - n)] and [(@.size() - n)]"); } while (current != ')') { if (current == ' ') { current = pathFragment.charAt(++i); continue; } buffer.append(current); current = pathFragment.charAt(++i); } } else { while (Character.isDigit(current) || current == ',' || current == ' ' || current == ':' || current == '-') { switch (current) { case ' ': break; case ':': if (buffer.length() == 0) { //this is a tail slice [:12] sliceTo = true; current = pathFragment.charAt(++i); while (Character.isDigit(current) || current == ' ' || current == '-') { if (current != ' ') { buffer.append(current); } current = pathFragment.charAt(++i); } numbers.add(Integer.parseInt(buffer.toString())); buffer.setLength(0); } else { //we now this starts with [12:??? numbers.add(Integer.parseInt(buffer.toString())); buffer.setLength(0); current = pathFragment.charAt(++i); //this is a tail slice [:12] while (Character.isDigit(current) || current == ' ' || current == '-') { if (current != ' ') { buffer.append(current); } current = pathFragment.charAt(++i); } if (buffer.length() == 0) { sliceFrom = true; } else { sliceBetween = true; numbers.add(Integer.parseInt(buffer.toString())); buffer.setLength(0); } } break; case ',': numbers.add(Integer.parseInt(buffer.toString())); buffer.setLength(0); indexSequence = true; break; default: buffer.append(current); break; } if (current == ']') { break; } current = pathFragment.charAt(++i); } } if (buffer.length() > 0) { numbers.add(Integer.parseInt(buffer.toString())); } singleIndex = (numbers.size() == 1) && !sliceTo && !sliceFrom && !contextSize; if (logger.isTraceEnabled()) { logger.debug("numbers are : {}", numbers.toString()); logger.debug("sequence is singleNumber : {}", singleIndex); logger.debug("sequence is numberSequence : {}", indexSequence); logger.debug("sequence is sliceFrom : {}", sliceFrom); logger.debug("sequence is sliceTo : {}", sliceTo); logger.debug("sequence is sliceBetween : {}", sliceBetween); logger.debug("sequence is contextFetch : {}", contextSize); logger.debug("---------------------------------------------"); } ArrayPathToken.Operation operation = null; if (singleIndex) operation = ArrayPathToken.Operation.SINGLE_INDEX; else if (indexSequence) operation = ArrayPathToken.Operation.INDEX_SEQUENCE; else if (sliceFrom) operation = ArrayPathToken.Operation.SLICE_FROM; else if (sliceTo) operation = ArrayPathToken.Operation.SLICE_TO; else if (sliceBetween) operation = ArrayPathToken.Operation.SLICE_BETWEEN; else if (contextSize) operation = ArrayPathToken.Operation.CONTEXT_SIZE; assert operation != null; return new ArrayPathToken(numbers, operation); } } }