| /* |
| * Copyright (C) 2010 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #define LOG_TAG "NativePattern" |
| |
| #include <stdlib.h> |
| |
| #include <nativehelper/JNIHelp.h> |
| #include <nativehelper/jni_macros.h> |
| |
| #include "IcuUtilities.h" |
| #include "MatcherState.h" |
| #include "unicode/parseerr.h" |
| #include "unicode/regex.h" |
| |
| #include "JniConstants.h" |
| #include "ScopedJavaUnicodeString.h" |
| |
| // ICU documentation: http://icu-project.org/apiref/icu4c/classRegexPattern.html |
| |
| static const char* regexDetailMessage(UErrorCode status) { |
| // These human-readable error messages were culled from "utypes.h", and then slightly tuned |
| // to make more sense in context. |
| // If we don't have a special-case, we'll just return the textual name of |
| // the enum value (such as U_REGEX_RULE_SYNTAX), which is better than nothing. |
| switch (status) { |
| case U_REGEX_INTERNAL_ERROR: return "An internal error was detected"; |
| case U_REGEX_RULE_SYNTAX: return "Syntax error in regexp pattern"; |
| case U_REGEX_INVALID_STATE: return "Matcher in invalid state for requested operation"; |
| case U_REGEX_BAD_ESCAPE_SEQUENCE: return "Unrecognized backslash escape sequence in pattern"; |
| case U_REGEX_PROPERTY_SYNTAX: return "Incorrect Unicode property"; |
| case U_REGEX_UNIMPLEMENTED: return "Use of unimplemented feature"; |
| case U_REGEX_MISMATCHED_PAREN: return "Incorrectly nested parentheses in regexp pattern"; |
| case U_REGEX_NUMBER_TOO_BIG: return "Decimal number is too large"; |
| case U_REGEX_BAD_INTERVAL: return "Error in {min,max} interval"; |
| case U_REGEX_MAX_LT_MIN: return "In {min,max}, max is less than min"; |
| case U_REGEX_INVALID_BACK_REF: return "Back-reference to a non-existent capture group"; |
| case U_REGEX_INVALID_FLAG: return "Invalid value for match mode flags"; |
| case U_REGEX_LOOK_BEHIND_LIMIT: return "Look-behind pattern matches must have a bounded maximum length"; |
| case U_REGEX_SET_CONTAINS_STRING: return "Regular expressions cannot have UnicodeSets containing strings"; |
| case U_REGEX_OCTAL_TOO_BIG: return "Octal character constants must be <= 0377."; |
| case U_REGEX_MISSING_CLOSE_BRACKET: return "Missing closing bracket in character class"; |
| case U_REGEX_INVALID_RANGE: return "In a character range [x-y], x is greater than y"; |
| case U_REGEX_STACK_OVERFLOW: return "Regular expression backtrack stack overflow"; |
| case U_REGEX_TIME_OUT: return "Maximum allowed match time exceeded"; |
| case U_REGEX_STOPPED_BY_CALLER: return "Matching operation aborted by user callback function"; |
| default: |
| return u_errorName(status); |
| } |
| } |
| |
| static void throwPatternSyntaxException(JNIEnv* env, UErrorCode status, jstring pattern, UParseError error) { |
| static jmethodID method = env->GetMethodID(JniConstants::GetPatternSyntaxExceptionClass(env), |
| "<init>", "(Ljava/lang/String;Ljava/lang/String;I)V"); |
| jstring message = env->NewStringUTF(regexDetailMessage(status)); |
| jclass exceptionClass = JniConstants::GetPatternSyntaxExceptionClass(env); |
| jobject exception = env->NewObject(exceptionClass, method, message, pattern, error.offset); |
| env->Throw(reinterpret_cast<jthrowable>(exception)); |
| } |
| |
| static void NativePattern_free(void* addr) { |
| delete reinterpret_cast<icu::RegexPattern*>(addr); |
| } |
| |
| static jlong NativePattern_getNativeFinalizer(JNIEnv*, jclass) { |
| return reinterpret_cast<jlong>(&NativePattern_free); |
| } |
| |
| static jlong NativePattern_compileImpl(JNIEnv* env, jclass, jstring javaRegex, jint flags) { |
| flags |= UREGEX_ERROR_ON_UNKNOWN_ESCAPES; |
| |
| UErrorCode status = U_ZERO_ERROR; |
| UParseError error; |
| error.offset = -1; |
| |
| ScopedJavaUnicodeString regex(env, javaRegex); |
| if (!regex.valid()) { |
| return 0; |
| } |
| icu::UnicodeString& regexString(regex.unicodeString()); |
| icu::RegexPattern* result = icu::RegexPattern::compile(regexString, flags, error, status); |
| if (!U_SUCCESS(status)) { |
| throwPatternSyntaxException(env, status, javaRegex, error); |
| } |
| return static_cast<jlong>(reinterpret_cast<uintptr_t>(result)); |
| } |
| |
| static jlong NativePattern_openMatcherImpl(JNIEnv* env, jclass, jlong addr) { |
| icu::RegexPattern* pattern = reinterpret_cast<icu::RegexPattern*>(static_cast<uintptr_t>(addr)); |
| UErrorCode status = U_ZERO_ERROR; |
| icu::RegexMatcher* result = pattern->matcher(status); |
| if (maybeThrowIcuException(env, "RegexPattern::matcher", status)) { |
| return 0; |
| } |
| |
| return reinterpret_cast<uintptr_t>(new MatcherState(result)); |
| } |
| |
| static jint NativePattern_getMatchedGroupIndexImpl(JNIEnv* env, jclass, jlong addr, jstring javaGroupName) { |
| icu::RegexPattern* pattern = reinterpret_cast<icu::RegexPattern*>(static_cast<uintptr_t>(addr)); |
| ScopedJavaUnicodeString groupName(env, javaGroupName); |
| UErrorCode status = U_ZERO_ERROR; |
| |
| jint result = pattern->groupNumberFromName(groupName.unicodeString(), status); |
| if (U_SUCCESS(status)) { |
| return result; |
| } |
| if (status == U_REGEX_INVALID_CAPTURE_GROUP_NAME) { |
| return -1; |
| } |
| maybeThrowIcuException(env, "RegexPattern::groupNumberFromName", status); |
| return -1; |
| } |
| |
| |
| static JNINativeMethod gMethods[] = { |
| NATIVE_METHOD(NativePattern, compileImpl, "(Ljava/lang/String;I)J"), |
| NATIVE_METHOD(NativePattern, getNativeFinalizer, "()J"), |
| NATIVE_METHOD(NativePattern, openMatcherImpl, "(J)J"), |
| NATIVE_METHOD(NativePattern, getMatchedGroupIndexImpl, "(JLjava/lang/String;)I"), |
| }; |
| |
| void register_com_android_icu_util_regex_NativePattern(JNIEnv* env) { |
| jniRegisterNativeMethods(env, "com/android/icu/util/regex/NativePattern", gMethods, NELEM(gMethods)); |
| } |