| Index: third_party/re2/re2/set.cc
|
| diff --git a/third_party/re2/re2/set.cc b/third_party/re2/re2/set.cc
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..2bcd30acb486dc379b7dd3d04ca831402ceae3ed
|
| --- /dev/null
|
| +++ b/third_party/re2/re2/set.cc
|
| @@ -0,0 +1,113 @@
|
| +// Copyright 2010 The RE2 Authors. All Rights Reserved.
|
| +// Use of this source code is governed by a BSD-style
|
| +// license that can be found in the LICENSE file.
|
| +
|
| +#include "re2/set.h"
|
| +
|
| +#include "util/util.h"
|
| +#include "re2/stringpiece.h"
|
| +#include "re2/prog.h"
|
| +#include "re2/re2.h"
|
| +#include "re2/regexp.h"
|
| +
|
| +using namespace re2;
|
| +
|
| +RE2::Set::Set(const RE2::Options& options, RE2::Anchor anchor) {
|
| +  compiled_ = false;  // Add() is permitted until Compile() sets this.
|
| +  prog_ = NULL;       // Assigned by Compile(); deleted by the destructor.
|
| +  anchor_ = anchor;   // Passed to Prog::CompileSet() by Compile().
|
| +  options_.Copy(options);  // Store the caller's options in options_.
|
| +}
|
| +
|
| +RE2::Set::~Set() {
|
| +  // Decref every regexp still held in re_ (Compile() clears it), then free prog_.
|
| +  for (size_t i = 0; i < re_.size(); i++) re_[i]->Decref();  // size_t: no sign mix
|
| +  delete prog_;
|
| +}
|
| +
|
| +int RE2::Set::Add(const StringPiece& pattern, string* error) {
|
| +  // Parses pattern and appends it to the set. Returns the pattern's index,
|
| +  // or -1 if the set is already compiled or the pattern fails to parse.
|
| +  if (compiled_) {
|
| +    LOG(DFATAL) << "RE2::Set::Add after Compile";
|
| +    return -1;
|
| +  }
|
| +  const Regexp::ParseFlags flags =
|
| +      static_cast<Regexp::ParseFlags>(options_.ParseFlags());
|
| +  RegexpStatus parse_status;
|
| +  re2::Regexp* parsed = Regexp::Parse(pattern, flags, &parse_status);
|
| +  if (parsed == NULL) {
|
| +    if (error != NULL)
|
| +      *error = parse_status.Text();
|
| +    if (options_.log_errors())
|
| +      LOG(ERROR) << "Error parsing '" << pattern << "': " << parse_status.Text();
|
| +    return -1;
|
| +  }
|
| +  // The index is the pattern's position in re_. A HaveMatch(index) node is
|
| +  // concatenated after the pattern before the result is stored.
|
| +  const int index = re_.size();
|
| +  re2::Regexp* marker = re2::Regexp::HaveMatch(index, flags);
|
| +  re2::Regexp* tagged;
|
| +  if (parsed->op() != kRegexpConcat) {
|
| +    re2::Regexp* both[2] = { parsed, marker };
|
| +    tagged = re2::Regexp::Concat(both, 2, flags);
|
| +  } else {
|
| +    // Already a concatenation: rebuild it with the marker as the last operand.
|
| +    const int count = parsed->nsub();
|
| +    re2::Regexp** parts = new re2::Regexp*[count + 1];
|
| +    for (int k = 0; k < count; k++)
|
| +      parts[k] = parsed->sub()[k]->Incref();
|
| +    parts[count] = marker;
|
| +    parsed->Decref();
|
| +    tagged = re2::Regexp::Concat(parts, count + 1, flags);
|
| +    delete[] parts;
|
| +  }
|
| +  re_.push_back(tagged);
|
| +  return index;
|
| +}
|
| +
|
| +bool RE2::Set::Compile() {
|
| +  // Combines every added pattern into one alternation and compiles it into
|
| +  // prog_. May be called once; returns false if simplifying or compiling fails.
|
| +  if (compiled_) {
|
| +    LOG(DFATAL) << "RE2::Set::Compile multiple times";
|
| +    return false;
|
| +  }
|
| +  compiled_ = true;  // Set before the work below, so a failed Compile counts too.
|
| +  Regexp::ParseFlags pf = static_cast<Regexp::ParseFlags>(
|
| +      options_.ParseFlags());
|
| +  // Indexing re_[0] on an empty vector is undefined; pass NULL with size 0.
|
| +  re2::Regexp** subs = re_.empty() ? NULL : &re_[0];
|
| +  re2::Regexp* re = re2::Regexp::Alternate(subs, re_.size(), pf);
|
| +  re_.clear();  // NOTE(review): presumably Alternate took over the refs - confirm.
|
| +  re2::Regexp* sre = re->Simplify();
|
| +  re->Decref();
|
| +  if (sre == NULL) {
|
| +    if (options_.log_errors())
|
| +      LOG(ERROR) << "Error simplifying during Compile.";
|
| +    return false;
|
| +  }
|
| +  prog_ = Prog::CompileSet(options_, anchor_, sre);
|
| +  return prog_ != NULL;
|
| +}
|
| +
|
| +bool RE2::Set::Match(const StringPiece& text, vector<int>* v) const {
|
| +  // Searches text with the compiled set; true only if it matched and *v is non-empty.
|
| +  if (!compiled_) {
|
| +    LOG(DFATAL) << "RE2::Set::Match without Compile";
|
| +    return false;
|
| +  }
|
| +  if (prog_ == NULL) {  // Compile() returned false, leaving no program to run.
|
| +    LOG(DFATAL) << "RE2::Set::Match after failed Compile";
|
| +    return false;
|
| +  }
|
| +  v->clear();
|
| +  bool failed = false;  // Well-defined even if SearchDFA never writes it.
|
| +  bool ret = prog_->SearchDFA(text, text, Prog::kAnchored,
|
| +                              Prog::kManyMatch, NULL, &failed, v);
|
| +  if (failed)
|
| +    LOG(DFATAL) << "RE2::Set::Match: DFA ran out of cache space";
|
| +  if (ret && v->empty())  // A reported match must name at least one pattern.
|
| +    LOG(DFATAL) << "RE2::Set::Match: match but unknown regexp set";
|
| +  return ret && !v->empty();
|
| +}
|
|
|