+++ /dev/null
-package org.apache.lucene.benchmark.byTask.tasks;
-
-/**
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-import java.lang.reflect.Constructor;
-import java.util.StringTokenizer;
-
-import org.apache.lucene.analysis.Analyzer;
-import org.apache.lucene.analysis.shingle.ShingleAnalyzerWrapper;
-import org.apache.lucene.benchmark.byTask.PerfRunData;
-import org.apache.lucene.util.Version;
-
-/**
- * Task to support benchmarking ShingleFilter / ShingleAnalyzerWrapper
- * <p>
- * <ul>
- * <li> <code>NewShingleAnalyzer</code> (constructs with all defaults)
- * <li> <code>NewShingleAnalyzer(analyzer:o.a.l.analysis.StandardAnalyzer,maxShingleSize:2,outputUnigrams:true)</code>
- * </ul>
- * </p>
- */
-public class NewShingleAnalyzerTask extends PerfTask {
-
- private String analyzerClassName = "standard.StandardAnalyzer";
- private int maxShingleSize = 2;
- private boolean outputUnigrams = true;
-
- public NewShingleAnalyzerTask(PerfRunData runData) {
- super(runData);
- }
-
- private void setAnalyzer() throws Exception {
- Class<? extends Analyzer> clazz = null;
- Analyzer wrappedAnalyzer;
- try {
- if (analyzerClassName == null || analyzerClassName.equals("")) {
- analyzerClassName
- = "org.apache.lucene.analysis.standard.StandardAnalyzer";
- }
- if (analyzerClassName.indexOf(".") == -1
- || analyzerClassName.startsWith("standard.")) {
- //there is no package name, assume o.a.l.analysis
- analyzerClassName = "org.apache.lucene.analysis." + analyzerClassName;
- }
- clazz = Class.forName(analyzerClassName).asSubclass(Analyzer.class);
- // first try to use a ctor with version parameter (needed for many new
- // Analyzers that have no default one anymore)
- Constructor<? extends Analyzer> ctor = clazz.getConstructor(Version.class);
- wrappedAnalyzer = ctor.newInstance(Version.LUCENE_CURRENT);
- } catch (NoSuchMethodException e) {
- // otherwise use default ctor
- wrappedAnalyzer = clazz.newInstance();
- }
- ShingleAnalyzerWrapper analyzer
- = new ShingleAnalyzerWrapper(wrappedAnalyzer, maxShingleSize);
- analyzer.setOutputUnigrams(outputUnigrams);
- getRunData().setAnalyzer(analyzer);
- }
-
- @Override
- public int doLogic() throws Exception {
- try {
- setAnalyzer();
- System.out.println
- ("Changed Analyzer to: ShingleAnalyzerWrapper, wrapping ShingleFilter over"
- + analyzerClassName);
- } catch (Exception e) {
- throw new RuntimeException("Error creating Analyzer", e);
- }
- return 1;
- }
-
- @Override
- public void setParams(String params) {
- super.setParams(params);
- StringTokenizer st = new StringTokenizer(params, ",");
- while (st.hasMoreTokens()) {
- String param = st.nextToken();
- StringTokenizer expr = new StringTokenizer(param, ":");
- String key = expr.nextToken();
- String value = expr.nextToken();
- if (key.equalsIgnoreCase("analyzer")) {
- analyzerClassName = value;
- } else if (key.equalsIgnoreCase("outputUnigrams")) {
- outputUnigrams = Boolean.parseBoolean(value);
- } else if (key.equalsIgnoreCase("maxShingleSize")) {
- maxShingleSize = (int)Double.parseDouble(value);
- } else {
- throw new RuntimeException("Unknown parameter " + param);
- }
- }
- }
-
- @Override
- public boolean supportsParams() {
- return true;
- }
-}