source.dussan.org Git - archiva.git/blob

   1 package org.apache.maven.repository.indexing;
   2
   3 /*
   4  * Copyright 2001-2005 The Apache Software Foundation.
   5  *
   6  * Licensed under the Apache License, Version 2.0 (the "License");
   7  * you may not use this file except in compliance with the License.
   8  * You may obtain a copy of the License at
   9  *
  10  *      http://www.apache.org/licenses/LICENSE-2.0
  11
  12  *
  13  * Unless required by applicable law or agreed to in writing, software
  14  * distributed under the License is distributed on an "AS IS" BASIS,
  15  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  16  * See the License for the specific language governing permissions and
  17  * limitations under the License.
  18  */
  19
  20 import java.io.Reader;
  21 import java.util.HashMap;
  22 import java.util.Map;
  23 import org.apache.lucene.analysis.Analyzer;
  24 import org.apache.lucene.analysis.CharTokenizer;
  25 import org.apache.lucene.analysis.TokenStream;
  26
  27 /**
  28  * Class created specifically to index artifacts
  29  *
  30  * @author Edwin Punzalan
  31  */
  32 public class ArtifactRepositoryIndexAnalyzer
  33     extends Analyzer
  34 {
  35     private Analyzer defaultAnalyzer;
  36
  37     /**
  38      * constructor to for this analyzer
  39      *
  40      * @character defaultAnalyzer the analyzer to use as default for the general fields of the artifact indeces
  41      */
  42     public ArtifactRepositoryIndexAnalyzer( Analyzer defaultAnalyzer )
  43     {
  44         this.defaultAnalyzer = defaultAnalyzer;
  45     }
  46
  47     /**
  48      * Method called by lucence during indexing operations
  49      *
  50      * @character fieldName the field name that the lucene object is currently processing
  51      * @character reader a Reader object to the index stream
  52      *
  53      * @return an analyzer to specific to the field name or the default analyzer if none is present
  54      */
  55     public TokenStream tokenStream( String fieldName, Reader reader )
  56     {
  57         TokenStream tokenStream;
  58
  59         if ( "version".equals( fieldName ) )
  60         {
  61             tokenStream = new VersionTokenizer( reader );
  62         }
  63         else
  64         {
  65             tokenStream = defaultAnalyzer.tokenStream( fieldName, reader );
  66         }
  67
  68         return tokenStream;
  69     }
  70
  71     /**
  72      * Class used to tokenize an artifact's version.
  73      */
  74     private class VersionTokenizer
  75         extends CharTokenizer
  76     {
  77         /**
  78          * Constructor with the required reader to the index stream
  79          *
  80          * @reader the Reader object of the index stream
  81          */
  82         public VersionTokenizer( Reader reader )
  83         {
  84             super( reader );
  85         }
  86
  87         /**
  88          * method that lucene calls to check tokenization of a stream character
  89          *
  90          * @param character char currently being processed
  91          *
  92          * @return true if the char is a token, false if the char is a stop char
  93          */
  94         protected boolean isTokenChar( char character )
  95         {
  96             boolean token;
  97
  98             switch( character )
  99             {
 100                 case '.':
 101                 case '-':
 102                     token = false; break;
 103                 default:
 104                     token = true;
 105             }
 106
 107             return token;
 108         }
 109     }
 110 }