1 package org.apache.archiva.indexer.search;
4 * Licensed to the Apache Software Foundation (ASF) under one
5 * or more contributor license agreements. See the NOTICE file
6 * distributed with this work for additional information
7 * regarding copyright ownership. The ASF licenses this file
8 * to you under the Apache License, Version 2.0 (the
9 * "License"); you may not use this file except in compliance
10 * with the License. You may obtain a copy of the License at
12 * http://www.apache.org/licenses/LICENSE-2.0
14 * Unless required by applicable law or agreed to in writing,
15 * software distributed under the License is distributed on an
16 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
17 * KIND, either express or implied. See the License for the
18 * specific language governing permissions and limitations
22 import org.apache.archiva.admin.model.RepositoryAdminException;
23 import org.apache.archiva.admin.model.beans.ManagedRepository;
24 import org.apache.archiva.admin.model.beans.ProxyConnector;
25 import org.apache.archiva.admin.model.managed.ManagedRepositoryAdmin;
26 import org.apache.archiva.admin.model.proxyconnector.ProxyConnectorAdmin;
27 import org.apache.archiva.common.plexusbridge.MavenIndexerUtils;
28 import org.apache.archiva.common.plexusbridge.PlexusSisuBridge;
29 import org.apache.archiva.common.plexusbridge.PlexusSisuBridgeException;
30 import org.apache.archiva.indexer.util.SearchUtil;
31 import org.apache.commons.lang.StringUtils;
32 import org.apache.lucene.search.BooleanClause.Occur;
33 import org.apache.lucene.search.BooleanQuery;
34 import org.apache.maven.index.ArtifactInfo;
35 import org.apache.maven.index.FlatSearchRequest;
36 import org.apache.maven.index.FlatSearchResponse;
37 import org.apache.maven.index.MAVEN;
38 import org.apache.maven.index.NexusIndexer;
39 import org.apache.maven.index.OSGI;
40 import org.apache.maven.index.context.IndexCreator;
41 import org.apache.maven.index.context.IndexingContext;
42 import org.apache.maven.index.context.UnsupportedExistingLuceneIndexException;
43 import org.apache.maven.index.expr.StringSearchExpression;
44 import org.slf4j.Logger;
45 import org.slf4j.LoggerFactory;
46 import org.springframework.stereotype.Service;
48 import javax.inject.Inject;
50 import java.io.IOException;
51 import java.util.ArrayList;
52 import java.util.Collections;
53 import java.util.HashSet;
54 import java.util.List;
59 * RepositorySearch implementation which uses the Nexus Indexer for searching.
61 @Service( "nexusSearch" )
62 public class NexusRepositorySearch
63 implements RepositorySearch
// Logger named after the runtime class of this instance.
65 private Logger log = LoggerFactory.getLogger( getClass() );
// Indexer used to build field queries, register/look up indexing contexts and run flat searches.
67 private NexusIndexer indexer;
// Source of managed repository configuration (id, location, index directory, scanned flag).
69 private ManagedRepositoryAdmin managedRepositoryAdmin;
// Source of the proxy connector map used to relate managed repositories to remote repositories.
71 private ProxyConnectorAdmin proxyConnectorAdmin;
// Supplies the index creators handed over when a new indexing context is registered.
73 private MavenIndexerUtils mavenIndexerUtils;
/**
 * Wires the search component with its collaborators.
 *
 * @param plexusSisuBridge       bridge through which the {@link NexusIndexer} is looked up
 * @param managedRepositoryAdmin access to the managed repository configuration
 * @param mavenIndexerUtils      provider of the index creators
 * @param proxyConnectorAdmin    access to the proxy connector configuration
 * @throws PlexusSisuBridgeException propagated from the indexer lookup
 */
public NexusRepositorySearch( PlexusSisuBridge plexusSisuBridge, ManagedRepositoryAdmin managedRepositoryAdmin,
                              MavenIndexerUtils mavenIndexerUtils, ProxyConnectorAdmin proxyConnectorAdmin )
    throws PlexusSisuBridgeException
{
    // plain collaborators first; the lookup is the only step that can throw
    this.proxyConnectorAdmin = proxyConnectorAdmin;
    this.mavenIndexerUtils = mavenIndexerUtils;
    this.managedRepositoryAdmin = managedRepositoryAdmin;
    this.indexer = plexusSisuBridge.lookup( NexusIndexer.class );
}
87 * @see RepositorySearch#search(String, List, String, SearchResultLimits, List)
89 public SearchResults search( String principal, List<String> selectedRepos, String term, SearchResultLimits limits,
90 List<String> previousSearchTerms )
91 throws RepositorySearchException
93 List<String> indexingContextIds = addIndexingContexts( selectedRepos );
95 // since upgrade to nexus 2.0.0, query has changed from g:[QUERIED TERM]* to g:*[QUERIED TERM]*
96 // resulting to more wildcard searches so we need to increase max clause count
97 BooleanQuery.setMaxClauseCount( Integer.MAX_VALUE );
98 BooleanQuery q = new BooleanQuery();
100 if ( previousSearchTerms == null || previousSearchTerms.isEmpty() )
102 constructQuery( term, q );
106 for ( String previousTerm : previousSearchTerms )
108 BooleanQuery iQuery = new BooleanQuery();
109 constructQuery( previousTerm, iQuery );
111 q.add( iQuery, Occur.MUST );
114 BooleanQuery iQuery = new BooleanQuery();
115 constructQuery( term, iQuery );
116 q.add( iQuery, Occur.MUST );
119 // we retun only artifacts without classifier in quick search, olamy cannot find a way to say with this field empty
120 // FIXME cannot find a way currently to setup this in constructQuery !!!
121 return search( limits, q, indexingContextIds, NoClassifierArtifactInfoFiler.LIST, principal, selectedRepos );
126 * @see RepositorySearch#search(String, SearchFields, SearchResultLimits)
// Field-based search: every non-blank field of searchFields contributes one clause to a single boolean query,
// which is then run against the indexing contexts obtained for searchFields.getRepositories().
// Throws RepositorySearchException when the repository list is null or when no field produced a clause.
// NOTE(review): the occurrence argument of each q.add(...) call is not visible in this view - confirm it
// before relying on AND/OR semantics between the fields.
128 public SearchResults search( String principal, SearchFields searchFields, SearchResultLimits limits )
129 throws RepositorySearchException
// fail fast: a repository selection is mandatory for this search variant
131 if ( searchFields.getRepositories() == null )
133 throw new RepositorySearchException( "Repositories cannot be null." );
136 List<String> indexingContextIds = addIndexingContexts( searchFields.getRepositories() );
138 BooleanQuery q = new BooleanQuery();
// Maven coordinate fields
139 if ( StringUtils.isNotBlank( searchFields.getGroupId() ) )
141 q.add( indexer.constructQuery( MAVEN.GROUP_ID, new StringSearchExpression( searchFields.getGroupId() ) ),
145 if ( StringUtils.isNotBlank( searchFields.getArtifactId() ) )
148 indexer.constructQuery( MAVEN.ARTIFACT_ID, new StringSearchExpression( searchFields.getArtifactId() ) ),
152 if ( StringUtils.isNotBlank( searchFields.getVersion() ) )
154 q.add( indexer.constructQuery( MAVEN.VERSION, new StringSearchExpression( searchFields.getVersion() ) ),
158 if ( StringUtils.isNotBlank( searchFields.getPackaging() ) )
160 q.add( indexer.constructQuery( MAVEN.PACKAGING, new StringSearchExpression( searchFields.getPackaging() ) ),
164 if ( StringUtils.isNotBlank( searchFields.getClassName() ) )
167 indexer.constructQuery( MAVEN.CLASSNAMES, new StringSearchExpression( searchFields.getClassName() ) ),
// OSGi bundle metadata fields
171 if ( StringUtils.isNotBlank( searchFields.getBundleSymbolicName() ) )
173 q.add( indexer.constructQuery( OSGI.SYMBOLIC_NAME,
174 new StringSearchExpression( searchFields.getBundleSymbolicName() ) ),
178 if ( StringUtils.isNotBlank( searchFields.getBundleVersion() ) )
181 indexer.constructQuery( OSGI.VERSION, new StringSearchExpression( searchFields.getBundleVersion() ) ),
185 if ( StringUtils.isNotBlank( searchFields.getBundleExportPackage() ) )
187 q.add( indexer.constructQuery( OSGI.EXPORT_PACKAGE,
188 new StringSearchExpression( searchFields.getBundleExportPackage() ) ),
192 if ( StringUtils.isNotBlank( searchFields.getBundleExportService() ) )
194 q.add( indexer.constructQuery( OSGI.EXPORT_SERVICE,
195 new StringSearchExpression( searchFields.getBundleExportService() ) ),
199 if ( StringUtils.isNotBlank( searchFields.getBundleImportPackage() ) )
201 q.add( indexer.constructQuery( OSGI.IMPORT_PACKAGE,
202 new StringSearchExpression( searchFields.getBundleImportPackage() ) ),
206 if ( StringUtils.isNotBlank( searchFields.getBundleName() ) )
208 q.add( indexer.constructQuery( OSGI.NAME, new StringSearchExpression( searchFields.getBundleName() ) ),
// unlike the quick search, the classifier is searchable here and no result filter is applied below
212 if ( StringUtils.isNotBlank( searchFields.getClassifier() ) )
215 indexer.constructQuery( MAVEN.CLASSIFIER, new StringSearchExpression( searchFields.getClassifier() ) ),
// a query without any clause means that every field was blank
219 if ( q.getClauses() == null || q.getClauses().length <= 0 )
221 throw new RepositorySearchException( "No search fields set." );
224 return search( limits, q, indexingContextIds, Collections.<ArtifactInfoFiler>emptyList(), principal,
225 searchFields.getRepositories() );
228 private SearchResults search( SearchResultLimits limits, BooleanQuery q, List<String> indexingContextIds,
229 List<? extends ArtifactInfoFiler> filters, String principal,
230 List<String> selectedRepos )
231 throws RepositorySearchException
236 FlatSearchRequest request = new FlatSearchRequest( q );
237 request.setContexts( getIndexingContexts( indexingContextIds ) );
238 FlatSearchResponse response = indexer.searchFlat( request );
240 if ( response == null || response.getTotalHits() == 0 )
242 SearchResults results = new SearchResults();
243 results.setLimits( limits );
247 return convertToSearchResults( response, limits, filters, principal, selectedRepos );
249 catch ( IOException e )
251 throw new RepositorySearchException( e.getMessage(), e );
253 catch ( RepositoryAdminException e )
255 throw new RepositorySearchException( e.getMessage(), e );
260 private List<IndexingContext> getIndexingContexts( List<String> ids )
262 List<IndexingContext> contexts = new ArrayList<IndexingContext>( ids.size() );
264 for ( String id : ids )
266 IndexingContext context = indexer.getIndexingContexts().get( id );
267 if ( context != null )
269 contexts.add( context );
273 log.warn( "context with id {} not exists", id );
280 private void constructQuery( String term, BooleanQuery q )
282 q.add( indexer.constructQuery( MAVEN.GROUP_ID, new StringSearchExpression( term ) ), Occur.SHOULD );
283 q.add( indexer.constructQuery( MAVEN.ARTIFACT_ID, new StringSearchExpression( term ) ), Occur.SHOULD );
284 q.add( indexer.constructQuery( MAVEN.VERSION, new StringSearchExpression( term ) ), Occur.SHOULD );
285 q.add( indexer.constructQuery( MAVEN.PACKAGING, new StringSearchExpression( term ) ), Occur.SHOULD );
286 q.add( indexer.constructQuery( MAVEN.CLASSNAMES, new StringSearchExpression( term ) ), Occur.SHOULD );
289 // new WildcardQuery( new Term( MAVEN.CLASSNAMES.getFieldName(), "*" ) );
290 //q.add( query, Occur.MUST_NOT );
291 // olamy IMHO we could set this option as at least one must match
292 //q.setMinimumNumberShouldMatch( 1 );
297 * @param selectedRepos
298 * @return indexing contextId used
300 private List<String> addIndexingContexts( List<String> selectedRepos )
302 Set<String> indexingContextIds = new HashSet<String>();
303 for ( String repo : selectedRepos )
307 ManagedRepository repoConfig = managedRepositoryAdmin.getManagedRepository( repo );
309 if ( repoConfig != null )
311 String indexDir = repoConfig.getIndexDirectory();
312 File indexDirectory = null;
313 if ( indexDir != null && !"".equals( indexDir ) )
315 indexDirectory = new File( repoConfig.getIndexDirectory() );
319 indexDirectory = new File( repoConfig.getLocation(), ".indexer" );
322 IndexingContext context = indexer.getIndexingContexts().get( repoConfig.getId() );
323 if ( context != null )
325 // alreday here so no need to record it again
326 log.debug( "index with id {} already exists skip adding it", repoConfig.getId() );
327 // set searchable flag
328 context.setSearchable( repoConfig.isScanned() );
329 indexingContextIds.add( context.getId() );
330 indexingContextIds.addAll( getRemoteIndexingContextIds( repo ) );
334 context = indexer.addIndexingContext( repoConfig.getId(), repoConfig.getId(),
335 new File( repoConfig.getLocation() ), indexDirectory, null,
336 null, getAllIndexCreators() );
337 context.setSearchable( repoConfig.isScanned() );
338 if ( context.isSearchable() )
340 indexingContextIds.addAll( getRemoteIndexingContextIds( repo ) );
341 indexingContextIds.add( context.getId() );
345 log.warn( "indexingContext with id {} not searchable", repoConfig.getId() );
351 log.warn( "Repository '" + repo + "' not found in configuration." );
354 catch ( UnsupportedExistingLuceneIndexException e )
356 log.warn( "Error accessing index of repository '" + repo + "' : " + e.getMessage() );
359 catch ( IOException e )
361 log.warn( "IO error occured while accessing index of repository '" + repo + "' : " + e.getMessage() );
364 catch ( RepositoryAdminException e )
366 log.warn( "RepositoryAdminException occured while accessing index of repository '" + repo + "' : "
372 return new ArrayList<String>( indexingContextIds );
376 private Set<String> getRemoteIndexingContextIds( String managedRepoId )
377 throws RepositoryAdminException
379 Set<String> ids = new HashSet<String>();
381 List<ProxyConnector> proxyConnectors = proxyConnectorAdmin.getProxyConnectorAsMap().get( managedRepoId );
383 if ( proxyConnectors == null || proxyConnectors.isEmpty() )
388 for ( ProxyConnector proxyConnector : proxyConnectors )
390 String remoteId = "remote-" + proxyConnector.getTargetRepoId();
391 IndexingContext context = indexer.getIndexingContexts().get( remoteId );
392 if ( context != null && context.isSearchable() )
402 protected List<? extends IndexCreator> getAllIndexCreators()
404 return mavenIndexerUtils.getAllIndexCreators();
408 private SearchResults convertToSearchResults( FlatSearchResponse response, SearchResultLimits limits,
409 List<? extends ArtifactInfoFiler> artifactInfoFilers,
410 String principal, List<String> selectedRepos )
411 throws RepositoryAdminException
413 SearchResults results = new SearchResults();
414 Set<ArtifactInfo> artifactInfos = response.getResults();
416 for ( ArtifactInfo artifactInfo : artifactInfos )
418 String id = SearchUtil.getHitId( artifactInfo.groupId, artifactInfo.artifactId, artifactInfo.classifier,
419 artifactInfo.packaging );
420 Map<String, SearchResultHit> hitsMap = results.getHitsMap();
422 if ( !applyArtifactInfoFilters( artifactInfo, artifactInfoFilers, hitsMap ) )
427 SearchResultHit hit = hitsMap.get( id );
430 if ( !hit.getVersions().contains( artifactInfo.version ) )
432 hit.addVersion( artifactInfo.version );
437 hit = new SearchResultHit();
438 hit.setArtifactId( artifactInfo.artifactId );
439 hit.setGroupId( artifactInfo.groupId );
440 hit.setRepositoryId( artifactInfo.repository );
441 hit.addVersion( artifactInfo.version );
442 hit.setBundleExportPackage( artifactInfo.bundleExportPackage );
443 hit.setBundleExportService( artifactInfo.bundleExportService );
444 hit.setBundleSymbolicName( artifactInfo.bundleSymbolicName );
445 hit.setBundleVersion( artifactInfo.bundleVersion );
446 hit.setBundleDescription( artifactInfo.bundleDescription );
447 hit.setBundleDocUrl( artifactInfo.bundleDocUrl );
448 hit.setBundleRequireBundle( artifactInfo.bundleRequireBundle );
449 hit.setBundleImportPackage( artifactInfo.bundleImportPackage );
450 hit.setBundleLicense( artifactInfo.bundleLicense );
451 hit.setBundleName( artifactInfo.bundleName );
452 hit.setContext( artifactInfo.context );
453 hit.setGoals( artifactInfo.goals );
454 hit.setPrefix( artifactInfo.prefix );
455 hit.setPackaging( artifactInfo.packaging );
456 hit.setClassifier( artifactInfo.classifier );
457 hit.setUrl( getBaseUrl( artifactInfo, selectedRepos ) );
460 results.addHit( id, hit );
463 results.setTotalHits( response.getTotalHitsCount() );
464 results.setReturnedHitsCount( response.getReturnedHitsCount() );
465 results.setLimits( limits );
467 if ( limits == null || limits.getSelectedPage() == SearchResultLimits.ALL_PAGES )
473 return paginate( results );
478 * calculate baseUrl without the context and base Archiva Url
480 * @param artifactInfo
// Builds the path of an artifact in the form
//   /<repo>/<groupId with '.' replaced by '/'>/<artifactId>/<version>/<artifactId>-<version>[-<classifier>]
// followed by a suffix derived from the packaging.
// For a context id starting with "remote-", <repo> is the managed repository returned by getManagedRepoId()
// for that remote; for any other context it is the context id itself.
// selectedRepos is only forwarded to getManagedRepoId(); RepositoryAdminException is propagated from there.
483 protected String getBaseUrl( ArtifactInfo artifactInfo, List<String> selectedRepos )
484 throws RepositoryAdminException
486 StringBuilder sb = new StringBuilder();
487 if ( StringUtils.startsWith( artifactInfo.context, "remote-" ) )
489 // remote index hit: look up a managed repository that proxies this remote, preferring the selected repos
490 // (presumably the ones the current user may read - confirm against callers)
491 String managedRepoId =
492 getManagedRepoId( StringUtils.substringAfter( artifactInfo.context, "remote-" ), selectedRepos );
// when no managed repository is found, no <repo> segment is written at all
493 if ( managedRepoId != null )
495 sb.append( '/' ).append( managedRepoId );
500 sb.append( '/' ).append( artifactInfo.context );
503 sb.append( '/' ).append( StringUtils.replaceChars( artifactInfo.groupId, '.', '/' ) );
504 sb.append( '/' ).append( artifactInfo.artifactId );
505 sb.append( '/' ).append( artifactInfo.version );
506 sb.append( '/' ).append( artifactInfo.artifactId );
507 sb.append( '-' ).append( artifactInfo.version );
508 if ( StringUtils.isNotBlank( artifactInfo.classifier ) )
510 sb.append( '-' ).append( artifactInfo.classifier );
512 // maven-plugin packaging is a jar
// NOTE(review): the statement executed for maven-plugin packaging is not visible in this view - confirm
// that it writes the '.' separator as well as the extension
513 if ( StringUtils.equals( "maven-plugin", artifactInfo.packaging ) )
519 sb.append( '.' ).append( artifactInfo.packaging );
522 return sb.toString();
526 * return a managed repo for a remote result
529 * @param selectedRepos
531 * @throws RepositoryAdminException
533 private String getManagedRepoId( String remoteRepo, List<String> selectedRepos )
534 throws RepositoryAdminException
536 Map<String, List<ProxyConnector>> proxyConnectorMap = proxyConnectorAdmin.getProxyConnectorAsMap();
537 if ( proxyConnectorMap == null || proxyConnectorMap.isEmpty() )
541 if ( selectedRepos != null && !selectedRepos.isEmpty() )
543 for ( Map.Entry<String, List<ProxyConnector>> entry : proxyConnectorMap.entrySet() )
545 if ( selectedRepos.contains( entry.getKey() ) )
547 for ( ProxyConnector proxyConnector : entry.getValue() )
549 if ( StringUtils.equals( remoteRepo, proxyConnector.getTargetRepoId() ) )
551 return proxyConnector.getSourceRepoId();
558 // we don't find in search selected repos so return the first one
559 for ( Map.Entry<String, List<ProxyConnector>> entry : proxyConnectorMap.entrySet() )
562 for ( ProxyConnector proxyConnector : entry.getValue() )
564 if ( StringUtils.equals( remoteRepo, proxyConnector.getTargetRepoId() ) )
566 return proxyConnector.getSourceRepoId();
574 private boolean applyArtifactInfoFilters( ArtifactInfo artifactInfo,
575 List<? extends ArtifactInfoFiler> artifactInfoFilers,
576 Map<String, SearchResultHit> currentResult )
578 if ( artifactInfoFilers == null || artifactInfoFilers.isEmpty() )
583 for ( ArtifactInfoFiler filter : artifactInfoFilers )
585 if ( !filter.addArtifactInResult( artifactInfo, currentResult ) )
// Copies one page of hits from results into a fresh SearchResults.
// The page is described by results.getLimits(): at most getPageSize() hits starting at
// getSelectedPage() * getPageSize(). Total hits and limits are carried over; the returned-hits count is the
// number of hits actually copied.
// NOTE(review): the tail of this method is not visible in this view - presumably it returns `paginated`; confirm.
593 private SearchResults paginate( SearchResults results )
595 SearchResultLimits limits = results.getLimits();
596 SearchResults paginated = new SearchResults();
598 int fetchCount = limits.getPageSize();
599 int offset = ( limits.getSelectedPage() * limits.getPageSize() );
// never try to fetch more than the total number of hits
601 if ( fetchCount > results.getTotalHits() )
603 fetchCount = results.getTotalHits();
607 if ( offset < results.getTotalHits() )
609 // only process if the offset is within the hit count.
610 for ( int i = 0; i < fetchCount; i++ )
612 // Stop fetching if we are past the total # of available hits.
613 if ( offset + i >= results.getHits().size() )
618 SearchResultHit hit = results.getHits().get( ( offset + i ) );
// the hit id is recomputed from the hit's own coordinates, using the same id scheme as SearchUtil.getHitId
621 String id = SearchUtil.getHitId( hit.getGroupId(), hit.getArtifactId(), hit.getClassifier(),
622 hit.getPackaging() );
623 paginated.addHit( id, hit );
631 paginated.setTotalHits( results.getTotalHits() );
632 paginated.setReturnedHitsCount( paginated.getHits().size() );
633 paginated.setLimits( limits );