mirror of
				https://github.com/go-gitea/gitea.git
				synced 2025-10-31 02:46:04 +01:00 
			
		
		
		
	* Support elastic search for code search
	* Finished elastic search implementation and add some tests
	* Enable test on drone and added docs
	* Add new fields to elastic search
	* Fix bug
	* remove unused changes
	* Use indexer alias to keep the gitea indexer version
	* Improve codes
	* Some code improvements
	* The real indexer name changed to xxx.v1

	Co-authored-by: zeripath <art27@cantab.net>
		
			
				
	
	
		
			155 lines
		
	
	
		
			4.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			155 lines
		
	
	
		
			4.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| // Copyright 2019 The Gitea Authors. All rights reserved.
 | |
| // Use of this source code is governed by a MIT-style
 | |
| // license that can be found in the LICENSE file.
 | |
| 
 | |
| package code
 | |
| 
 | |
| import (
 | |
| 	"os"
 | |
| 
 | |
| 	"code.gitea.io/gitea/models"
 | |
| 	"code.gitea.io/gitea/modules/graceful"
 | |
| 	"code.gitea.io/gitea/modules/log"
 | |
| )
 | |
| 
 | |
// repoIndexerOperation is a single unit of work for the code indexer queue:
// either (re)index a repository or remove it from the index.
type repoIndexerOperation struct {
	// repoID identifies the repository the operation applies to.
	repoID int64
	// deleted selects the operation: true removes the repository from the
	// index, false indexes it.
	deleted bool
	// watchers each receive the operation's resulting error (nil on success)
	// once the operation has been processed.
	watchers []chan<- error
}
 | |
| 
 | |
| var repoIndexerOperationQueue chan repoIndexerOperation
 | |
| 
 | |
| func initQueue(queueLength int) {
 | |
| 	repoIndexerOperationQueue = make(chan repoIndexerOperation, queueLength)
 | |
| }
 | |
| 
 | |
| func index(indexer Indexer, repoID int64) error {
 | |
| 	repo, err := models.GetRepositoryByID(repoID)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	sha, err := getDefaultBranchSha(repo)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 	changes, err := getRepoChanges(repo, sha)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	} else if changes == nil {
 | |
| 		return nil
 | |
| 	}
 | |
| 
 | |
| 	if err := indexer.Index(repo, sha, changes); err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	return repo.UpdateIndexerStatus(models.RepoIndexerTypeCode, sha)
 | |
| }
 | |
| 
 | |
| func processRepoIndexerOperationQueue(indexer Indexer) {
 | |
| 	for {
 | |
| 		select {
 | |
| 		case op := <-repoIndexerOperationQueue:
 | |
| 			var err error
 | |
| 			if op.deleted {
 | |
| 				if err = indexer.Delete(op.repoID); err != nil {
 | |
| 					log.Error("indexer.Delete: %v", err)
 | |
| 				}
 | |
| 			} else {
 | |
| 				if err = index(indexer, op.repoID); err != nil {
 | |
| 					log.Error("indexer.Index: %v", err)
 | |
| 				}
 | |
| 			}
 | |
| 			for _, watcher := range op.watchers {
 | |
| 				watcher <- err
 | |
| 			}
 | |
| 		case <-graceful.GetManager().IsShutdown():
 | |
| 			log.Info("PID: %d Repository indexer queue processing stopped", os.Getpid())
 | |
| 			return
 | |
| 		}
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // DeleteRepoFromIndexer remove all of a repository's entries from the indexer
 | |
| func DeleteRepoFromIndexer(repo *models.Repository, watchers ...chan<- error) {
 | |
| 	addOperationToQueue(repoIndexerOperation{repoID: repo.ID, deleted: true, watchers: watchers})
 | |
| }
 | |
| 
 | |
| // UpdateRepoIndexer update a repository's entries in the indexer
 | |
| func UpdateRepoIndexer(repo *models.Repository, watchers ...chan<- error) {
 | |
| 	addOperationToQueue(repoIndexerOperation{repoID: repo.ID, deleted: false, watchers: watchers})
 | |
| }
 | |
| 
 | |
| func addOperationToQueue(op repoIndexerOperation) {
 | |
| 	select {
 | |
| 	case repoIndexerOperationQueue <- op:
 | |
| 		break
 | |
| 	default:
 | |
| 		go func() {
 | |
| 			repoIndexerOperationQueue <- op
 | |
| 		}()
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // populateRepoIndexer populate the repo indexer with pre-existing data. This
 | |
| // should only be run when the indexer is created for the first time.
 | |
| func populateRepoIndexer() {
 | |
| 	log.Info("Populating the repo indexer with existing repositories")
 | |
| 
 | |
| 	isShutdown := graceful.GetManager().IsShutdown()
 | |
| 
 | |
| 	exist, err := models.IsTableNotEmpty("repository")
 | |
| 	if err != nil {
 | |
| 		log.Fatal("System error: %v", err)
 | |
| 	} else if !exist {
 | |
| 		return
 | |
| 	}
 | |
| 
 | |
| 	// if there is any existing repo indexer metadata in the DB, delete it
 | |
| 	// since we are starting afresh. Also, xorm requires deletes to have a
 | |
| 	// condition, and we want to delete everything, thus 1=1.
 | |
| 	if err := models.DeleteAllRecords("repo_indexer_status"); err != nil {
 | |
| 		log.Fatal("System error: %v", err)
 | |
| 	}
 | |
| 
 | |
| 	var maxRepoID int64
 | |
| 	if maxRepoID, err = models.GetMaxID("repository"); err != nil {
 | |
| 		log.Fatal("System error: %v", err)
 | |
| 	}
 | |
| 
 | |
| 	// start with the maximum existing repo ID and work backwards, so that we
 | |
| 	// don't include repos that are created after gitea starts; such repos will
 | |
| 	// already be added to the indexer, and we don't need to add them again.
 | |
| 	for maxRepoID > 0 {
 | |
| 		select {
 | |
| 		case <-isShutdown:
 | |
| 			log.Info("Repository Indexer population shutdown before completion")
 | |
| 			return
 | |
| 		default:
 | |
| 		}
 | |
| 		ids, err := models.GetUnindexedRepos(models.RepoIndexerTypeCode, maxRepoID, 0, 50)
 | |
| 		if err != nil {
 | |
| 			log.Error("populateRepoIndexer: %v", err)
 | |
| 			return
 | |
| 		} else if len(ids) == 0 {
 | |
| 			break
 | |
| 		}
 | |
| 		for _, id := range ids {
 | |
| 			select {
 | |
| 			case <-isShutdown:
 | |
| 				log.Info("Repository Indexer population shutdown before completion")
 | |
| 				return
 | |
| 			default:
 | |
| 			}
 | |
| 			repoIndexerOperationQueue <- repoIndexerOperation{
 | |
| 				repoID:  id,
 | |
| 				deleted: false,
 | |
| 			}
 | |
| 			maxRepoID = id - 1
 | |
| 		}
 | |
| 	}
 | |
| 	log.Info("Done (re)populating the repo indexer with existing repositories")
 | |
| }
 |