mirror of
				https://codeberg.org/forgejo/forgejo.git
				synced 2025-10-26 20:11:02 +00:00 
			
		
		
		
	Meilisearch does not currently have a search option to control fuzziness per query: - https://github.com/meilisearch/meilisearch/issues/1192 - https://github.com/orgs/meilisearch/discussions/377 - https://github.com/meilisearch/meilisearch/discussions/1096 so we have to work around this by post-filtering the search results in Gitea until it is addressed. For future work I added an option, in the backend only at the moment, to enable fuzziness for the issue indexer too. I also refactored the code so that the fuzzy option follows the same logic as in the code indexer. --- *Sponsored by Kithara Software GmbH* Conflicts: routers/web/repo/search.go trivial context conflict s/isMatch/isFuzzy/
		
			
				
	
	
		
			148 lines
		
	
	
	
		
			3.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			148 lines
		
	
	
	
		
			3.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| // Copyright 2017 The Gitea Authors. All rights reserved.
 | |
| // SPDX-License-Identifier: MIT
 | |
| 
 | |
| package code
 | |
| 
 | |
| import (
 | |
| 	"bytes"
 | |
| 	"context"
 | |
| 	"html/template"
 | |
| 	"strings"
 | |
| 
 | |
| 	"code.gitea.io/gitea/modules/highlight"
 | |
| 	"code.gitea.io/gitea/modules/indexer/code/internal"
 | |
| 	"code.gitea.io/gitea/modules/timeutil"
 | |
| )
 | |
| 
 | |
| // Result a search result to display
 | |
| type Result struct {
 | |
| 	RepoID      int64
 | |
| 	Filename    string
 | |
| 	CommitID    string
 | |
| 	UpdatedUnix timeutil.TimeStamp
 | |
| 	Language    string
 | |
| 	Color       string
 | |
| 	Lines       []ResultLine
 | |
| }
 | |
| 
 | |
| type ResultLine struct {
 | |
| 	Num              int
 | |
| 	FormattedContent template.HTML
 | |
| }
 | |
| 
 | |
| type SearchResultLanguages = internal.SearchResultLanguages
 | |
| 
 | |
// indices returns the byte offsets [start, end) of the excerpt of content that
// should be displayed for a selection spanning
// [selectionStartIndex, selectionEndIndex).
//
// The excerpt is widened to whole lines: it begins at the start of the line
// preceding the selection (or at the start of content) and stops just before
// the newline that terminates the line following the selection (or at the end
// of content).
//
// Out-of-range offsets are clamped into [0, len(content)] and the returned end
// is never smaller than the returned start, so the result can always be used
// to slice content without panicking, even if the indexer backend reports
// inconsistent positions.
func indices(content string, selectionStartIndex, selectionEndIndex int) (int, int) {
	// Clamp both offsets so the byte accesses below stay in bounds.
	startIndex := min(max(selectionStartIndex, 0), len(content))
	endIndex := min(max(selectionEndIndex, 0), len(content))

	// Walk backwards; the second newline encountered marks the start of the
	// line before the selection.
	numLinesBefore := 0
	for ; startIndex > 0; startIndex-- {
		if content[startIndex-1] == '\n' {
			if numLinesBefore == 1 {
				break
			}
			numLinesBefore++
		}
	}

	// Walk forwards; the second newline encountered terminates the line after
	// the selection and is excluded from the excerpt.
	numLinesAfter := 0
	for ; endIndex < len(content); endIndex++ {
		if content[endIndex] == '\n' {
			if numLinesAfter == 1 {
				break
			}
			numLinesAfter++
		}
	}

	// An inverted selection may leave the end before the start; collapse it to
	// an empty range rather than returning bounds that cannot be sliced.
	endIndex = max(endIndex, startIndex)

	return startIndex, endIndex
}
 | |
| 
 | |
// writeStrings appends each of strs to buf in order. It stops at and returns
// the first error reported by the buffer, or nil once every string has been
// written.
func writeStrings(buf *bytes.Buffer, strs ...string) error {
	for i := range strs {
		if _, err := buf.WriteString(strs[i]); err != nil {
			return err
		}
	}
	return nil
}
 | |
| 
 | |
| func searchResult(result *internal.SearchResult, startIndex, endIndex int) (*Result, error) {
 | |
| 	startLineNum := 1 + strings.Count(result.Content[:startIndex], "\n")
 | |
| 
 | |
| 	var formattedLinesBuffer bytes.Buffer
 | |
| 
 | |
| 	contentLines := strings.SplitAfter(result.Content[startIndex:endIndex], "\n")
 | |
| 	lines := make([]ResultLine, 0, len(contentLines))
 | |
| 	index := startIndex
 | |
| 	for i, line := range contentLines {
 | |
| 		var err error
 | |
| 		if index < result.EndIndex &&
 | |
| 			result.StartIndex < index+len(line) &&
 | |
| 			result.StartIndex < result.EndIndex {
 | |
| 			openActiveIndex := max(result.StartIndex-index, 0)
 | |
| 			closeActiveIndex := min(result.EndIndex-index, len(line))
 | |
| 			err = writeStrings(&formattedLinesBuffer,
 | |
| 				line[:openActiveIndex],
 | |
| 				line[openActiveIndex:closeActiveIndex],
 | |
| 				line[closeActiveIndex:],
 | |
| 			)
 | |
| 		} else {
 | |
| 			err = writeStrings(&formattedLinesBuffer,
 | |
| 				line,
 | |
| 			)
 | |
| 		}
 | |
| 		if err != nil {
 | |
| 			return nil, err
 | |
| 		}
 | |
| 
 | |
| 		lines = append(lines, ResultLine{Num: startLineNum + i})
 | |
| 		index += len(line)
 | |
| 	}
 | |
| 
 | |
| 	// we should highlight the whole code block first, otherwise it doesn't work well with multiple line highlighting
 | |
| 	hl, _ := highlight.Code(result.Filename, "", formattedLinesBuffer.String())
 | |
| 	highlightedLines := strings.Split(string(hl), "\n")
 | |
| 
 | |
| 	// The lines outputted by highlight.Code might not match the original lines, because "highlight" removes the last `\n`
 | |
| 	lines = lines[:min(len(highlightedLines), len(lines))]
 | |
| 	highlightedLines = highlightedLines[:len(lines)]
 | |
| 	for i := 0; i < len(lines); i++ {
 | |
| 		lines[i].FormattedContent = template.HTML(highlightedLines[i])
 | |
| 	}
 | |
| 
 | |
| 	return &Result{
 | |
| 		RepoID:      result.RepoID,
 | |
| 		Filename:    result.Filename,
 | |
| 		CommitID:    result.CommitID,
 | |
| 		UpdatedUnix: result.UpdatedUnix,
 | |
| 		Language:    result.Language,
 | |
| 		Color:       result.Color,
 | |
| 		Lines:       lines,
 | |
| 	}, nil
 | |
| }
 | |
| 
 | |
| // PerformSearch perform a search on a repository
 | |
| // if isFuzzy is true set the Damerau-Levenshtein distance from 0 to 2
 | |
| func PerformSearch(ctx context.Context, repoIDs []int64, language, keyword string, page, pageSize int, isFuzzy bool) (int, []*Result, []*internal.SearchResultLanguages, error) {
 | |
| 	if len(keyword) == 0 {
 | |
| 		return 0, nil, nil, nil
 | |
| 	}
 | |
| 
 | |
| 	total, results, resultLanguages, err := (*globalIndexer.Load()).Search(ctx, repoIDs, language, keyword, page, pageSize, isFuzzy)
 | |
| 	if err != nil {
 | |
| 		return 0, nil, nil, err
 | |
| 	}
 | |
| 
 | |
| 	displayResults := make([]*Result, len(results))
 | |
| 
 | |
| 	for i, result := range results {
 | |
| 		startIndex, endIndex := indices(result.Content, result.StartIndex, result.EndIndex)
 | |
| 		displayResults[i], err = searchResult(result, startIndex, endIndex)
 | |
| 		if err != nil {
 | |
| 			return 0, nil, nil, err
 | |
| 		}
 | |
| 	}
 | |
| 	return int(total), displayResults, resultLanguages, nil
 | |
| }
 |