mirror of
				https://codeberg.org/forgejo/forgejo.git
				synced 2025-10-22 01:52:24 +00:00 
			
		
		
		
	Exclude generated files from language statistics (#11653)
* Update go-enry to v2.5.2
This commit is contained in:
		
					parent
					
						
							
								e8955173a9
							
						
					
				
			
			
				commit
				
					
						bd2335671f
					
				
			
		
					 28 changed files with 1402 additions and 1260 deletions
				
			
		
							
								
								
									
										22
									
								
								vendor/github.com/go-enry/go-oniguruma/chelper.c
									
										
									
										generated
									
									
										vendored
									
									
								
							
							
						
						
									
										22
									
								
								vendor/github.com/go-enry/go-oniguruma/chelper.c
									
										
									
										generated
									
									
										vendored
									
									
								
							|  | @ -7,7 +7,7 @@ | |||
| #include "chelper.h" | ||||
| 
 | ||||
| int NewOnigRegex( char *pattern, int pattern_length, int option, | ||||
|                   OnigRegex *regex, OnigRegion **region, OnigEncoding *encoding, OnigErrorInfo **error_info, char **error_buffer) { | ||||
|                   OnigRegex *regex, OnigEncoding *encoding, OnigErrorInfo **error_info, char **error_buffer) { | ||||
|     int ret = ONIG_NORMAL; | ||||
|     int error_msg_len = 0; | ||||
| 
 | ||||
|  | @ -23,8 +23,6 @@ int NewOnigRegex( char *pattern, int pattern_length, int option, | |||
| 
 | ||||
|     memset(*error_buffer, 0, ONIG_MAX_ERROR_MESSAGE_LEN * sizeof(char)); | ||||
| 
 | ||||
|     *region = onig_region_new(); | ||||
| 
 | ||||
|     ret = onig_new(regex, pattern_start, pattern_end, (OnigOptionType)(option), *encoding, OnigDefaultSyntax, *error_info); | ||||
| 
 | ||||
|     if (ret != ONIG_NORMAL) { | ||||
|  | @ -38,9 +36,10 @@ int NewOnigRegex( char *pattern, int pattern_length, int option, | |||
| } | ||||
| 
 | ||||
| int SearchOnigRegex( void *str, int str_length, int offset, int option, | ||||
|                   OnigRegex regex, OnigRegion *region, OnigErrorInfo *error_info, char *error_buffer, int *captures, int *numCaptures) { | ||||
|                   OnigRegex regex, OnigErrorInfo *error_info, char *error_buffer, int *captures, int *numCaptures) { | ||||
|     int ret = ONIG_MISMATCH; | ||||
|     int error_msg_len = 0; | ||||
|     OnigRegion *region; | ||||
| #ifdef BENCHMARK_CHELP | ||||
|     struct timeval tim1, tim2; | ||||
|     long t; | ||||
|  | @ -55,6 +54,8 @@ int SearchOnigRegex( void *str, int str_length, int offset, int option, | |||
|     gettimeofday(&tim1, NULL); | ||||
| #endif | ||||
| 
 | ||||
|     region = onig_region_new(); | ||||
| 
 | ||||
|     ret = onig_search(regex, str_start, str_end, search_start, search_end, region, option); | ||||
|     if (ret < 0 && error_buffer != NULL) { | ||||
|         error_msg_len = onig_error_code_to_str((unsigned char*)(error_buffer), ret, error_info); | ||||
|  | @ -74,6 +75,8 @@ int SearchOnigRegex( void *str, int str_length, int offset, int option, | |||
|         *numCaptures = count; | ||||
|     } | ||||
| 
 | ||||
|     onig_region_free(region, 1); | ||||
| 
 | ||||
| #ifdef BENCHMARK_CHELP | ||||
|     gettimeofday(&tim2, NULL); | ||||
|     t = (tim2.tv_sec - tim1.tv_sec) * 1000000 + tim2.tv_usec - tim1.tv_usec; | ||||
|  | @ -83,9 +86,10 @@ int SearchOnigRegex( void *str, int str_length, int offset, int option, | |||
| } | ||||
| 
 | ||||
| int MatchOnigRegex(void *str, int str_length, int offset, int option, | ||||
|                   OnigRegex regex, OnigRegion *region) { | ||||
|                   OnigRegex regex) { | ||||
|     int ret = ONIG_MISMATCH; | ||||
|     int error_msg_len = 0; | ||||
|     OnigRegion *region; | ||||
| #ifdef BENCHMARK_CHELP | ||||
|     struct timeval tim1, tim2; | ||||
|     long t; | ||||
|  | @ -98,7 +102,9 @@ int MatchOnigRegex(void *str, int str_length, int offset, int option, | |||
| #ifdef BENCHMARK_CHELP | ||||
|     gettimeofday(&tim1, NULL); | ||||
| #endif | ||||
|     region = onig_region_new(); | ||||
|     ret = onig_match(regex, str_start, str_end, search_start, region, option); | ||||
|     onig_region_free(region, 1); | ||||
| #ifdef BENCHMARK_CHELP | ||||
|     gettimeofday(&tim2, NULL); | ||||
|     t = (tim2.tv_sec - tim1.tv_sec) * 1000000 + tim2.tv_usec - tim1.tv_usec; | ||||
|  | @ -108,8 +114,9 @@ int MatchOnigRegex(void *str, int str_length, int offset, int option, | |||
| } | ||||
| 
 | ||||
| int LookupOnigCaptureByName(char *name, int name_length, | ||||
|                   OnigRegex regex, OnigRegion *region) { | ||||
|                   OnigRegex regex) { | ||||
|     int ret = ONIGERR_UNDEFINED_NAME_REFERENCE; | ||||
|     OnigRegion *region; | ||||
| #ifdef BENCHMARK_CHELP | ||||
|     struct timeval tim1, tim2; | ||||
|     long t; | ||||
|  | @ -119,7 +126,9 @@ int LookupOnigCaptureByName(char *name, int name_length, | |||
| #ifdef BENCHMARK_CHELP | ||||
|     gettimeofday(&tim1, NULL); | ||||
| #endif | ||||
|     region = onig_region_new(); | ||||
|     ret = onig_name_to_backref_number(regex, name_start, name_end, region); | ||||
|     onig_region_free(region, 1); | ||||
| #ifdef BENCHMARK_CHELP | ||||
|     gettimeofday(&tim2, NULL); | ||||
|     t = (tim2.tv_sec - tim1.tv_sec) * 1000000 + tim2.tv_usec - tim1.tv_usec; | ||||
|  | @ -181,4 +190,3 @@ int GetCaptureNames(OnigRegex reg, void *buffer, int bufferSize, int* groupNumbe | |||
|     onig_foreach_name(reg, name_callback, (void* )&groupInfo); | ||||
|     return groupInfo.bufferOffset; | ||||
| } | ||||
| 
 | ||||
|  |  | |||
							
								
								
									
										8
									
								
								vendor/github.com/go-enry/go-oniguruma/chelper.h
									
										
									
										generated
									
									
										vendored
									
									
								
							
							
						
						
									
										8
									
								
								vendor/github.com/go-enry/go-oniguruma/chelper.h
									
										
									
										generated
									
									
										vendored
									
									
								
							|  | @ -1,14 +1,14 @@ | |||
| #include <oniguruma.h> | ||||
| 
 | ||||
| extern int NewOnigRegex( char *pattern, int pattern_length, int option, | ||||
|                                   OnigRegex *regex, OnigRegion **region, OnigEncoding *encoding, OnigErrorInfo **error_info, char **error_buffer); | ||||
|                                   OnigRegex *regex, OnigEncoding *encoding, OnigErrorInfo **error_info, char **error_buffer); | ||||
| 
 | ||||
| extern int SearchOnigRegex( void *str, int str_length, int offset, int option, | ||||
|                                   OnigRegex regex, OnigRegion *region, OnigErrorInfo *error_info, char *error_buffer, int *captures, int *numCaptures); | ||||
|                                   OnigRegex regex, OnigErrorInfo *error_info, char *error_buffer, int *captures, int *numCaptures); | ||||
| 
 | ||||
| extern int MatchOnigRegex( void *str, int str_length, int offset, int option, | ||||
|                   OnigRegex regex, OnigRegion *region); | ||||
|                   OnigRegex regex); | ||||
| 
 | ||||
| extern int LookupOnigCaptureByName(char *name, int name_length, OnigRegex regex, OnigRegion *region); | ||||
| extern int LookupOnigCaptureByName(char *name, int name_length, OnigRegex regex); | ||||
| 
 | ||||
| extern int GetCaptureNames(OnigRegex regex, void *buffer, int bufferSize, int* groupNumbers); | ||||
|  |  | |||
							
								
								
									
										401
									
								
								vendor/github.com/go-enry/go-oniguruma/regex.go
									
										
									
										generated
									
									
										vendored
									
									
								
							
							
						
						
									
										401
									
								
								vendor/github.com/go-enry/go-oniguruma/regex.go
									
										
									
										generated
									
									
										vendored
									
									
								
							|  | @ -14,7 +14,6 @@ import ( | |||
| 	"errors" | ||||
| 	"fmt" | ||||
| 	"io" | ||||
| 	"log" | ||||
| 	"runtime" | ||||
| 	"strconv" | ||||
| 	"sync" | ||||
|  | @ -22,62 +21,52 @@ import ( | |||
| 	"unsafe" | ||||
| ) | ||||
| 
 | ||||
| type strRange []int | ||||
| 
 | ||||
| const numMatchStartSize = 4 | ||||
| const numReadBufferStartSize = 256 | ||||
| 
 | ||||
| var mutex sync.Mutex | ||||
| 
 | ||||
| type MatchData struct { | ||||
| 	count   int | ||||
| 	indexes [][]int32 | ||||
| } | ||||
| 
 | ||||
| type NamedGroupInfo map[string]int | ||||
| 
 | ||||
| type Regexp struct { | ||||
| 	pattern        string | ||||
| 	regex          C.OnigRegex | ||||
| 	region         *C.OnigRegion | ||||
| 	encoding       C.OnigEncoding | ||||
| 	errorInfo      *C.OnigErrorInfo | ||||
| 	errorBuf       *C.char | ||||
| 	matchData      *MatchData | ||||
| 	pattern   string | ||||
| 	regex     C.OnigRegex | ||||
| 	encoding  C.OnigEncoding | ||||
| 	errorInfo *C.OnigErrorInfo | ||||
| 	errorBuf  *C.char | ||||
| 
 | ||||
| 	numCaptures    int32 | ||||
| 	namedGroupInfo NamedGroupInfo | ||||
| } | ||||
| 
 | ||||
| // NewRegexp creates and initializes a new Regexp with the given pattern and option. | ||||
| func NewRegexp(pattern string, option int) (re *Regexp, err error) { | ||||
| func NewRegexp(pattern string, option int) (*Regexp, error) { | ||||
| 	return initRegexp(&Regexp{pattern: pattern, encoding: C.ONIG_ENCODING_UTF8}, option) | ||||
| } | ||||
| 
 | ||||
| // NewRegexpASCII is equivalent to NewRegexp, but with the encoding restricted to ASCII. | ||||
| func NewRegexpASCII(pattern string, option int) (re *Regexp, err error) { | ||||
| func NewRegexpASCII(pattern string, option int) (*Regexp, error) { | ||||
| 	return initRegexp(&Regexp{pattern: pattern, encoding: C.ONIG_ENCODING_ASCII}, option) | ||||
| } | ||||
| 
 | ||||
| func initRegexp(re *Regexp, option int) (*Regexp, error) { | ||||
| 	var err error | ||||
| 	patternCharPtr := C.CString(re.pattern) | ||||
| 	defer C.free(unsafe.Pointer(patternCharPtr)) | ||||
| 
 | ||||
| 	mutex.Lock() | ||||
| 	defer mutex.Unlock() | ||||
| 	errorCode := C.NewOnigRegex(patternCharPtr, C.int(len(re.pattern)), C.int(option), &re.regex, &re.region, &re.encoding, &re.errorInfo, &re.errorBuf) | ||||
| 
 | ||||
| 	errorCode := C.NewOnigRegex(patternCharPtr, C.int(len(re.pattern)), C.int(option), &re.regex, &re.encoding, &re.errorInfo, &re.errorBuf) | ||||
| 	if errorCode != C.ONIG_NORMAL { | ||||
| 		err = errors.New(C.GoString(re.errorBuf)) | ||||
| 	} else { | ||||
| 		err = nil | ||||
| 		numCapturesInPattern := int(C.onig_number_of_captures(re.regex)) + 1 | ||||
| 		re.matchData = &MatchData{} | ||||
| 		re.matchData.indexes = make([][]int32, numMatchStartSize) | ||||
| 		for i := 0; i < numMatchStartSize; i++ { | ||||
| 			re.matchData.indexes[i] = make([]int32, numCapturesInPattern*2) | ||||
| 		} | ||||
| 		re.namedGroupInfo = re.getNamedGroupInfo() | ||||
| 		runtime.SetFinalizer(re, (*Regexp).Free) | ||||
| 		return re, errors.New(C.GoString(re.errorBuf)) | ||||
| 	} | ||||
| 	return re, err | ||||
| 
 | ||||
| 	re.numCaptures = int32(C.onig_number_of_captures(re.regex)) + 1 | ||||
| 	re.namedGroupInfo = re.getNamedGroupInfo() | ||||
| 
 | ||||
| 	runtime.SetFinalizer(re, (*Regexp).Free) | ||||
| 
 | ||||
| 	return re, nil | ||||
| } | ||||
| 
 | ||||
| func Compile(str string) (*Regexp, error) { | ||||
|  | @ -89,6 +78,7 @@ func MustCompile(str string) *Regexp { | |||
| 	if error != nil { | ||||
| 		panic("regexp: compiling " + str + ": " + error.Error()) | ||||
| 	} | ||||
| 
 | ||||
| 	return regexp | ||||
| } | ||||
| 
 | ||||
|  | @ -101,6 +91,7 @@ func MustCompileWithOption(str string, option int) *Regexp { | |||
| 	if error != nil { | ||||
| 		panic("regexp: compiling " + str + ": " + error.Error()) | ||||
| 	} | ||||
| 
 | ||||
| 	return regexp | ||||
| } | ||||
| 
 | ||||
|  | @ -110,6 +101,7 @@ func MustCompileASCII(str string) *Regexp { | |||
| 	if error != nil { | ||||
| 		panic("regexp: compiling " + str + ": " + error.Error()) | ||||
| 	} | ||||
| 
 | ||||
| 	return regexp | ||||
| } | ||||
| 
 | ||||
|  | @ -119,10 +111,6 @@ func (re *Regexp) Free() { | |||
| 		C.onig_free(re.regex) | ||||
| 		re.regex = nil | ||||
| 	} | ||||
| 	if re.region != nil { | ||||
| 		C.onig_region_free(re.region, 1) | ||||
| 		re.region = nil | ||||
| 	} | ||||
| 	mutex.Unlock() | ||||
| 	if re.errorInfo != nil { | ||||
| 		C.free(unsafe.Pointer(re.errorInfo)) | ||||
|  | @ -134,149 +122,149 @@ func (re *Regexp) Free() { | |||
| 	} | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) getNamedGroupInfo() (namedGroupInfo NamedGroupInfo) { | ||||
| func (re *Regexp) getNamedGroupInfo() NamedGroupInfo { | ||||
| 	numNamedGroups := int(C.onig_number_of_names(re.regex)) | ||||
| 	//when any named capture exisits, there is no numbered capture even if there are unnamed captures | ||||
| 	if numNamedGroups > 0 { | ||||
| 		namedGroupInfo = make(map[string]int) | ||||
| 		//try to get the names | ||||
| 		bufferSize := len(re.pattern) * 2 | ||||
| 		nameBuffer := make([]byte, bufferSize) | ||||
| 		groupNumbers := make([]int32, numNamedGroups) | ||||
| 		bufferPtr := unsafe.Pointer(&nameBuffer[0]) | ||||
| 		numbersPtr := unsafe.Pointer(&groupNumbers[0]) | ||||
| 		length := int(C.GetCaptureNames(re.regex, bufferPtr, (C.int)(bufferSize), (*C.int)(numbersPtr))) | ||||
| 		if length > 0 { | ||||
| 			namesAsBytes := bytes.Split(nameBuffer[:length], ([]byte)(";")) | ||||
| 			if len(namesAsBytes) != numNamedGroups { | ||||
| 				log.Fatalf("the number of named groups (%d) does not match the number names found (%d)\n", numNamedGroups, len(namesAsBytes)) | ||||
| 			} | ||||
| 			for i, nameAsBytes := range namesAsBytes { | ||||
| 				name := string(nameAsBytes) | ||||
| 				namedGroupInfo[name] = int(groupNumbers[i]) | ||||
| 			} | ||||
| 		} else { | ||||
| 			log.Fatalf("could not get the capture group names from %q", re.String()) | ||||
| 		} | ||||
| 	// when any named capture exists, there is no numbered capture even if | ||||
| 	// there are unnamed captures. | ||||
| 	if numNamedGroups == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 	return | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) groupNameToId(name string) (id int) { | ||||
| 	if re.namedGroupInfo == nil { | ||||
| 		id = ONIGERR_UNDEFINED_NAME_REFERENCE | ||||
| 	} else { | ||||
| 		id = re.namedGroupInfo[name] | ||||
| 	namedGroupInfo := make(map[string]int) | ||||
| 
 | ||||
| 	//try to get the names | ||||
| 	bufferSize := len(re.pattern) * 2 | ||||
| 	nameBuffer := make([]byte, bufferSize) | ||||
| 	groupNumbers := make([]int32, numNamedGroups) | ||||
| 	bufferPtr := unsafe.Pointer(&nameBuffer[0]) | ||||
| 	numbersPtr := unsafe.Pointer(&groupNumbers[0]) | ||||
| 
 | ||||
| 	length := int(C.GetCaptureNames(re.regex, bufferPtr, (C.int)(bufferSize), (*C.int)(numbersPtr))) | ||||
| 	if length == 0 { | ||||
| 		panic(fmt.Errorf("could not get the capture group names from %q", re.String())) | ||||
| 	} | ||||
| 	return | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) processMatch(numCaptures int) (match []int32) { | ||||
| 	if numCaptures <= 0 { | ||||
| 		panic("cannot have 0 captures when processing a match") | ||||
| 	namesAsBytes := bytes.Split(nameBuffer[:length], ([]byte)(";")) | ||||
| 	if len(namesAsBytes) != numNamedGroups { | ||||
| 		panic(fmt.Errorf( | ||||
| 			"the number of named groups (%d) does not match the number names found (%d)", | ||||
| 			numNamedGroups, len(namesAsBytes), | ||||
| 		)) | ||||
| 	} | ||||
| 	matchData := re.matchData | ||||
| 	return matchData.indexes[matchData.count][:numCaptures*2] | ||||
| 
 | ||||
| 	for i, nameAsBytes := range namesAsBytes { | ||||
| 		name := string(nameAsBytes) | ||||
| 		namedGroupInfo[name] = int(groupNumbers[i]) | ||||
| 	} | ||||
| 
 | ||||
| 	return namedGroupInfo | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) ClearMatchData() { | ||||
| 	matchData := re.matchData | ||||
| 	matchData.count = 0 | ||||
| } | ||||
| func (re *Regexp) find(b []byte, n int, offset int) []int { | ||||
| 	match := make([]int, re.numCaptures*2) | ||||
| 
 | ||||
| func (re *Regexp) find(b []byte, n int, offset int) (match []int) { | ||||
| 	if n == 0 { | ||||
| 		b = []byte{0} | ||||
| 	} | ||||
| 	ptr := unsafe.Pointer(&b[0]) | ||||
| 	matchData := re.matchData | ||||
| 	capturesPtr := unsafe.Pointer(&(matchData.indexes[matchData.count][0])) | ||||
| 	numCaptures := int32(0) | ||||
| 
 | ||||
| 	bytesPtr := unsafe.Pointer(&b[0]) | ||||
| 
 | ||||
| 	// captures contains two pairs of ints, start and end, so we need list | ||||
| 	// twice the size of the capture groups. | ||||
| 	captures := make([]C.int, re.numCaptures*2) | ||||
| 	capturesPtr := unsafe.Pointer(&captures[0]) | ||||
| 
 | ||||
| 	var numCaptures int32 | ||||
| 	numCapturesPtr := unsafe.Pointer(&numCaptures) | ||||
| 	pos := int(C.SearchOnigRegex((ptr), C.int(n), C.int(offset), C.int(ONIG_OPTION_DEFAULT), re.regex, re.region, re.errorInfo, (*C.char)(nil), (*C.int)(capturesPtr), (*C.int)(numCapturesPtr))) | ||||
| 	if pos >= 0 { | ||||
| 		if numCaptures <= 0 { | ||||
| 			panic("cannot have 0 captures when processing a match") | ||||
| 		} | ||||
| 		match2 := matchData.indexes[matchData.count][:numCaptures*2] | ||||
| 		match = make([]int, len(match2)) | ||||
| 		for i := range match2 { | ||||
| 			match[i] = int(match2[i]) | ||||
| 		} | ||||
| 		numCapturesInPattern := int32(C.onig_number_of_captures(re.regex)) + 1 | ||||
| 		if numCapturesInPattern != numCaptures { | ||||
| 			log.Fatalf("expected %d captures but got %d\n", numCapturesInPattern, numCaptures) | ||||
| 		} | ||||
| 
 | ||||
| 	pos := int(C.SearchOnigRegex( | ||||
| 		bytesPtr, C.int(n), C.int(offset), C.int(ONIG_OPTION_DEFAULT), | ||||
| 		re.regex, re.errorInfo, (*C.char)(nil), (*C.int)(capturesPtr), (*C.int)(numCapturesPtr), | ||||
| 	)) | ||||
| 
 | ||||
| 	if pos < 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 	return | ||||
| 
 | ||||
| 	if numCaptures <= 0 { | ||||
| 		panic("cannot have 0 captures when processing a match") | ||||
| 	} | ||||
| 
 | ||||
| 	if re.numCaptures != numCaptures { | ||||
| 		panic(fmt.Errorf("expected %d captures but got %d", re.numCaptures, numCaptures)) | ||||
| 	} | ||||
| 
 | ||||
| 	for i := range captures { | ||||
| 		match[i] = int(captures[i]) | ||||
| 	} | ||||
| 
 | ||||
| 	return match | ||||
| } | ||||
| 
 | ||||
| func getCapture(b []byte, beg int, end int) []byte { | ||||
| 	if beg < 0 || end < 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	return b[beg:end] | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) match(b []byte, n int, offset int) bool { | ||||
| 	re.ClearMatchData() | ||||
| 	if n == 0 { | ||||
| 		b = []byte{0} | ||||
| 	} | ||||
| 	ptr := unsafe.Pointer(&b[0]) | ||||
| 	pos := int(C.SearchOnigRegex((ptr), C.int(n), C.int(offset), C.int(ONIG_OPTION_DEFAULT), re.regex, re.region, re.errorInfo, (*C.char)(nil), (*C.int)(nil), (*C.int)(nil))) | ||||
| 
 | ||||
| 	bytesPtr := unsafe.Pointer(&b[0]) | ||||
| 	pos := int(C.SearchOnigRegex( | ||||
| 		bytesPtr, C.int(n), C.int(offset), C.int(ONIG_OPTION_DEFAULT), | ||||
| 		re.regex, re.errorInfo, nil, nil, nil, | ||||
| 	)) | ||||
| 
 | ||||
| 	return pos >= 0 | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) findAll(b []byte, n int) (matches [][]int) { | ||||
| 	re.ClearMatchData() | ||||
| 
 | ||||
| func (re *Regexp) findAll(b []byte, n int) [][]int { | ||||
| 	if n < 0 { | ||||
| 		n = len(b) | ||||
| 	} | ||||
| 	matchData := re.matchData | ||||
| 	offset := 0 | ||||
| 
 | ||||
| 	capture := make([][]int, 0, numMatchStartSize) | ||||
| 	var offset int | ||||
| 	for offset <= n { | ||||
| 		if matchData.count >= len(matchData.indexes) { | ||||
| 			length := len(matchData.indexes[0]) | ||||
| 			matchData.indexes = append(matchData.indexes, make([]int32, length)) | ||||
| 		} | ||||
| 		if match := re.find(b, n, offset); len(match) > 0 { | ||||
| 			matchData.count += 1 | ||||
| 			//move offset to the ending index of the current match and prepare to find the next non-overlapping match | ||||
| 			offset = match[1] | ||||
| 			//if match[0] == match[1], it means the current match does not advance the search. we need to exit the loop to avoid getting stuck here. | ||||
| 			if match[0] == match[1] { | ||||
| 				if offset < n && offset >= 0 { | ||||
| 					//there are more bytes, so move offset by a word | ||||
| 					_, width := utf8.DecodeRune(b[offset:]) | ||||
| 					offset += width | ||||
| 				} else { | ||||
| 					//search is over, exit loop | ||||
| 					break | ||||
| 				} | ||||
| 			} | ||||
| 		} else { | ||||
| 		match := re.find(b, n, offset) | ||||
| 		if match == nil { | ||||
| 			break | ||||
| 		} | ||||
| 	} | ||||
| 	matches2 := matchData.indexes[:matchData.count] | ||||
| 	matches = make([][]int, len(matches2)) | ||||
| 	for i, v := range matches2 { | ||||
| 		matches[i] = make([]int, len(v)) | ||||
| 		for j, v2 := range v { | ||||
| 			matches[i][j] = int(v2) | ||||
| 
 | ||||
| 		capture = append(capture, match) | ||||
| 
 | ||||
| 		// move offset to the ending index of the current match and prepare to | ||||
| 		// find the next non-overlapping match. | ||||
| 		offset = match[1] | ||||
| 
 | ||||
| 		// if match[0] == match[1], it means the current match does not advance | ||||
| 		// the search. we need to exit the loop to avoid getting stuck here. | ||||
| 		if match[0] == match[1] { | ||||
| 			if offset < n && offset >= 0 { | ||||
| 				//there are more bytes, so move offset by a word | ||||
| 				_, width := utf8.DecodeRune(b[offset:]) | ||||
| 				offset += width | ||||
| 			} else { | ||||
| 				//search is over, exit loop | ||||
| 				break | ||||
| 			} | ||||
| 		} | ||||
| 	} | ||||
| 	return | ||||
| 
 | ||||
| 	return capture | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindIndex(b []byte) []int { | ||||
| 	re.ClearMatchData() | ||||
| 	match := re.find(b, len(b), 0) | ||||
| 	if len(match) == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	return match[:2] | ||||
| } | ||||
| 
 | ||||
|  | @ -285,21 +273,21 @@ func (re *Regexp) Find(b []byte) []byte { | |||
| 	if loc == nil { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	return getCapture(b, loc[0], loc[1]) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindString(s string) string { | ||||
| 	b := []byte(s) | ||||
| 	mb := re.Find(b) | ||||
| 	mb := re.Find([]byte(s)) | ||||
| 	if mb == nil { | ||||
| 		return "" | ||||
| 	} | ||||
| 
 | ||||
| 	return string(mb) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindStringIndex(s string) []int { | ||||
| 	b := []byte(s) | ||||
| 	return re.FindIndex(b) | ||||
| 	return re.FindIndex([]byte(s)) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindAllIndex(b []byte, n int) [][]int { | ||||
|  | @ -307,6 +295,7 @@ func (re *Regexp) FindAllIndex(b []byte, n int) [][]int { | |||
| 	if len(matches) == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	return matches | ||||
| } | ||||
| 
 | ||||
|  | @ -315,10 +304,12 @@ func (re *Regexp) FindAll(b []byte, n int) [][]byte { | |||
| 	if matches == nil { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	matchBytes := make([][]byte, 0, len(matches)) | ||||
| 	for _, match := range matches { | ||||
| 		matchBytes = append(matchBytes, getCapture(b, match[0], match[1])) | ||||
| 	} | ||||
| 
 | ||||
| 	return matchBytes | ||||
| } | ||||
| 
 | ||||
|  | @ -328,6 +319,7 @@ func (re *Regexp) FindAllString(s string, n int) []string { | |||
| 	if matches == nil { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	matchStrings := make([]string, 0, len(matches)) | ||||
| 	for _, match := range matches { | ||||
| 		m := getCapture(b, match[0], match[1]) | ||||
|  | @ -337,51 +329,50 @@ func (re *Regexp) FindAllString(s string, n int) []string { | |||
| 			matchStrings = append(matchStrings, string(m)) | ||||
| 		} | ||||
| 	} | ||||
| 
 | ||||
| 	return matchStrings | ||||
| 
 | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindAllStringIndex(s string, n int) [][]int { | ||||
| 	b := []byte(s) | ||||
| 	return re.FindAllIndex(b, n) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) findSubmatchIndex(b []byte) (match []int) { | ||||
| 	re.ClearMatchData() | ||||
| 	match = re.find(b, len(b), 0) | ||||
| 	return | ||||
| 	return re.FindAllIndex([]byte(s), n) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindSubmatchIndex(b []byte) []int { | ||||
| 	match := re.findSubmatchIndex(b) | ||||
| 	match := re.find(b, len(b), 0) | ||||
| 	if len(match) == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	return match | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindSubmatch(b []byte) [][]byte { | ||||
| 	match := re.findSubmatchIndex(b) | ||||
| 	match := re.FindSubmatchIndex(b) | ||||
| 	if match == nil { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	length := len(match) / 2 | ||||
| 	if length == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	results := make([][]byte, 0, length) | ||||
| 	for i := 0; i < length; i++ { | ||||
| 		results = append(results, getCapture(b, match[2*i], match[2*i+1])) | ||||
| 	} | ||||
| 
 | ||||
| 	return results | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindStringSubmatch(s string) []string { | ||||
| 	b := []byte(s) | ||||
| 	match := re.findSubmatchIndex(b) | ||||
| 	match := re.FindSubmatchIndex(b) | ||||
| 	if match == nil { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	length := len(match) / 2 | ||||
| 	if length == 0 { | ||||
| 		return nil | ||||
|  | @ -396,12 +387,12 @@ func (re *Regexp) FindStringSubmatch(s string) []string { | |||
| 			results = append(results, string(cap)) | ||||
| 		} | ||||
| 	} | ||||
| 
 | ||||
| 	return results | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindStringSubmatchIndex(s string) []int { | ||||
| 	b := []byte(s) | ||||
| 	return re.FindSubmatchIndex(b) | ||||
| 	return re.FindSubmatchIndex([]byte(s)) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindAllSubmatchIndex(b []byte, n int) [][]int { | ||||
|  | @ -409,6 +400,7 @@ func (re *Regexp) FindAllSubmatchIndex(b []byte, n int) [][]int { | |||
| 	if len(matches) == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	return matches | ||||
| } | ||||
| 
 | ||||
|  | @ -417,6 +409,7 @@ func (re *Regexp) FindAllSubmatch(b []byte, n int) [][][]byte { | |||
| 	if len(matches) == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	allCapturedBytes := make([][][]byte, 0, len(matches)) | ||||
| 	for _, match := range matches { | ||||
| 		length := len(match) / 2 | ||||
|  | @ -424,6 +417,7 @@ func (re *Regexp) FindAllSubmatch(b []byte, n int) [][][]byte { | |||
| 		for i := 0; i < length; i++ { | ||||
| 			capturedBytes = append(capturedBytes, getCapture(b, match[2*i], match[2*i+1])) | ||||
| 		} | ||||
| 
 | ||||
| 		allCapturedBytes = append(allCapturedBytes, capturedBytes) | ||||
| 	} | ||||
| 
 | ||||
|  | @ -432,10 +426,12 @@ func (re *Regexp) FindAllSubmatch(b []byte, n int) [][][]byte { | |||
| 
 | ||||
| func (re *Regexp) FindAllStringSubmatch(s string, n int) [][]string { | ||||
| 	b := []byte(s) | ||||
| 
 | ||||
| 	matches := re.findAll(b, n) | ||||
| 	if len(matches) == 0 { | ||||
| 		return nil | ||||
| 	} | ||||
| 
 | ||||
| 	allCapturedStrings := make([][]string, 0, len(matches)) | ||||
| 	for _, match := range matches { | ||||
| 		length := len(match) / 2 | ||||
|  | @ -448,14 +444,15 @@ func (re *Regexp) FindAllStringSubmatch(s string, n int) [][]string { | |||
| 				capturedStrings = append(capturedStrings, string(cap)) | ||||
| 			} | ||||
| 		} | ||||
| 
 | ||||
| 		allCapturedStrings = append(allCapturedStrings, capturedStrings) | ||||
| 	} | ||||
| 
 | ||||
| 	return allCapturedStrings | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) FindAllStringSubmatchIndex(s string, n int) [][]int { | ||||
| 	b := []byte(s) | ||||
| 	return re.FindAllSubmatchIndex(b, n) | ||||
| 	return re.FindAllSubmatchIndex([]byte(s), n) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) Match(b []byte) bool { | ||||
|  | @ -463,44 +460,25 @@ func (re *Regexp) Match(b []byte) bool { | |||
| } | ||||
| 
 | ||||
| func (re *Regexp) MatchString(s string) bool { | ||||
| 	b := []byte(s) | ||||
| 	return re.Match(b) | ||||
| 	return re.Match([]byte(s)) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) NumSubexp() int { | ||||
| 	return (int)(C.onig_number_of_captures(re.regex)) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) getNamedCapture(name []byte, capturedBytes [][]byte) []byte { | ||||
| 	nameStr := string(name) | ||||
| 	capNum := re.groupNameToId(nameStr) | ||||
| 	if capNum < 0 || capNum >= len(capturedBytes) { | ||||
| 		panic(fmt.Sprintf("capture group name (%q) has error\n", nameStr)) | ||||
| 	} | ||||
| 	return capturedBytes[capNum] | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) getNumberedCapture(num int, capturedBytes [][]byte) []byte { | ||||
| 	//when named capture groups exist, numbered capture groups returns "" | ||||
| 	if re.namedGroupInfo == nil && num <= (len(capturedBytes)-1) && num >= 0 { | ||||
| 		return capturedBytes[num] | ||||
| 	} | ||||
| 	return ([]byte)("") | ||||
| } | ||||
| 
 | ||||
| func fillCapturedValues(repl []byte, _ []byte, capturedBytes map[string][]byte) []byte { | ||||
| 	replLen := len(repl) | ||||
| 	newRepl := make([]byte, 0, replLen*3) | ||||
| 	inEscapeMode := false | ||||
| 	inGroupNameMode := false | ||||
| 	groupName := make([]byte, 0, replLen) | ||||
| 	for index := 0; index < replLen; index += 1 { | ||||
| 
 | ||||
| 	var inGroupNameMode, inEscapeMode bool | ||||
| 	for index := 0; index < replLen; index++ { | ||||
| 		ch := repl[index] | ||||
| 		if inGroupNameMode && ch == byte('<') { | ||||
| 		} else if inGroupNameMode && ch == byte('>') { | ||||
| 			inGroupNameMode = false | ||||
| 			groupNameStr := string(groupName) | ||||
| 			capBytes := capturedBytes[groupNameStr] | ||||
| 			capBytes := capturedBytes[string(groupName)] | ||||
| 			newRepl = append(newRepl, capBytes...) | ||||
| 			groupName = groupName[:0] //reset the name | ||||
| 		} else if inGroupNameMode { | ||||
|  | @ -512,7 +490,7 @@ func fillCapturedValues(repl []byte, _ []byte, capturedBytes map[string][]byte) | |||
| 		} else if inEscapeMode && ch == byte('k') && (index+1) < replLen && repl[index+1] == byte('<') { | ||||
| 			inGroupNameMode = true | ||||
| 			inEscapeMode = false | ||||
| 			index += 1 //bypass the next char '<' | ||||
| 			index++ //bypass the next char '<' | ||||
| 		} else if inEscapeMode { | ||||
| 			newRepl = append(newRepl, '\\') | ||||
| 			newRepl = append(newRepl, ch) | ||||
|  | @ -523,6 +501,7 @@ func fillCapturedValues(repl []byte, _ []byte, capturedBytes map[string][]byte) | |||
| 			inEscapeMode = !inEscapeMode | ||||
| 		} | ||||
| 	} | ||||
| 
 | ||||
| 	return newRepl | ||||
| } | ||||
| 
 | ||||
|  | @ -532,10 +511,12 @@ func (re *Regexp) replaceAll(src, repl []byte, replFunc func([]byte, []byte, map | |||
| 	if len(matches) == 0 { | ||||
| 		return src | ||||
| 	} | ||||
| 
 | ||||
| 	dest := make([]byte, 0, srcLen) | ||||
| 	for i, match := range matches { | ||||
| 		length := len(match) / 2 | ||||
| 		capturedBytes := make(map[string][]byte) | ||||
| 
 | ||||
| 		if re.namedGroupInfo == nil { | ||||
| 			for j := 0; j < length; j++ { | ||||
| 				capturedBytes[strconv.Itoa(j)] = getCapture(src, match[2*j], match[2*j+1]) | ||||
|  | @ -545,6 +526,7 @@ func (re *Regexp) replaceAll(src, repl []byte, replFunc func([]byte, []byte, map | |||
| 				capturedBytes[name] = getCapture(src, match[2*j], match[2*j+1]) | ||||
| 			} | ||||
| 		} | ||||
| 
 | ||||
| 		matchBytes := getCapture(src, match[0], match[1]) | ||||
| 		newRepl := replFunc(repl, matchBytes, capturedBytes) | ||||
| 		prevEnd := 0 | ||||
|  | @ -552,15 +534,19 @@ func (re *Regexp) replaceAll(src, repl []byte, replFunc func([]byte, []byte, map | |||
| 			prevMatch := matches[i-1][:2] | ||||
| 			prevEnd = prevMatch[1] | ||||
| 		} | ||||
| 
 | ||||
| 		if match[0] > prevEnd && prevEnd >= 0 && match[0] <= srcLen { | ||||
| 			dest = append(dest, src[prevEnd:match[0]]...) | ||||
| 		} | ||||
| 
 | ||||
| 		dest = append(dest, newRepl...) | ||||
| 	} | ||||
| 
 | ||||
| 	lastEnd := matches[len(matches)-1][1] | ||||
| 	if lastEnd < srcLen && lastEnd >= 0 { | ||||
| 		dest = append(dest, src[lastEnd:]...) | ||||
| 	} | ||||
| 
 | ||||
| 	return dest | ||||
| } | ||||
| 
 | ||||
|  | @ -569,7 +555,7 @@ func (re *Regexp) ReplaceAll(src, repl []byte) []byte { | |||
| } | ||||
| 
 | ||||
| func (re *Regexp) ReplaceAllFunc(src []byte, repl func([]byte) []byte) []byte { | ||||
| 	return re.replaceAll(src, []byte(""), func(_ []byte, matchBytes []byte, _ map[string][]byte) []byte { | ||||
| 	return re.replaceAll(src, nil, func(_ []byte, matchBytes []byte, _ map[string][]byte) []byte { | ||||
| 		return repl(matchBytes) | ||||
| 	}) | ||||
| } | ||||
|  | @ -579,43 +565,44 @@ func (re *Regexp) ReplaceAllString(src, repl string) string { | |||
| } | ||||
| 
 | ||||
| func (re *Regexp) ReplaceAllStringFunc(src string, repl func(string) string) string { | ||||
| 	srcB := []byte(src) | ||||
| 	destB := re.replaceAll(srcB, []byte(""), func(_ []byte, matchBytes []byte, _ map[string][]byte) []byte { | ||||
| 	return string(re.replaceAll([]byte(src), nil, func(_ []byte, matchBytes []byte, _ map[string][]byte) []byte { | ||||
| 		return []byte(repl(string(matchBytes))) | ||||
| 	}) | ||||
| 	return string(destB) | ||||
| 	})) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) String() string { | ||||
| 	return re.pattern | ||||
| } | ||||
| 
 | ||||
| func grow_buffer(b []byte, offset int, n int) []byte { | ||||
| func growBuffer(b []byte, offset int, n int) []byte { | ||||
| 	if offset+n > cap(b) { | ||||
| 		buf := make([]byte, 2*cap(b)+n) | ||||
| 		copy(buf, b[:offset]) | ||||
| 		return buf | ||||
| 	} | ||||
| 
 | ||||
| 	return b | ||||
| } | ||||
| 
 | ||||
| func fromReader(r io.RuneReader) []byte { | ||||
| 	b := make([]byte, numReadBufferStartSize) | ||||
| 	offset := 0 | ||||
| 	var err error = nil | ||||
| 	for err == nil { | ||||
| 
 | ||||
| 	var offset int | ||||
| 	for { | ||||
| 		rune, runeWidth, err := r.ReadRune() | ||||
| 		if err == nil { | ||||
| 			b = grow_buffer(b, offset, runeWidth) | ||||
| 			writeWidth := utf8.EncodeRune(b[offset:], rune) | ||||
| 			if runeWidth != writeWidth { | ||||
| 				panic("reading rune width not equal to the written rune width") | ||||
| 			} | ||||
| 			offset += writeWidth | ||||
| 		} else { | ||||
| 		if err != nil { | ||||
| 			break | ||||
| 		} | ||||
| 
 | ||||
| 		b = growBuffer(b, offset, runeWidth) | ||||
| 		writeWidth := utf8.EncodeRune(b[offset:], rune) | ||||
| 		if runeWidth != writeWidth { | ||||
| 			panic("reading rune width not equal to the written rune width") | ||||
| 		} | ||||
| 
 | ||||
| 		offset += writeWidth | ||||
| 	} | ||||
| 
 | ||||
| 	return b[:offset] | ||||
| } | ||||
| 
 | ||||
|  | @ -644,25 +631,25 @@ func MatchString(pattern string, s string) (matched bool, error error) { | |||
| 	if err != nil { | ||||
| 		return false, err | ||||
| 	} | ||||
| 
 | ||||
| 	return re.MatchString(s), nil | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) Gsub(src, repl string) string { | ||||
| 	srcBytes := ([]byte)(src) | ||||
| 	replBytes := ([]byte)(repl) | ||||
| 	replaced := re.replaceAll(srcBytes, replBytes, fillCapturedValues) | ||||
| 	return string(replaced) | ||||
| 	return string(re.replaceAll([]byte(src), []byte(repl), fillCapturedValues)) | ||||
| } | ||||
| 
 | ||||
| func (re *Regexp) GsubFunc(src string, replFunc func(string, map[string]string) string) string { | ||||
| 	srcBytes := ([]byte)(src) | ||||
| 	replaced := re.replaceAll(srcBytes, nil, func(_ []byte, matchBytes []byte, capturedBytes map[string][]byte) []byte { | ||||
| 		capturedStrings := make(map[string]string) | ||||
| 		for name, capBytes := range capturedBytes { | ||||
| 			capturedStrings[name] = string(capBytes) | ||||
| 		} | ||||
| 		matchString := string(matchBytes) | ||||
| 		return ([]byte)(replFunc(matchString, capturedStrings)) | ||||
| 	}) | ||||
| 	replaced := re.replaceAll([]byte(src), nil, | ||||
| 		func(_ []byte, matchBytes []byte, capturedBytes map[string][]byte) []byte { | ||||
| 			capturedStrings := make(map[string]string) | ||||
| 			for name, capBytes := range capturedBytes { | ||||
| 				capturedStrings[name] = string(capBytes) | ||||
| 			} | ||||
| 			matchString := string(matchBytes) | ||||
| 			return ([]byte)(replFunc(matchString, capturedStrings)) | ||||
| 		}, | ||||
| 	) | ||||
| 
 | ||||
| 	return string(replaced) | ||||
| } | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue