2020-02-11 11:34:17 +02:00
|
|
|
// Copyright 2020 The Gitea Authors. All rights reserved.
|
2022-11-27 13:20:29 -05:00
|
|
|
// SPDX-License-Identifier: MIT
|
2020-02-11 11:34:17 +02:00
|
|
|
|
|
|
|
package git
|
|
|
|
|
2023-05-25 03:37:36 +08:00
|
|
|
import (
|
|
|
|
"strings"
|
|
|
|
"unicode"
|
|
|
|
)
|
|
|
|
|
2022-01-20 18:46:10 +01:00
|
|
|
const (
|
|
|
|
fileSizeLimit int64 = 16 * 1024 // 16 KiB
|
|
|
|
bigFileSize int64 = 1024 * 1024 // 1 MiB
|
|
|
|
)
|
2023-05-25 03:37:36 +08:00
|
|
|
|
2024-01-11 00:20:32 +01:00
|
|
|
type LinguistBoolAttrib struct {
|
|
|
|
Value string
|
|
|
|
}
|
|
|
|
|
|
|
|
func (attrib *LinguistBoolAttrib) IsTrue() bool {
|
|
|
|
return attrib.Value == "set" || attrib.Value == "true"
|
|
|
|
}
|
|
|
|
|
|
|
|
func (attrib *LinguistBoolAttrib) IsFalse() bool {
|
|
|
|
return attrib.Value == "unset" || attrib.Value == "false"
|
|
|
|
}
|
|
|
|
|
2023-05-25 03:37:36 +08:00
|
|
|
// mergeLanguageStats mergers language names with different cases. The name with most upper case letters is used.
|
|
|
|
func mergeLanguageStats(stats map[string]int64) map[string]int64 {
|
|
|
|
names := map[string]struct {
|
|
|
|
uniqueName string
|
|
|
|
upperCount int
|
|
|
|
}{}
|
|
|
|
|
|
|
|
countUpper := func(s string) (count int) {
|
|
|
|
for _, r := range s {
|
|
|
|
if unicode.IsUpper(r) {
|
|
|
|
count++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return count
|
|
|
|
}
|
|
|
|
|
|
|
|
for name := range stats {
|
|
|
|
cnt := countUpper(name)
|
|
|
|
lower := strings.ToLower(name)
|
|
|
|
if cnt >= names[lower].upperCount {
|
|
|
|
names[lower] = struct {
|
|
|
|
uniqueName string
|
|
|
|
upperCount int
|
|
|
|
}{uniqueName: name, upperCount: cnt}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
res := make(map[string]int64, len(names))
|
|
|
|
for name, num := range stats {
|
|
|
|
res[names[strings.ToLower(name)].uniqueName] += num
|
|
|
|
}
|
|
|
|
return res
|
|
|
|
}
|