mirror of
https://codeberg.org/forgejo/forgejo
synced 2024-11-30 05:36:07 +01:00
cf27403e18
Fix #22023 I've changed how the percentages for the language statistics are rounded because they did not always add up to 100% Now it's done with the largest remainder method, which makes sure that total is 100% Co-authored-by: Lauris BH <lauris@nix.lv>
243 lines
6.1 KiB
Go
243 lines
6.1 KiB
Go
// Copyright 2020 The Gitea Authors. All rights reserved.
|
|
// SPDX-License-Identifier: MIT
|
|
|
|
package repo
|
|
|
|
import (
|
|
"context"
|
|
"math"
|
|
"sort"
|
|
"strings"
|
|
|
|
"code.gitea.io/gitea/models/db"
|
|
"code.gitea.io/gitea/modules/timeutil"
|
|
|
|
"github.com/go-enry/go-enry/v2"
|
|
)
|
|
|
|
// LanguageStat describes language statistics of a repository
|
|
type LanguageStat struct {
|
|
ID int64 `xorm:"pk autoincr"`
|
|
RepoID int64 `xorm:"UNIQUE(s) INDEX NOT NULL"`
|
|
CommitID string
|
|
IsPrimary bool
|
|
Language string `xorm:"VARCHAR(50) UNIQUE(s) INDEX NOT NULL"`
|
|
Percentage float32 `xorm:"-"`
|
|
Size int64 `xorm:"NOT NULL DEFAULT 0"`
|
|
Color string `xorm:"-"`
|
|
CreatedUnix timeutil.TimeStamp `xorm:"INDEX CREATED"`
|
|
}
|
|
|
|
func init() {
|
|
db.RegisterModel(new(LanguageStat))
|
|
}
|
|
|
|
// LanguageStatList defines a list of language statistics
|
|
type LanguageStatList []*LanguageStat
|
|
|
|
// LoadAttributes loads attributes
|
|
func (stats LanguageStatList) LoadAttributes() {
|
|
for i := range stats {
|
|
stats[i].Color = enry.GetColor(stats[i].Language)
|
|
}
|
|
}
|
|
|
|
func (stats LanguageStatList) getLanguagePercentages() map[string]float32 {
|
|
langPerc := make(map[string]float32)
|
|
var otherPerc float32
|
|
var total int64
|
|
|
|
for _, stat := range stats {
|
|
total += stat.Size
|
|
}
|
|
if total > 0 {
|
|
for _, stat := range stats {
|
|
perc := float32(float64(stat.Size) / float64(total) * 100)
|
|
if perc <= 0.1 {
|
|
otherPerc += perc
|
|
continue
|
|
}
|
|
langPerc[stat.Language] = perc
|
|
}
|
|
}
|
|
if otherPerc > 0 {
|
|
langPerc["other"] = otherPerc
|
|
}
|
|
roundByLargestRemainder(langPerc, 100)
|
|
return langPerc
|
|
}
|
|
|
|
// Rounds to 1 decimal point, target should be the expected sum of percs
|
|
func roundByLargestRemainder(percs map[string]float32, target float32) {
|
|
leftToDistribute := int(target * 10)
|
|
|
|
keys := make([]string, 0, len(percs))
|
|
|
|
for k, v := range percs {
|
|
percs[k] = v * 10
|
|
floored := math.Floor(float64(percs[k]))
|
|
leftToDistribute -= int(floored)
|
|
keys = append(keys, k)
|
|
}
|
|
|
|
// Sort the keys by the largest remainder
|
|
sort.SliceStable(keys, func(i, j int) bool {
|
|
_, remainderI := math.Modf(float64(percs[keys[i]]))
|
|
_, remainderJ := math.Modf(float64(percs[keys[j]]))
|
|
return remainderI > remainderJ
|
|
})
|
|
|
|
// Increment the values in order of largest remainder
|
|
for _, k := range keys {
|
|
percs[k] = float32(math.Floor(float64(percs[k])))
|
|
if leftToDistribute > 0 {
|
|
percs[k]++
|
|
leftToDistribute--
|
|
}
|
|
percs[k] /= 10
|
|
}
|
|
}
|
|
|
|
// GetLanguageStats returns the language statistics for a repository
|
|
func GetLanguageStats(ctx context.Context, repo *Repository) (LanguageStatList, error) {
|
|
stats := make(LanguageStatList, 0, 6)
|
|
if err := db.GetEngine(ctx).Where("`repo_id` = ?", repo.ID).Desc("`size`").Find(&stats); err != nil {
|
|
return nil, err
|
|
}
|
|
return stats, nil
|
|
}
|
|
|
|
// GetTopLanguageStats returns the top language statistics for a repository
|
|
func GetTopLanguageStats(repo *Repository, limit int) (LanguageStatList, error) {
|
|
stats, err := GetLanguageStats(db.DefaultContext, repo)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
perc := stats.getLanguagePercentages()
|
|
topstats := make(LanguageStatList, 0, limit)
|
|
var other float32
|
|
for i := range stats {
|
|
if _, ok := perc[stats[i].Language]; !ok {
|
|
continue
|
|
}
|
|
if stats[i].Language == "other" || len(topstats) >= limit {
|
|
other += perc[stats[i].Language]
|
|
continue
|
|
}
|
|
stats[i].Percentage = perc[stats[i].Language]
|
|
topstats = append(topstats, stats[i])
|
|
}
|
|
if other > 0 {
|
|
topstats = append(topstats, &LanguageStat{
|
|
RepoID: repo.ID,
|
|
Language: "other",
|
|
Color: "#cccccc",
|
|
Percentage: float32(math.Round(float64(other)*10) / 10),
|
|
})
|
|
}
|
|
topstats.LoadAttributes()
|
|
return topstats, nil
|
|
}
|
|
|
|
// UpdateLanguageStats updates the language statistics for repository
|
|
func UpdateLanguageStats(repo *Repository, commitID string, stats map[string]int64) error {
|
|
ctx, committer, err := db.TxContext(db.DefaultContext)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer committer.Close()
|
|
sess := db.GetEngine(ctx)
|
|
|
|
oldstats, err := GetLanguageStats(ctx, repo)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
var topLang string
|
|
var s int64
|
|
for lang, size := range stats {
|
|
if size > s {
|
|
s = size
|
|
topLang = strings.ToLower(lang)
|
|
}
|
|
}
|
|
|
|
for lang, size := range stats {
|
|
upd := false
|
|
llang := strings.ToLower(lang)
|
|
for _, s := range oldstats {
|
|
// Update already existing language
|
|
if strings.ToLower(s.Language) == llang {
|
|
s.CommitID = commitID
|
|
s.IsPrimary = llang == topLang
|
|
s.Size = size
|
|
if _, err := sess.ID(s.ID).Cols("`commit_id`", "`size`", "`is_primary`").Update(s); err != nil {
|
|
return err
|
|
}
|
|
upd = true
|
|
break
|
|
}
|
|
}
|
|
// Insert new language
|
|
if !upd {
|
|
if err := db.Insert(ctx, &LanguageStat{
|
|
RepoID: repo.ID,
|
|
CommitID: commitID,
|
|
IsPrimary: llang == topLang,
|
|
Language: lang,
|
|
Size: size,
|
|
}); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
}
|
|
// Delete old languages
|
|
statsToDelete := make([]int64, 0, len(oldstats))
|
|
for _, s := range oldstats {
|
|
if s.CommitID != commitID {
|
|
statsToDelete = append(statsToDelete, s.ID)
|
|
}
|
|
}
|
|
if len(statsToDelete) > 0 {
|
|
if _, err := sess.In("`id`", statsToDelete).Delete(&LanguageStat{}); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
// Update indexer status
|
|
if err = UpdateIndexerStatus(ctx, repo, RepoIndexerTypeStats, commitID); err != nil {
|
|
return err
|
|
}
|
|
|
|
return committer.Commit()
|
|
}
|
|
|
|
// CopyLanguageStat Copy originalRepo language stat information to destRepo (use for forked repo)
|
|
func CopyLanguageStat(originalRepo, destRepo *Repository) error {
|
|
ctx, committer, err := db.TxContext(db.DefaultContext)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer committer.Close()
|
|
|
|
RepoLang := make(LanguageStatList, 0, 6)
|
|
if err := db.GetEngine(ctx).Where("`repo_id` = ?", originalRepo.ID).Desc("`size`").Find(&RepoLang); err != nil {
|
|
return err
|
|
}
|
|
if len(RepoLang) > 0 {
|
|
for i := range RepoLang {
|
|
RepoLang[i].ID = 0
|
|
RepoLang[i].RepoID = destRepo.ID
|
|
RepoLang[i].CreatedUnix = timeutil.TimeStampNow()
|
|
}
|
|
// update destRepo's indexer status
|
|
tmpCommitID := RepoLang[0].CommitID
|
|
if err := UpdateIndexerStatus(ctx, destRepo, RepoIndexerTypeStats, tmpCommitID); err != nil {
|
|
return err
|
|
}
|
|
if err := db.Insert(ctx, &RepoLang); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
return committer.Commit()
|
|
}
|