2019-12-12 08:18:07 -05:00
// Copyright 2019 The Gitea Authors. All rights reserved.
// Use of this source code is governed by a MIT-style
// license that can be found in the LICENSE file.
package git
import (
"bytes"
2021-09-09 16:13:36 -04:00
"context"
2019-12-12 08:18:07 -05:00
"fmt"
2021-09-09 16:13:36 -04:00
"io"
"os"
"strconv"
"strings"
2021-09-20 15:46:51 -04:00
"code.gitea.io/gitea/modules/log"
2019-12-12 08:18:07 -05:00
)
// CheckAttributeOpts represents the possible options to CheckAttribute
type CheckAttributeOpts struct {
CachedOnly bool
AllAttributes bool
Attributes [ ] string
Filenames [ ] string
2021-11-17 15:37:00 -05:00
IndexFile string
WorkTree string
2019-12-12 08:18:07 -05:00
}
// CheckAttribute return the Blame object of file
func ( repo * Repository ) CheckAttribute ( opts CheckAttributeOpts ) ( map [ string ] map [ string ] string , error ) {
2021-11-17 15:37:00 -05:00
env := [ ] string { }
2022-06-16 11:47:44 -04:00
if len ( opts . IndexFile ) > 0 {
2021-11-17 15:37:00 -05:00
env = append ( env , "GIT_INDEX_FILE=" + opts . IndexFile )
}
2022-06-16 11:47:44 -04:00
if len ( opts . WorkTree ) > 0 {
2021-11-17 15:37:00 -05:00
env = append ( env , "GIT_WORK_TREE=" + opts . WorkTree )
}
if len ( env ) > 0 {
env = append ( os . Environ ( ) , env ... )
}
2019-12-12 08:18:07 -05:00
stdOut := new ( bytes . Buffer )
stdErr := new ( bytes . Buffer )
cmdArgs := [ ] string { "check-attr" , "-z" }
if opts . AllAttributes {
cmdArgs = append ( cmdArgs , "-a" )
} else {
for _ , attribute := range opts . Attributes {
if attribute != "" {
cmdArgs = append ( cmdArgs , attribute )
}
}
}
2022-06-16 11:47:44 -04:00
if opts . CachedOnly {
2019-12-12 08:18:07 -05:00
cmdArgs = append ( cmdArgs , "--cached" )
}
cmdArgs = append ( cmdArgs , "--" )
for _ , arg := range opts . Filenames {
if arg != "" {
cmdArgs = append ( cmdArgs , arg )
}
}
2022-02-06 14:01:47 -05:00
cmd := NewCommand ( repo . Ctx , cmdArgs ... )
2019-12-12 08:18:07 -05:00
2022-03-31 22:55:30 -04:00
if err := cmd . Run ( & RunOpts {
Env : env ,
Dir : repo . Path ,
Stdout : stdOut ,
Stderr : stdErr ,
2022-02-11 07:47:22 -05:00
} ) ; err != nil {
2021-09-09 16:13:36 -04:00
return nil , fmt . Errorf ( "failed to run check-attr: %v\n%s\n%s" , err , stdOut . String ( ) , stdErr . String ( ) )
2019-12-12 08:18:07 -05:00
}
2021-09-09 16:13:36 -04:00
// FIXME: This is incorrect on versions < 1.8.5
2019-12-12 08:18:07 -05:00
fields := bytes . Split ( stdOut . Bytes ( ) , [ ] byte { '\000' } )
if len ( fields ) % 3 != 1 {
2021-09-09 16:13:36 -04:00
return nil , fmt . Errorf ( "wrong number of fields in return from check-attr" )
2019-12-12 08:18:07 -05:00
}
2022-01-20 12:46:10 -05:00
name2attribute2info := make ( map [ string ] map [ string ] string )
2019-12-12 08:18:07 -05:00
for i := 0 ; i < ( len ( fields ) / 3 ) ; i ++ {
filename := string ( fields [ 3 * i ] )
attribute := string ( fields [ 3 * i + 1 ] )
info := string ( fields [ 3 * i + 2 ] )
attribute2info := name2attribute2info [ filename ]
if attribute2info == nil {
attribute2info = make ( map [ string ] string )
}
attribute2info [ attribute ] = info
name2attribute2info [ filename ] = attribute2info
}
return name2attribute2info , nil
}
2021-09-09 16:13:36 -04:00
// CheckAttributeReader provides a reader for check-attribute content that can be long running
type CheckAttributeReader struct {
// params
Attributes [ ] string
Repo * Repository
IndexFile string
WorkTree string
stdinReader io . ReadCloser
stdinWriter * os . File
stdOut attributeWriter
cmd * Command
env [ ] string
ctx context . Context
cancel context . CancelFunc
}
2022-06-09 21:57:49 -04:00
// Init initializes the CheckAttributeReader
2021-09-09 16:13:36 -04:00
func ( c * CheckAttributeReader ) Init ( ctx context . Context ) error {
cmdArgs := [ ] string { "check-attr" , "--stdin" , "-z" }
2022-06-16 11:47:44 -04:00
if len ( c . IndexFile ) > 0 {
2021-09-09 16:13:36 -04:00
cmdArgs = append ( cmdArgs , "--cached" )
2021-09-20 15:46:51 -04:00
c . env = append ( c . env , "GIT_INDEX_FILE=" + c . IndexFile )
2021-09-09 16:13:36 -04:00
}
2022-06-16 11:47:44 -04:00
if len ( c . WorkTree ) > 0 {
2021-09-20 15:46:51 -04:00
c . env = append ( c . env , "GIT_WORK_TREE=" + c . WorkTree )
2021-09-09 16:13:36 -04:00
}
2021-09-20 15:46:51 -04:00
c . env = append ( c . env , "GIT_FLUSH=1" )
if len ( c . Attributes ) == 0 {
2021-09-09 16:13:36 -04:00
lw := new ( nulSeparatedAttributeWriter )
lw . attributes = make ( chan attributeTriple )
2021-09-20 15:46:51 -04:00
lw . closed = make ( chan struct { } )
2021-09-09 16:13:36 -04:00
c . stdOut = lw
c . stdOut . Close ( )
return fmt . Errorf ( "no provided Attributes to check" )
}
2021-09-20 15:46:51 -04:00
cmdArgs = append ( cmdArgs , c . Attributes ... )
cmdArgs = append ( cmdArgs , "--" )
2021-09-09 16:13:36 -04:00
c . ctx , c . cancel = context . WithCancel ( ctx )
2022-02-06 14:01:47 -05:00
c . cmd = NewCommand ( c . ctx , cmdArgs ... )
2021-09-20 15:46:51 -04:00
2021-09-09 16:13:36 -04:00
var err error
2021-09-20 15:46:51 -04:00
2021-09-09 16:13:36 -04:00
c . stdinReader , c . stdinWriter , err = os . Pipe ( )
if err != nil {
2021-09-20 15:46:51 -04:00
c . cancel ( )
2021-09-09 16:13:36 -04:00
return err
}
2022-06-16 11:47:44 -04:00
lw := new ( nulSeparatedAttributeWriter )
lw . attributes = make ( chan attributeTriple , 5 )
lw . closed = make ( chan struct { } )
c . stdOut = lw
2021-09-09 16:13:36 -04:00
return nil
}
// Run run cmd
func ( c * CheckAttributeReader ) Run ( ) error {
2021-09-20 15:46:51 -04:00
defer func ( ) {
2022-02-14 12:03:56 -05:00
_ = c . stdinReader . Close ( )
_ = c . stdOut . Close ( )
2021-09-20 15:46:51 -04:00
} ( )
2021-09-09 16:13:36 -04:00
stdErr := new ( bytes . Buffer )
2022-03-31 22:55:30 -04:00
err := c . cmd . Run ( & RunOpts {
Env : c . env ,
Dir : c . Repo . Path ,
Stdin : c . stdinReader ,
Stdout : c . stdOut ,
Stderr : stdErr ,
2021-09-09 16:13:36 -04:00
} )
2022-03-08 03:30:14 -05:00
if err != nil && // If there is an error we need to return but:
c . ctx . Err ( ) != err && // 1. Ignore the context error if the context is cancelled or exceeds the deadline (RunWithContext could return c.ctx.Err() which is Canceled or DeadlineExceeded)
err . Error ( ) != "signal: killed" { // 2. We should not pass up errors due to the program being killed
2021-09-09 16:13:36 -04:00
return fmt . Errorf ( "failed to run attr-check. Error: %w\nStderr: %s" , err , stdErr . String ( ) )
}
return nil
}
// CheckPath check attr for given path
2021-09-20 15:46:51 -04:00
func ( c * CheckAttributeReader ) CheckPath ( path string ) ( rs map [ string ] string , err error ) {
defer func ( ) {
2022-10-10 16:54:30 -04:00
if err != nil && err != c . ctx . Err ( ) {
log . Error ( "Unexpected error when checking path %s in %s. Error: %v" , path , c . Repo . Path , err )
2021-09-20 15:46:51 -04:00
}
} ( )
2021-09-09 16:13:36 -04:00
select {
case <- c . ctx . Done ( ) :
return nil , c . ctx . Err ( )
2022-04-27 23:19:33 -04:00
default :
2021-09-09 16:13:36 -04:00
}
2021-09-20 15:46:51 -04:00
if _ , err = c . stdinWriter . Write ( [ ] byte ( path + "\x00" ) ) ; err != nil {
defer c . Close ( )
2021-09-09 16:13:36 -04:00
return nil , err
}
2021-09-20 15:46:51 -04:00
rs = make ( map [ string ] string )
2021-09-09 16:13:36 -04:00
for range c . Attributes {
select {
2021-09-20 15:46:51 -04:00
case attr , ok := <- c . stdOut . ReadAttribute ( ) :
if ! ok {
return nil , c . ctx . Err ( )
}
2021-09-09 16:13:36 -04:00
rs [ attr . Attribute ] = attr . Value
case <- c . ctx . Done ( ) :
return nil , c . ctx . Err ( )
}
}
return rs , nil
}
// Close close pip after use
func ( c * CheckAttributeReader ) Close ( ) error {
2021-09-20 15:46:51 -04:00
c . cancel ( )
2022-02-14 12:03:56 -05:00
err := c . stdinWriter . Close ( )
2021-09-20 15:46:51 -04:00
return err
2021-09-09 16:13:36 -04:00
}
type attributeWriter interface {
io . WriteCloser
ReadAttribute ( ) <- chan attributeTriple
}
type attributeTriple struct {
Filename string
Attribute string
Value string
}
type nulSeparatedAttributeWriter struct {
tmp [ ] byte
attributes chan attributeTriple
2021-09-20 15:46:51 -04:00
closed chan struct { }
2021-09-09 16:13:36 -04:00
working attributeTriple
pos int
}
func ( wr * nulSeparatedAttributeWriter ) Write ( p [ ] byte ) ( n int , err error ) {
l , read := len ( p ) , 0
nulIdx := bytes . IndexByte ( p , '\x00' )
for nulIdx >= 0 {
wr . tmp = append ( wr . tmp , p [ : nulIdx ] ... )
switch wr . pos {
case 0 :
wr . working = attributeTriple {
Filename : string ( wr . tmp ) ,
}
case 1 :
wr . working . Attribute = string ( wr . tmp )
case 2 :
wr . working . Value = string ( wr . tmp )
}
wr . tmp = wr . tmp [ : 0 ]
wr . pos ++
if wr . pos > 2 {
wr . attributes <- wr . working
wr . pos = 0
}
read += nulIdx + 1
if l > read {
p = p [ nulIdx + 1 : ]
nulIdx = bytes . IndexByte ( p , '\x00' )
} else {
return l , nil
}
}
wr . tmp = append ( wr . tmp , p ... )
return len ( p ) , nil
}
func ( wr * nulSeparatedAttributeWriter ) ReadAttribute ( ) <- chan attributeTriple {
return wr . attributes
}
func ( wr * nulSeparatedAttributeWriter ) Close ( ) error {
2021-09-20 15:46:51 -04:00
select {
case <- wr . closed :
return nil
default :
}
2021-09-09 16:13:36 -04:00
close ( wr . attributes )
2021-09-20 15:46:51 -04:00
close ( wr . closed )
2021-09-09 16:13:36 -04:00
return nil
}
type lineSeparatedAttributeWriter struct {
tmp [ ] byte
attributes chan attributeTriple
2021-09-20 15:46:51 -04:00
closed chan struct { }
2021-09-09 16:13:36 -04:00
}
func ( wr * lineSeparatedAttributeWriter ) Write ( p [ ] byte ) ( n int , err error ) {
l := len ( p )
nlIdx := bytes . IndexByte ( p , '\n' )
for nlIdx >= 0 {
wr . tmp = append ( wr . tmp , p [ : nlIdx ] ... )
if len ( wr . tmp ) == 0 {
// This should not happen
if len ( p ) > nlIdx + 1 {
wr . tmp = wr . tmp [ : 0 ]
p = p [ nlIdx + 1 : ]
nlIdx = bytes . IndexByte ( p , '\n' )
continue
} else {
return l , nil
}
}
working := attributeTriple { }
if wr . tmp [ 0 ] == '"' {
sb := new ( strings . Builder )
remaining := string ( wr . tmp [ 1 : ] )
for len ( remaining ) > 0 {
rn , _ , tail , err := strconv . UnquoteChar ( remaining , '"' )
if err != nil {
if len ( remaining ) > 2 && remaining [ 0 ] == '"' && remaining [ 1 ] == ':' && remaining [ 2 ] == ' ' {
working . Filename = sb . String ( )
wr . tmp = [ ] byte ( remaining [ 3 : ] )
break
}
2022-06-20 06:02:49 -04:00
return l , fmt . Errorf ( "unexpected tail %s" , remaining )
2021-09-09 16:13:36 -04:00
}
_ , _ = sb . WriteRune ( rn )
remaining = tail
}
} else {
idx := bytes . IndexByte ( wr . tmp , ':' )
if idx < 0 {
return l , fmt . Errorf ( "unexpected input %s" , string ( wr . tmp ) )
}
working . Filename = string ( wr . tmp [ : idx ] )
if len ( wr . tmp ) < idx + 2 {
return l , fmt . Errorf ( "unexpected input %s" , string ( wr . tmp ) )
}
wr . tmp = wr . tmp [ idx + 2 : ]
}
idx := bytes . IndexByte ( wr . tmp , ':' )
if idx < 0 {
return l , fmt . Errorf ( "unexpected input %s" , string ( wr . tmp ) )
}
working . Attribute = string ( wr . tmp [ : idx ] )
if len ( wr . tmp ) < idx + 2 {
return l , fmt . Errorf ( "unexpected input %s" , string ( wr . tmp ) )
}
working . Value = string ( wr . tmp [ idx + 2 : ] )
wr . attributes <- working
wr . tmp = wr . tmp [ : 0 ]
if len ( p ) > nlIdx + 1 {
p = p [ nlIdx + 1 : ]
nlIdx = bytes . IndexByte ( p , '\n' )
continue
} else {
return l , nil
}
}
wr . tmp = append ( wr . tmp , p ... )
return l , nil
}
func ( wr * lineSeparatedAttributeWriter ) ReadAttribute ( ) <- chan attributeTriple {
return wr . attributes
}
func ( wr * lineSeparatedAttributeWriter ) Close ( ) error {
2021-09-20 15:46:51 -04:00
select {
case <- wr . closed :
return nil
default :
}
2021-09-09 16:13:36 -04:00
close ( wr . attributes )
2021-09-20 15:46:51 -04:00
close ( wr . closed )
2021-09-09 16:13:36 -04:00
return nil
}
2022-06-16 11:47:44 -04:00
// Create a check attribute reader for the current repository and provided commit ID
func ( repo * Repository ) CheckAttributeReader ( commitID string ) ( * CheckAttributeReader , context . CancelFunc ) {
indexFilename , worktree , deleteTemporaryFile , err := repo . ReadTreeToTemporaryIndex ( commitID )
if err != nil {
return nil , func ( ) { }
}
checker := & CheckAttributeReader {
Attributes : [ ] string { "linguist-vendored" , "linguist-generated" , "linguist-language" , "gitlab-language" } ,
Repo : repo ,
IndexFile : indexFilename ,
WorkTree : worktree ,
}
ctx , cancel := context . WithCancel ( repo . Ctx )
if err := checker . Init ( ctx ) ; err != nil {
log . Error ( "Unable to open checker for %s. Error: %v" , commitID , err )
} else {
go func ( ) {
err := checker . Run ( )
if err != nil && err != ctx . Err ( ) {
log . Error ( "Unable to open checker for %s. Error: %v" , commitID , err )
}
cancel ( )
} ( )
}
deferable := func ( ) {
_ = checker . Close ( )
cancel ( )
deleteTemporaryFile ( )
}
return checker , deferable
}