Add counting mode, and only programming languages flags. (#110)

Signed-off-by: Zachary Romero <zacromero3@gmail.com>
This commit is contained in:
Zachary Romero 2018-02-23 18:06:05 +03:00 committed by Denys Smirnov
parent 83cc32253e
commit 35d103b4e4
2 changed files with 169 additions and 31 deletions

View File

@ -1,6 +1,7 @@
package main package main
import ( import (
"bufio"
"bytes" "bytes"
"encoding/json" "encoding/json"
"flag" "flag"
@ -27,6 +28,9 @@ func main() {
breakdownFlag := flag.Bool("breakdown", false, "") breakdownFlag := flag.Bool("breakdown", false, "")
jsonFlag := flag.Bool("json", false, "") jsonFlag := flag.Bool("json", false, "")
showVersion := flag.Bool("version", false, "Show the enry version information") showVersion := flag.Bool("version", false, "Show the enry version information")
onlyProg := flag.Bool("prog", false, "Only show programming file types in output")
countMode := flag.String("mode", "file", "the method used to count file size. Available options are: file, line and byte")
flag.Parse() flag.Parse()
if *showVersion { if *showVersion {
@ -45,7 +49,10 @@ func main() {
} }
if fileInfo.Mode().IsRegular() { if fileInfo.Mode().IsRegular() {
printFileAnalysis(root) err = printFileAnalysis(root)
if err != nil {
fmt.Println(err)
}
return return
} }
@ -103,6 +110,11 @@ func main() {
} }
} }
// If we are displaying only prog. and language is not prog. skip it.
if *onlyProg && enry.GetLanguageType(language) != enry.Programming {
return nil
}
out[language] = append(out[language], relativePath) out[language] = append(out[language], relativePath)
return nil return nil
}) })
@ -118,11 +130,11 @@ func main() {
case *jsonFlag && *breakdownFlag: case *jsonFlag && *breakdownFlag:
printBreakDown(out, &buff) printBreakDown(out, &buff)
case *breakdownFlag: case *breakdownFlag:
printPercents(out, &buff) printPercents(out, &buff, *countMode)
buff.WriteByte('\n') buff.WriteByte('\n')
printBreakDown(out, &buff) printBreakDown(out, &buff)
default: default:
printPercents(out, &buff) printPercents(out, &buff, *countMode)
} }
fmt.Print(buff.String()) fmt.Print(buff.String())
@ -133,9 +145,9 @@ func usage() {
os.Stderr, os.Stderr,
` %[1]s %[2]s build: %[3]s commit: %[4]s, based on linguist commit: %[5]s ` %[1]s %[2]s build: %[3]s commit: %[4]s, based on linguist commit: %[5]s
%[1]s, A simple (and faster) implementation of github/linguist %[1]s, A simple (and faster) implementation of github/linguist
usage: %[1]s <path> usage: %[1]s [-mode=(file|line|byte)] [-prog] <path>
%[1]s [-json] [-breakdown] <path> %[1]s [-mode=(file|line|byte)] [-prog] [-json] [-breakdown] <path>
%[1]s [-json] [-breakdown] %[1]s [-mode=(file|line|byte)] [-prog] [-json] [-breakdown]
%[1]s [-version] %[1]s [-version]
`, `,
os.Args[0], version, build, commit, data.LinguistCommit[:7], os.Args[0], version, build, commit, data.LinguistCommit[:7],
@ -159,33 +171,107 @@ func printJson(out map[string][]string, buff *bytes.Buffer) {
buff.WriteByte('\n') buff.WriteByte('\n')
} }
func printPercents(out map[string][]string, buff *bytes.Buffer) { // filelistError represents a failed operation that took place across multiple files.
var fileCountList enry.FileCountList type filelistError []string
total := 0
for name, language := range out {
fc := enry.FileCount{Name: name, Count: len(language)}
fileCountList = append(fileCountList, fc)
total += len(language)
}
// Sort the fileCountList in descending order of their count value.
sort.Sort(sort.Reverse(fileCountList))
for _, fc := range fileCountList { func (e filelistError) Error() string {
percent := float32(fc.Count) / float32(total) * 100 return fmt.Sprintf("Could not process the following files:\n%s", strings.Join(e, "\n"))
buff.WriteString(fmt.Sprintf("%.2f%% %s\n", percent, fc.Name))
}
} }
func printFileAnalysis(file string) { func printPercents(fSummary map[string][]string, buff *bytes.Buffer, mode string) {
content, err := ioutil.ReadFile(file) // Select the way we quantify 'amount' of code.
var reducer func([]string) (float64, filelistError)
switch mode {
case "file":
reducer = fileCountValues
case "line":
reducer = lineCountValues
case "byte":
reducer = byteCountValues
default:
reducer = fileCountValues
}
// Reduce the list of files to a quantity of file type.
var total float64
fileValues := make(map[string]float64)
keys := []string{}
var unreadableFiles filelistError
for fType, files := range fSummary {
val, err := reducer(files)
if err != nil { if err != nil {
fmt.Println(err) unreadableFiles = append(unreadableFiles, err...)
}
fileValues[fType] = val
keys = append(keys, fType)
total += val
} }
totalLines, nonBlank := getLines(file, string(content)) // Slice the keys by their quantity (file count, line count, byte size, etc.).
fileType := getFileType(file, content) sort.Slice(keys, func(i, j int) bool {
language := enry.GetLanguage(file, content) return fileValues[keys[i]] > fileValues[keys[j]]
mimeType := enry.GetMimeType(file, language) })
// Calculate and write percentages of each file type.
for _, fType := range keys {
val := fileValues[fType]
percent := val / total * 100.0
buff.WriteString(fmt.Sprintf("%.2f%%\t%s\n", percent, fType))
if unreadableFiles != nil {
buff.WriteString(fmt.Sprintf("\n%s", unreadableFiles.Error()))
}
}
}
func fileCountValues(files []string) (float64, filelistError) {
return float64(len(files)), nil
}
func lineCountValues(files []string) (float64, filelistError) {
var filesErr filelistError
var t float64
for _, fName := range files {
content, err := ioutil.ReadFile(fName)
if err != nil {
filesErr = append(filesErr, fName)
continue
}
l, _ := getLines(content)
t += float64(l)
}
return t, filesErr
}
func byteCountValues(files []string) (float64, filelistError) {
var filesErr filelistError
var t float64
for _, fName := range files {
f, err := os.Open(fName)
if err != nil {
filesErr = append(filesErr, fName)
continue
}
fi, err := f.Stat()
f.Close()
if err != nil {
filesErr = append(filesErr, fName)
continue
}
t += float64(fi.Size())
}
return t, filesErr
}
func printFileAnalysis(fName string) error {
content, err := ioutil.ReadFile(fName)
if err != nil {
return err
}
totalLines, nonBlank := getLines(content)
fileType := getFileType(fName, content)
language := enry.GetLanguage(fName, content)
mimeType := enry.GetMimeType(fName, language)
fmt.Printf( fmt.Printf(
`%s: %d lines (%d sloc) `%s: %d lines (%d sloc)
@ -193,14 +279,30 @@ func printFileAnalysis(file string) {
mime_type: %s mime_type: %s
language: %s language: %s
`, `,
filepath.Base(file), totalLines, nonBlank, fileType, mimeType, language, filepath.Base(fName), totalLines, nonBlank, fileType, mimeType, language,
) )
return nil
} }
func getLines(file string, content string) (int, int) { func getLines(b []byte) (total int, nonBlank int) {
totalLines := strings.Count(content, "\n") scanner := bufio.NewScanner(bytes.NewReader(b))
nonBlank := totalLines - strings.Count(content, "\n\n") lineCt := 0
return totalLines, nonBlank blankCt := 0
for scanner.Scan() {
lineCt++
line := bytes.TrimSpace(scanner.Bytes())
if len(line) == 0 {
blankCt++
}
}
// Scanner doesn't catch the case of last byte newline.
if len(b) > 0 && b[len(b)-1] == '\n' {
lineCt++
blankCt++
}
return lineCt, lineCt - blankCt
} }
func getFileType(file string, content []byte) string { func getFileType(file string, content []byte) string {

36
cmd/enry/main_test.go Normal file
View File

@ -0,0 +1,36 @@
package main
import (
"testing"
)
func TestGetLines(t *testing.T) {
tests := []struct {
content string
wantTotal int
wantNonBlank int
}{
// 0
{content: "This is one line", wantTotal: 1, wantNonBlank: 1},
// 1 Test no content
{content: "", wantTotal: 0, wantNonBlank: 0},
// 2 A single blank line
{content: "One blank line\n\nTwo nonblank lines", wantTotal: 3, wantNonBlank: 2},
// 3 Testing multiple blank lines in a row
{content: "\n\n", wantTotal: 3, wantNonBlank: 0},
// 4 '
{content: "\n\n\n\n", wantTotal: 5, wantNonBlank: 0},
// 5 Multiple blank lines content on ends
{content: "content\n\n\n\ncontent", wantTotal: 5, wantNonBlank: 2},
// 6 Content with blank lines on ends
{content: "\n\n\ncontent\n\n\n", wantTotal: 7, wantNonBlank: 1},
}
for i, test := range tests {
gotTotal, gotNonBlank := getLines([]byte(test.content))
if gotTotal != test.wantTotal || gotNonBlank != test.wantNonBlank {
t.Errorf("wrong line counts obtained for test case #%d:\n %7s, %7s\nGOT: %7d, %7d\nWANT: %7d, %7d\n", i, "TOTAL", "NON_BLANK",
gotTotal, gotNonBlank, test.wantTotal, test.wantNonBlank)
}
}
}