mirror of
https://github.com/ralsina/tartrazine.git
synced 2025-06-19 22:53:05 -03:00
new by content heuristisc
This commit is contained in:
@ -1,10 +1,12 @@
|
||||
package slinguist
|
||||
|
||||
import (
|
||||
"fmt"
|
||||
"io/ioutil"
|
||||
"os"
|
||||
"path"
|
||||
"path/filepath"
|
||||
"text/tabwriter"
|
||||
|
||||
. "gopkg.in/check.v1"
|
||||
)
|
||||
@ -28,6 +30,7 @@ func (s *TSuite) TestGetLanguageByContentH(c *C) {
|
||||
s.testGetLanguageByContent(c, "Prolog")
|
||||
s.testGetLanguageByContent(c, "Perl")
|
||||
s.testGetLanguageByContent(c, "Perl6")
|
||||
s.testGetLanguageByContent(c, "Hack")
|
||||
}
|
||||
|
||||
func (s *TSuite) testGetLanguageByContent(c *C, expected string) {
|
||||
@ -41,7 +44,6 @@ func (s *TSuite) testGetLanguageByContent(c *C, expected string) {
|
||||
}
|
||||
|
||||
content, _ := ioutil.ReadFile(file)
|
||||
|
||||
obtained, _ := GetLanguageByContent(path.Base(file), content)
|
||||
if obtained == OtherLanguage {
|
||||
continue
|
||||
@ -50,3 +52,51 @@ func (s *TSuite) testGetLanguageByContent(c *C, expected string) {
|
||||
c.Check(obtained, Equals, expected, Commentf(file))
|
||||
}
|
||||
}
|
||||
|
||||
func (s *TSuite) TestGetLanguageByContentLinguistCorpus(c *C) {
|
||||
var total, failed, ok, other, unsafe int
|
||||
|
||||
w := new(tabwriter.Writer)
|
||||
w.Init(os.Stdout, 0, 8, 0, '\t', 0)
|
||||
|
||||
filepath.Walk(".linguist/samples", func(path string, f os.FileInfo, err error) error {
|
||||
if f.IsDir() {
|
||||
if f.Name() == "filenames" {
|
||||
return filepath.SkipDir
|
||||
}
|
||||
return nil
|
||||
}
|
||||
|
||||
total++
|
||||
expected := filepath.Base(filepath.Dir(path))
|
||||
filename := filepath.Base(path)
|
||||
content, _ := ioutil.ReadFile(path)
|
||||
|
||||
obtained, safe := GetLanguageByContent(filename, content)
|
||||
if obtained == OtherLanguage {
|
||||
other++
|
||||
}
|
||||
|
||||
var status string
|
||||
if expected == obtained {
|
||||
status = "ok"
|
||||
ok++
|
||||
} else {
|
||||
status = "failed"
|
||||
failed++
|
||||
if !safe {
|
||||
unsafe++
|
||||
}
|
||||
}
|
||||
|
||||
fmt.Fprintf(w, "%s\t%s\t%s\t%v\t%s\n", filename, expected, obtained, safe, status)
|
||||
|
||||
return nil
|
||||
})
|
||||
|
||||
fmt.Fprintln(w)
|
||||
w.Flush()
|
||||
|
||||
fmt.Printf("total files: %d, ok: %d, failed: %d, unsafe: %d, other: %d\n", total, ok, failed, unsafe, other)
|
||||
|
||||
}
|
||||
|
Reference in New Issue
Block a user