Rename Sample -> Samples

This commit is contained in:
Joshua Peek
2012-07-23 13:15:27 -05:00
parent 0c9a947f39
commit 80e8ee7ce6
6 changed files with 19 additions and 19 deletions

View File

@@ -9,8 +9,8 @@ end
file 'lib/linguist/samples.yml' => Dir['samples/**/*'] do |f| file 'lib/linguist/samples.yml' => Dir['samples/**/*'] do |f|
require 'linguist/sample' require 'linguist/samples'
File.open(f.name, 'w') { |io| Linguist::Sample.serialize_to_yaml(Linguist::Sample::DATA, io) } File.open(f.name, 'w') { |io| Linguist::Samples.serialize_to_yaml(Linguist::Samples::DATA, io) }
end end
CLOBBER.include 'lib/linguist/samples.yml' CLOBBER.include 'lib/linguist/samples.yml'
@@ -31,7 +31,7 @@ namespace :classifier do
next if file_language.nil? || file_language == 'Text' next if file_language.nil? || file_language == 'Text'
begin begin
data = open(file_url).read data = open(file_url).read
guessed_language, score = Linguist::Classifier.new(Sample::DATA).classify(data).first guessed_language, score = Linguist::Classifier.new(Samples::DATA).classify(data).first
total += 1 total += 1
guessed_language == file_language ? correct += 1 : incorrect += 1 guessed_language == file_language ? correct += 1 : incorrect += 1

View File

@@ -2,7 +2,7 @@ require 'linguist/classifier'
require 'linguist/language' require 'linguist/language'
require 'linguist/mime' require 'linguist/mime'
require 'linguist/pathname' require 'linguist/pathname'
require 'linguist/sample' require 'linguist/samples'
require 'charlock_holmes' require 'charlock_holmes'
require 'escape_utils' require 'escape_utils'
@@ -442,7 +442,7 @@ module Linguist
if Language.ambiguous?(extname) if Language.ambiguous?(extname)
possible_languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name) possible_languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name)
if possible_languages.any? if possible_languages.any?
if result = Classifier.new(Sample::DATA).classify(data, possible_languages).first if result = Classifier.new(Samples::DATA).classify(data, possible_languages).first
Language[result[0]] Language[result[0]]
end end
end end

View File

@@ -2,7 +2,7 @@ require 'escape_utils'
require 'pygments' require 'pygments'
require 'yaml' require 'yaml'
require 'linguist/sample' require 'linguist/samples'
module Linguist module Linguist
# Language names that are recognizable by GitHub. Defined languages # Language names that are recognizable by GitHub. Defined languages
@@ -441,8 +441,8 @@ module Linguist
end end
end end
extensions = Sample.extensions extensions = Samples.extensions
filenames = Sample.filenames filenames = Samples.filenames
popular = YAML.load_file(File.expand_path("../popular.yml", __FILE__)) popular = YAML.load_file(File.expand_path("../popular.yml", __FILE__))
YAML.load_file(File.expand_path("../languages.yml", __FILE__)).each do |name, options| YAML.load_file(File.expand_path("../languages.yml", __FILE__)).each do |name, options|

View File

@@ -3,7 +3,7 @@ require 'yaml'
module Linguist module Linguist
# Model for accessing classifier training data. # Model for accessing classifier training data.
module Sample module Samples
# Samples live in test/ for now, we'll eventually move them out # Samples live in test/ for now, we'll eventually move them out
PATH = File.expand_path("../../../samples", __FILE__) PATH = File.expand_path("../../../samples", __FILE__)

View File

@@ -1,5 +1,5 @@
require 'linguist/file_blob' require 'linguist/file_blob'
require 'linguist/sample' require 'linguist/samples'
require 'test/unit' require 'test/unit'
require 'mime/types' require 'mime/types'
@@ -275,7 +275,7 @@ class TestBlob < Test::Unit::TestCase
end end
def test_language def test_language
Sample.each do |sample| Samples.each do |sample|
blob = blob(sample[:path]) blob = blob(sample[:path])
language = Linguist::Language.find_by_alias(sample[:language]) language = Linguist::Language.find_by_alias(sample[:language])
assert_equal language, blob.language, blob.name assert_equal language, blob.language, blob.name

View File

@@ -1,6 +1,6 @@
require 'linguist/classifier' require 'linguist/classifier'
require 'linguist/language' require 'linguist/language'
require 'linguist/sample' require 'linguist/samples'
require 'linguist/tokenizer' require 'linguist/tokenizer'
require 'linguist/md5' require 'linguist/md5'
@@ -18,8 +18,8 @@ class TestClassifier < Test::Unit::TestCase
end end
def test_instance_freshness def test_instance_freshness
serialized = Linguist::MD5.hexdigest(Sample::DATA) serialized = Linguist::MD5.hexdigest(Samples::DATA)
latest = Linguist::MD5.hexdigest(Linguist::Sample.classifier.to_hash) latest = Linguist::MD5.hexdigest(Linguist::Samples.classifier.to_hash)
# Just warn, it shouldn't scare people off by breaking the build. # Just warn, it shouldn't scare people off by breaking the build.
if serialized != latest if serialized != latest
@@ -55,16 +55,16 @@ class TestClassifier < Test::Unit::TestCase
end end
def test_instance_classify_empty def test_instance_classify_empty
results = Classifier.new(Sample::DATA).classify("") results = Classifier.new(Samples::DATA).classify("")
assert results.first[1] < 0.5, results.first.inspect assert results.first[1] < 0.5, results.first.inspect
end end
def test_instance_classify_nil def test_instance_classify_nil
assert_equal [], Classifier.new(Sample::DATA).classify(nil) assert_equal [], Classifier.new(Samples::DATA).classify(nil)
end end
def test_verify def test_verify
data = Sample::DATA data = Samples::DATA
assert_equal data['languages_total'], data['languages'].inject(0) { |n, (_, c)| n += c } assert_equal data['languages_total'], data['languages'].inject(0) { |n, (_, c)| n += c }
assert_equal data['tokens_total'], data['language_tokens'].inject(0) { |n, (_, c)| n += c } assert_equal data['tokens_total'], data['language_tokens'].inject(0) { |n, (_, c)| n += c }
@@ -72,7 +72,7 @@ class TestClassifier < Test::Unit::TestCase
end end
def test_classify_ambiguous_languages def test_classify_ambiguous_languages
Sample.each do |sample| Samples.each do |sample|
language = Linguist::Language.find_by_alias(sample[:language]) language = Linguist::Language.find_by_alias(sample[:language])
next unless language.overrides.any? next unless language.overrides.any?
@@ -80,7 +80,7 @@ class TestClassifier < Test::Unit::TestCase
languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name) languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name)
next unless languages.length > 1 next unless languages.length > 1
results = Classifier.new(Sample::DATA).classify(File.read(sample[:path]), languages) results = Classifier.new(Samples::DATA).classify(File.read(sample[:path]), languages)
assert_equal language.name, results.first[0], "#{sample[:path]}\n#{results.inspect}" assert_equal language.name, results.first[0], "#{sample[:path]}\n#{results.inspect}"
end end
end end