Mirror of https://github.com/KevinMidboe/linguist.git, synced 2025-10-29 17:50:22 +00:00
			
		
		
		
	Rename Sample -> Samples
This commit is contained in:
		
							
								
								
									
										6
									
								
								Rakefile
									
									
									
									
									
								
							
							
						
						
									
										6
									
								
								Rakefile
									
									
									
									
									
								
							| @@ -9,8 +9,8 @@ end | |||||||
|  |  | ||||||
|  |  | ||||||
| file 'lib/linguist/samples.yml' => Dir['samples/**/*'] do |f| | file 'lib/linguist/samples.yml' => Dir['samples/**/*'] do |f| | ||||||
|   require 'linguist/sample' |   require 'linguist/samples' | ||||||
|   File.open(f.name, 'w') { |io| Linguist::Sample.serialize_to_yaml(Linguist::Sample::DATA, io) } |   File.open(f.name, 'w') { |io| Linguist::Samples.serialize_to_yaml(Linguist::Samples::DATA, io) } | ||||||
| end | end | ||||||
|  |  | ||||||
| CLOBBER.include 'lib/linguist/samples.yml' | CLOBBER.include 'lib/linguist/samples.yml' | ||||||
| @@ -31,7 +31,7 @@ namespace :classifier do | |||||||
|       next if file_language.nil? || file_language == 'Text' |       next if file_language.nil? || file_language == 'Text' | ||||||
|       begin |       begin | ||||||
|         data = open(file_url).read |         data = open(file_url).read | ||||||
|         guessed_language, score = Linguist::Classifier.new(Sample::DATA).classify(data).first |         guessed_language, score = Linguist::Classifier.new(Samples::DATA).classify(data).first | ||||||
|  |  | ||||||
|         total += 1 |         total += 1 | ||||||
|         guessed_language == file_language ? correct += 1 : incorrect += 1 |         guessed_language == file_language ? correct += 1 : incorrect += 1 | ||||||
|   | |||||||
| @@ -2,7 +2,7 @@ require 'linguist/classifier' | |||||||
| require 'linguist/language' | require 'linguist/language' | ||||||
| require 'linguist/mime' | require 'linguist/mime' | ||||||
| require 'linguist/pathname' | require 'linguist/pathname' | ||||||
| require 'linguist/sample' | require 'linguist/samples' | ||||||
|  |  | ||||||
| require 'charlock_holmes' | require 'charlock_holmes' | ||||||
| require 'escape_utils' | require 'escape_utils' | ||||||
| @@ -442,7 +442,7 @@ module Linguist | |||||||
|       if Language.ambiguous?(extname) |       if Language.ambiguous?(extname) | ||||||
|         possible_languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name) |         possible_languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name) | ||||||
|         if possible_languages.any? |         if possible_languages.any? | ||||||
|           if result = Classifier.new(Sample::DATA).classify(data, possible_languages).first |           if result = Classifier.new(Samples::DATA).classify(data, possible_languages).first | ||||||
|             Language[result[0]] |             Language[result[0]] | ||||||
|           end |           end | ||||||
|         end |         end | ||||||
|   | |||||||
| @@ -2,7 +2,7 @@ require 'escape_utils' | |||||||
| require 'pygments' | require 'pygments' | ||||||
| require 'yaml' | require 'yaml' | ||||||
|  |  | ||||||
| require 'linguist/sample' | require 'linguist/samples' | ||||||
|  |  | ||||||
| module Linguist | module Linguist | ||||||
|   # Language names that are recognizable by GitHub. Defined languages |   # Language names that are recognizable by GitHub. Defined languages | ||||||
| @@ -441,8 +441,8 @@ module Linguist | |||||||
|     end |     end | ||||||
|   end |   end | ||||||
|  |  | ||||||
|   extensions = Sample.extensions |   extensions = Samples.extensions | ||||||
|   filenames = Sample.filenames |   filenames = Samples.filenames | ||||||
|   popular = YAML.load_file(File.expand_path("../popular.yml", __FILE__)) |   popular = YAML.load_file(File.expand_path("../popular.yml", __FILE__)) | ||||||
|  |  | ||||||
|   YAML.load_file(File.expand_path("../languages.yml", __FILE__)).each do |name, options| |   YAML.load_file(File.expand_path("../languages.yml", __FILE__)).each do |name, options| | ||||||
|   | |||||||
| @@ -3,7 +3,7 @@ require 'yaml' | |||||||
|  |  | ||||||
| module Linguist | module Linguist | ||||||
|   # Model for accessing classifier training data. |   # Model for accessing classifier training data. | ||||||
|   module Sample |   module Samples | ||||||
|     # Samples live in test/ for now, we'll eventually move them out |     # Samples live in test/ for now, we'll eventually move them out | ||||||
|     PATH = File.expand_path("../../../samples", __FILE__) |     PATH = File.expand_path("../../../samples", __FILE__) | ||||||
|  |  | ||||||
| @@ -1,5 +1,5 @@ | |||||||
| require 'linguist/file_blob' | require 'linguist/file_blob' | ||||||
| require 'linguist/sample' | require 'linguist/samples' | ||||||
|  |  | ||||||
| require 'test/unit' | require 'test/unit' | ||||||
| require 'mime/types' | require 'mime/types' | ||||||
| @@ -275,7 +275,7 @@ class TestBlob < Test::Unit::TestCase | |||||||
|   end |   end | ||||||
|  |  | ||||||
|   def test_language |   def test_language | ||||||
|     Sample.each do |sample| |     Samples.each do |sample| | ||||||
|       blob     = blob(sample[:path]) |       blob     = blob(sample[:path]) | ||||||
|       language = Linguist::Language.find_by_alias(sample[:language]) |       language = Linguist::Language.find_by_alias(sample[:language]) | ||||||
|       assert_equal language, blob.language, blob.name |       assert_equal language, blob.language, blob.name | ||||||
|   | |||||||
| @@ -1,6 +1,6 @@ | |||||||
| require 'linguist/classifier' | require 'linguist/classifier' | ||||||
| require 'linguist/language' | require 'linguist/language' | ||||||
| require 'linguist/sample' | require 'linguist/samples' | ||||||
| require 'linguist/tokenizer' | require 'linguist/tokenizer' | ||||||
| require 'linguist/md5' | require 'linguist/md5' | ||||||
|  |  | ||||||
| @@ -18,8 +18,8 @@ class TestClassifier < Test::Unit::TestCase | |||||||
|   end |   end | ||||||
|  |  | ||||||
|   def test_instance_freshness |   def test_instance_freshness | ||||||
|     serialized = Linguist::MD5.hexdigest(Sample::DATA) |     serialized = Linguist::MD5.hexdigest(Samples::DATA) | ||||||
|     latest     = Linguist::MD5.hexdigest(Linguist::Sample.classifier.to_hash) |     latest     = Linguist::MD5.hexdigest(Linguist::Samples.classifier.to_hash) | ||||||
|  |  | ||||||
|     # Just warn, it shouldn't scare people off by breaking the build. |     # Just warn, it shouldn't scare people off by breaking the build. | ||||||
|     if serialized != latest |     if serialized != latest | ||||||
| @@ -55,16 +55,16 @@ class TestClassifier < Test::Unit::TestCase | |||||||
|   end |   end | ||||||
|  |  | ||||||
|   def test_instance_classify_empty |   def test_instance_classify_empty | ||||||
|     results = Classifier.new(Sample::DATA).classify("") |     results = Classifier.new(Samples::DATA).classify("") | ||||||
|     assert results.first[1] < 0.5, results.first.inspect |     assert results.first[1] < 0.5, results.first.inspect | ||||||
|   end |   end | ||||||
|  |  | ||||||
|   def test_instance_classify_nil |   def test_instance_classify_nil | ||||||
|     assert_equal [], Classifier.new(Sample::DATA).classify(nil) |     assert_equal [], Classifier.new(Samples::DATA).classify(nil) | ||||||
|   end |   end | ||||||
|  |  | ||||||
|   def test_verify |   def test_verify | ||||||
|     data = Sample::DATA |     data = Samples::DATA | ||||||
|  |  | ||||||
|     assert_equal data['languages_total'], data['languages'].inject(0) { |n, (_, c)| n += c } |     assert_equal data['languages_total'], data['languages'].inject(0) { |n, (_, c)| n += c } | ||||||
|     assert_equal data['tokens_total'], data['language_tokens'].inject(0) { |n, (_, c)| n += c } |     assert_equal data['tokens_total'], data['language_tokens'].inject(0) { |n, (_, c)| n += c } | ||||||
| @@ -72,7 +72,7 @@ class TestClassifier < Test::Unit::TestCase | |||||||
|   end |   end | ||||||
|  |  | ||||||
|   def test_classify_ambiguous_languages |   def test_classify_ambiguous_languages | ||||||
|     Sample.each do |sample| |     Samples.each do |sample| | ||||||
|       language = Linguist::Language.find_by_alias(sample[:language]) |       language = Linguist::Language.find_by_alias(sample[:language]) | ||||||
|       next unless language.overrides.any? |       next unless language.overrides.any? | ||||||
|  |  | ||||||
| @@ -80,7 +80,7 @@ class TestClassifier < Test::Unit::TestCase | |||||||
|       languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name) |       languages = Language.all.select { |l| l.extensions.include?(extname) }.map(&:name) | ||||||
|       next unless languages.length > 1 |       next unless languages.length > 1 | ||||||
|  |  | ||||||
|       results = Classifier.new(Sample::DATA).classify(File.read(sample[:path]), languages) |       results = Classifier.new(Samples::DATA).classify(File.read(sample[:path]), languages) | ||||||
|       assert_equal language.name, results.first[0], "#{sample[:path]}\n#{results.inspect}" |       assert_equal language.name, results.first[0], "#{sample[:path]}\n#{results.inspect}" | ||||||
|     end |     end | ||||||
|   end |   end | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user