mirror of
				https://github.com/KevinMidboe/linguist.git
				synced 2025-10-29 17:50:22 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			88 lines
		
	
	
		
			3.1 KiB
		
	
	
	
		
			Ruby
		
	
	
	
	
	
			
		
		
	
	
			88 lines
		
	
	
		
			3.1 KiB
		
	
	
	
		
			Ruby
		
	
	
	
	
	
| require 'linguist/samples'
 | |
| require 'linguist/language'
 | |
| require 'tempfile'
 | |
| require 'yajl'
 | |
| require 'test/unit'
 | |
| 
 | |
| class TestSamples < Test::Unit::TestCase
 | |
|   include Linguist
 | |
| 
 | |
|   def test_up_to_date
 | |
|     assert serialized = Samples.cache
 | |
|     assert latest = Samples.data
 | |
| 
 | |
|     # Just warn, it shouldn't scare people off by breaking the build.
 | |
|     if serialized['md5'] != latest['md5']
 | |
|       warn "Samples database is out of date. Run `bundle exec rake samples`."
 | |
| 
 | |
|       expected = Tempfile.new('expected.json')
 | |
|       expected.write Yajl.dump(serialized, :pretty => true)
 | |
|       expected.close
 | |
| 
 | |
|       actual = Tempfile.new('actual.json')
 | |
|       actual.write Yajl.dump(latest, :pretty => true)
 | |
|       actual.close
 | |
| 
 | |
|       expected.unlink
 | |
|       actual.unlink
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   def test_verify
 | |
|     assert data = Samples.cache
 | |
| 
 | |
|     assert_equal data['languages_total'], data['languages'].inject(0) { |n, (_, c)| n += c }
 | |
|     assert_equal data['tokens_total'], data['language_tokens'].inject(0) { |n, (_, c)| n += c }
 | |
|     assert_equal data['tokens_total'], data['tokens'].inject(0) { |n, (_, ts)| n += ts.inject(0) { |m, (_, c)| m += c } }
 | |
|   end
 | |
| 
 | |
|   # Check that there aren't samples with extensions that aren't explicitly defined in languages.yml
 | |
|   def test_parity
 | |
|     extensions = Samples.cache['extnames']
 | |
|     languages_yml = File.expand_path("../../lib/linguist/languages.yml", __FILE__)
 | |
|     languages = YAML.load_file(languages_yml)
 | |
| 
 | |
|     languages.each do |name, options|
 | |
|       options['extensions'] ||= []
 | |
| 
 | |
|       if extnames = extensions[name]
 | |
|         extnames.each do |extname|
 | |
|           next if extname == '.script!'
 | |
|           assert options['extensions'].include?(extname), "#{name} has a sample with extension (#{extname}) that isn't explicitly defined in languages.yml"
 | |
|         end
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   # If a language extension isn't globally unique then make sure there are samples
 | |
|   Linguist::Language.all.each do |language|
 | |
|     define_method "test_#{language.name}_has_samples" do
 | |
|       language.all_extensions.each do |extension|
 | |
|         language_matches = Language.find_by_filename("foo#{extension}")
 | |
| 
 | |
|         # If there is more than one language match for a given extension
 | |
|         # then check that there are examples for that language with the extension
 | |
|         if language_matches.length > 1
 | |
|           language_matches.each do |language|
 | |
|             samples = "samples/#{language.name}/*#{extension}"
 | |
|             assert Dir.glob(samples).any?, "Missing samples in #{samples.inspect}. See https://github.com/github/linguist/blob/master/CONTRIBUTING.md"
 | |
|           end
 | |
|         end
 | |
|       end
 | |
| 
 | |
|       language.filenames.each do |filename|
 | |
|         # If there is more than one language match for a given filename
 | |
|         # then check that there are examples for that language with the extension
 | |
|         if Language.find_by_filename(filename).size > 1
 | |
|           sample = "samples/#{language.name}/filenames/#{filename}"
 | |
|           assert File.exists?(sample),
 | |
|             "Missing sample in #{sample.inspect}. See https://github.com/github/linguist/blob/master/CONTRIBUTING.md"
 | |
|         end
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   def assert_samples(language_matches, file_glob)
 | |
|   end
 | |
| end
 |