# Specs for Licensee::ProjectFiles::LicenseFile: attribution parsing, content
# hashing, filename scoring, the extension/name regexes, Creative Commons
# false-positive detection, (L)GPL detection and copyright-only files.
RSpec.describe Licensee::ProjectFiles::LicenseFile do
  # Defaults shared by every example; nested contexts override `content`
  # and/or `filename` as needed.
  let(:filename) { 'LICENSE.txt' }
  let(:mit) { Licensee::License.find('mit') }
  let(:content) { sub_copyright_info(mit) }
  let(:content_hash) { '46cdc03462b9af57968df67b450cc4372ac41f53' }

  subject { described_class.new(content, filename) }

  it 'parses the attribution' do
    expect(subject.attribution).to eql('Copyright (c) 2016 Ben Balter')
  end

  context "when there's a random copyright-like line" do
    let(:content) { "Foo\nCopyright 2016 Ben Balter\nBar" }

    it "doesn't match" do
      expect(subject.attribution).to be_nil
    end
  end

  context 'with a non-UTF-8-encoded license' do
    # The raw bytes are tagged as windows-1251 instead of the default encoding.
    let(:content) { "\x91License\x93".force_encoding('windows-1251') }

    it "doesn't blow up" do
      expect(subject.attribution).to be_nil
    end
  end

  it 'creates the wordset' do
    expect(subject.wordset.count).to eql(91)
    expect(subject.wordset.first).to eql('permission')
  end

  it 'creates the hash' do
    expect(subject.content_hash).to eql(content_hash)
  end

  context 'filename scoring' do
    # Candidate filename => score expected from `.name_score`.
    # The block parameter is deliberately not called `filename`, so it cannot
    # be confused with the outer `let(:filename)`.
    {
      'license'            => 1.00,
      'LICENCE'            => 1.00,
      'unLICENSE'          => 1.00,
      'unlicence'          => 1.00,
      'license.md'         => 0.95,
      'LICENSE.md'         => 0.95,
      'license.txt'        => 0.95,
      'COPYING'            => 0.90,
      'copyRIGHT'          => 0.90,
      'COPYRIGHT.txt'      => 0.85,
      'copying.txt'        => 0.85,
      'LICENSE.php'        => 0.80,
      'LICENCE.docs'       => 0.80,
      'copying.image'      => 0.75,
      'COPYRIGHT.go'       => 0.75,
      'LICENSE-MIT'        => 0.70,
      'LICENSE_1_0.txt'    => 0.70,
      'COPYING-GPL'        => 0.65,
      'COPYRIGHT-BSD'      => 0.65,
      'MIT-LICENSE.txt'    => 0.60,
      'mit-license-foo.md' => 0.60,
      'OFL.md'             => 0.50,
      'ofl.textile'        => 0.45,
      'ofl'                => 0.40,
      'not-the-ofl'        => 0.00,
      'README.txt'         => 0.00
    }.each do |candidate, expected|
      context "a file named #{candidate}" do
        let(:score) { described_class.name_score(candidate) }

        it 'scores the file' do
          expect(score).to eql(expected)
        end
      end
    end

    context 'LGPL scoring' do
      # Candidate filename => score expected from `.lesser_gpl_score`.
      # Integers on purpose: `eql` does not treat 1 and 1.0 as equal.
      {
        'COPYING.lesser' => 1,
        'copying.lesser' => 1,
        'license.lesser' => 0,
        'LICENSE.md'     => 0,
        'FOO.md'         => 0
      }.each do |candidate, expected|
        context "a file named #{candidate}" do
          let(:score) { described_class.lesser_gpl_score(candidate) }

          it 'scores the file' do
            expect(score).to eql(expected)
          end
        end
      end
    end

    context 'preferred license regex' do
      %w[md markdown txt].each do |ext|
        it "matches .#{ext}" do
          expect(described_class::PREFERRED_EXT_REGEX).to match(".#{ext}")
        end
      end

      it 'does not match .md2' do
        expect(described_class::PREFERRED_EXT_REGEX).to_not match('.md2')
      end

      it 'does not match .md/foo' do
        expect(described_class::PREFERRED_EXT_REGEX).to_not match('.md/foo')
      end
    end

    context 'any extension regex' do
      it 'matches .foo' do
        expect(described_class::OTHER_EXT_REGEX).to match('.foo')
      end

      it 'does not match .md/foo' do
        expect(described_class::OTHER_EXT_REGEX).to_not match('.md/foo')
      end
    end

    context 'license regex' do
      %w[LICENSE licence unlicense LICENSE-MIT MIT-LICENSE].each do |license|
        it "matches #{license}" do
          expect(described_class::LICENSE_REGEX).to match(license)
        end
      end
    end

    context 'copying regex' do
      %w[COPYING copyright].each do |copying|
        it "matches #{copying}" do
          expect(described_class::COPYING_REGEX).to match(copying)
        end
      end
    end
  end

  context 'CC false positives' do
    let(:regex) { Licensee::ProjectFiles::LicenseFile::CC_FALSE_POSITIVE_REGEX }

    it "knows MIT isn't a potential false positive" do
      expect(subject.content).to_not match(regex)
      expect(subject).to_not be_a_potential_false_positive
    end

    context 'a CC false positive with creative commons in the title' do
      let(:content) { 'Creative Commons Attribution-NonCommercial 4.0' }

      it "knows it's a potential false positive" do
        expect(subject.content).to match(regex)
        expect(subject).to be_a_potential_false_positive
      end
    end

    context 'a CC false positive without creative commons in the title' do
      let(:content) { 'Attribution-NonCommercial 4.0 International' }

      it "knows it's a potential false positive" do
        expect(subject.content).to match(regex)
        expect(subject).to be_a_potential_false_positive
      end
    end

    context 'CC-BY-ND' do
      let(:content) { 'Attribution-NoDerivatives 4.0 International' }

      it "knows it's a potential false positive" do
        expect(subject.content).to match(regex)
        expect(subject).to be_a_potential_false_positive
      end
    end

    context 'CC-BY-NC with leading instructions' do
      # `<<-` only lets the terminator be indented; body lines are kept
      # verbatim, so the fixture text stays flush left.
      # NOTE(review): body indentation was reconstructed — confirm it matches
      # the intended fixture.
      let(:content) do
        <<-LICENSE
Creative Commons Corporation ("Creative Commons") is not a law firm
======================================================================
Creative Commons Attribution-NonCommercial 4.0
        LICENSE
      end

      it "knows it's a potential false positive" do
        expect(subject.content).to match(regex)
        expect(subject).to be_a_potential_false_positive
      end
    end
  end

  context 'LGPL' do
    let(:lgpl) { Licensee::License.find('lgpl-3.0') }
    let(:content) { sub_copyright_info(lgpl) }

    context 'with a COPYING.lesser file' do
      let(:filename) { 'COPYING.lesser' }

      it 'knows when a license file is LGPL' do
        expect(subject).to be_lgpl
      end

      context 'with non-lgpl content' do
        let(:content) { sub_copyright_info(mit) }

        it 'is not lgpl' do
          expect(subject).to_not be_lgpl
        end
      end
    end

    context 'with a different file name' do
      let(:filename) { 'COPYING' }

      it 'is not lgpl' do
        expect(subject).to_not be_lgpl
      end
    end
  end

  context 'GPL' do
    let(:gpl) { Licensee::License.find('gpl-3.0') }
    let(:content) { sub_copyright_info(gpl) }

    it "knows it's GPL" do
      expect(subject).to be_gpl
    end

    context 'another license' do
      let(:content) { sub_copyright_info(mit) }

      it 'is not GPL' do
        expect(subject).to_not be_gpl
      end
    end
  end

  context 'an unknown license' do
    let(:content) { 'foo' }
    let(:other) { Licensee::License.find('other') }

    it 'matches to other' do
      expect(subject.license).to eql(other)
    end
  end

  context 'copyright?' do
    # `copyright?` is invoked through `send`, bypassing method visibility.
    context 'a copyright file' do
      let(:content) { 'Copyright 2017 Ben Balter' }
      let(:filename) { 'COPYRIGHT.txt' }

      it "knows it's a copyright file" do
        expect(subject.send(:copyright?)).to be_truthy
      end
    end

    context 'A copyright file with license text' do
      # Only the filename is overridden; content is the top-level default
      # (`sub_copyright_info(mit)`).
      let(:filename) { 'COPYRIGHT.txt' }

      it "knows it's not a copyright file" do
        expect(subject.send(:copyright?)).to be_falsy
      end
    end

    context 'a license file with copyright text' do
      # Only the content is overridden; filename is the default 'LICENSE.txt'.
      let(:content) { 'Copyright 2017 Ben Balter' }

      it "knows it's not a copyright file" do
        expect(subject.send(:copyright?)).to be_falsy
      end
    end
  end
end