blob: c23ea758aa8d12e5d588322f73f61fe12e50fd49 [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
package license
import (
"fmt"
"io/fs"
"path/filepath"
"regexp"
"strings"
"sync"
"github.com/apache/skywalking-eyes/assets"
"github.com/apache/skywalking-eyes/internal/logger"
)
var licenseTemplatesDir = "lcs-templates"
var templatesDirs = []string{
licenseTemplatesDir,
// Some projects simply use the header text as their LICENSE content...
"header-templates",
}
var dualLicensePatterns = []*regexp.Regexp{
regexp.MustCompile(`(?i)This project is covered by two different licenses: (?P<license>[^.]+)`),
}
var normalizedTemplates = sync.Map{}
func init() {
wg := sync.WaitGroup{}
for _, dir := range templatesDirs {
files, err := assets.AssetDir(dir)
if err != nil {
logger.Log.Fatalln("Failed to read license template directory:", dir, err)
}
wg.Add(len(files))
for _, template := range files {
go loadTemplate(&wg, dir, template)
}
}
wg.Wait()
}
func loadTemplate(wg *sync.WaitGroup, dir string, template fs.DirEntry) {
defer wg.Done()
name := template.Name()
t, err := assets.Asset(filepath.Join(dir, name))
if err != nil {
logger.Log.Fatalln("Failed to read license template:", dir, err)
}
normalizedTemplates.Store(dir+"/"+name, Normalize(string(t)))
}
// Identify identifies the Spdx ID of the given license content
func Identify(pkgPath, content string) (string, error) {
for _, pattern := range dualLicensePatterns {
matches := pattern.FindStringSubmatch(content)
for i, name := range pattern.SubexpNames() {
if name == "license" && len(matches) >= i {
return matches[i], nil
}
}
}
content = Normalize(content)
logger.Log.Debugf("Normalized content for %+v:\n%+v\n", pkgPath, content)
result := make(chan string, 1)
normalizedTemplates.Range(func(key, value interface{}) bool {
name := key.(string)
license := value.(string)
// Should not use `Contains` as a root LICENSE file may include other licenses the project uses,
// `Contains` would identify the last one license as the project's license.
if strings.HasPrefix(content, license) {
name = filepath.Base(name)
result <- strings.TrimSuffix(name, filepath.Ext(name))
return false
}
return true
})
select {
case license := <-result:
return license, nil
default:
return "", fmt.Errorf("cannot identify license content")
}
}
// GetLicenseContent from license id
func GetLicenseContent(spdxID string) (string, error) {
res, err := assets.Asset(filepath.Join(licenseTemplatesDir, spdxID+".txt"))
if err != nil {
return "", err
}
return string(res), nil
}