-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathmetadata.go
351 lines (301 loc) · 10.7 KB
/
metadata.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
package ortfodb
import (
"fmt"
"io/fs"
"os"
"path/filepath"
"sort"
"strings"
"sync"
ll "github.com/ewen-lbh/label-logger-go"
"github.com/go-git/go-git/v5/plumbing/format/gitignore"
"github.com/metal3d/go-slugify"
"gopkg.in/yaml.v2"
)
type autodetectData struct {
// Name is only used for debug purposes
Name string
Files []string
ContentConditions []string
}
// Tag represents a category that can be assigned to a work. See https://ortfo.org/db/tags for more information.
type Tag struct {
// Singular-form name of the tag. For example, "Book".
Singular string `yaml:"singular"`
// Plural-form name of the tag. For example, "Books".
Plural string `yaml:"plural"`
Description string `yaml:"description,omitempty"`
// URL to a website where more information can be found about this tag.
LearnMoreAt string `yaml:"learn more at,omitempty" json:"learnMoreAt,omitempty"`
// Other singular-form names of tags that refer to this tag. The names mentionned here should not be used to define other tags.
Aliases []string `yaml:"aliases,omitempty"`
// Various ways to automatically detect that a work is tagged with this tag.
DetectConditions struct {
// Consider the work to be tagged with this tag if it contains any of the files specified here. Glob patterns are supported.
// Files are searched relative to the work's folder (even in Scattered mode, files are not searched relative to the .ortfo folder)
Files []string `yaml:"files,omitempty"`
// To be implemented
Search []string `yaml:"search,omitempty"`
// Consider the work to be tagged with this tag if it was made with any of the technologies specified here.
MadeWith []string `yaml:"made with,omitempty" json:"madeWith,omitempty"`
} `yaml:"detect,omitempty"`
}
func (t Tag) String() string {
return t.Singular
}
func (t Tag) DisplayName() string {
return t.Plural
}
func (t Tag) URLFriendlyName() string {
return slugify.Marshal(t.Singular, true)
}
func (t Tag) Detect(ctx *RunContext, workId string, techs []Technology) (bool, error) {
for _, tech := range t.DetectConditions.MadeWith {
for _, candidate := range techs {
if candidate.ReferredToBy(tech) {
return true, nil
}
}
}
return autodetectData{
Name: t.Singular,
ContentConditions: t.DetectConditions.Search,
Files: t.DetectConditions.Files,
}.Detect(ctx, workId)
}
// Technology represents a "technology" (in the very broad sense) that was used to create a work. See https://ortfo.org/db/technologies for more information.
type Technology struct {
// The slug is a unique identifier for this technology, that's suitable for use in a website's URL.
// For example, the page that shows all works using a technology with slug "a" could be at https://example.org/technologies/a.
Slug string `yaml:"slug"`
Name string `yaml:"name"`
// Name of the person or organization that created this technology.
By string `yaml:"by,omitempty"`
Description string `yaml:"description,omitempty"`
// URL to a website where more information can be found about this technology.
LearnMoreAt string `yaml:"learn more at,omitempty" json:"learnMoreAt,omitempty"`
// Other technology slugs that refer to this technology. The slugs mentionned here should not be used in the definition of other technologies.
Aliases []string `yaml:"aliases,omitempty"`
// Files contains a list of gitignore-style patterns. If the work contains any of the patterns specified, we consider that technology to be used in the work.
Files []string `yaml:"files,omitempty"`
// Autodetect contains an expression of the form 'CONTENT in PATH' where CONTENT is a free-form unquoted string and PATH is a filepath relative to the work folder.
// If CONTENT is found in PATH, we consider that technology to be used in the work.
Autodetect []string `yaml:"autodetect,omitempty"`
}
func (t Technology) String() string {
return t.Name
}
func (t Technology) DisplayName() string {
return t.Name
}
func (t Technology) URLFriendlyName() string {
return t.Slug
}
func (t Technology) Detect(ctx *RunContext, workId string) (bool, error) {
return autodetectData{
Name: t.Slug,
ContentConditions: t.Autodetect,
Files: t.Files,
}.Detect(ctx, workId)
}
// Detect returns true if this technology is detected as used in the work.
func (t autodetectData) Detect(ctx *RunContext, workId string) (matched bool, err error) {
// Match files
contentDetectionConditions := make(map[string][]string)
contentDetectionFiles := make([]string, 0)
for _, f := range t.ContentConditions {
parts := strings.Split(f, " in ")
if len(parts) != 2 {
return false, fmt.Errorf("invalid autodetect expression: %s", f)
}
content := parts[0]
path := parts[1]
contentDetectionFiles = append(contentDetectionFiles, path)
if _, ok := contentDetectionConditions[path]; !ok {
contentDetectionConditions[path] = []string{content}
} else {
contentDetectionConditions[path] = append(contentDetectionConditions[path], content)
}
}
ll.Debug("Starting auto-detect for %s: contentDetection map is %v", t, contentDetectionConditions)
for _, f := range append(t.Files, contentDetectionFiles...) {
_, isContentDetection := contentDetectionConditions[f]
ll.Debug("Auto-detecting %s in %s: %q: isContentDetection=%v", t, workId, f, isContentDetection)
pat := gitignore.ParsePattern(f, nil)
// Walk all files of the work folder (excl. hidden files unfortunately)
err = fs.WalkDir(os.DirFS(ctx.PathToWorkFolder(workId)), ".", func(path string, d fs.DirEntry, err error) error {
if err != nil {
return err
}
if filepath.Base(path) == "node_modules" {
return fs.SkipDir
}
if filepath.Base(path) == ".venv" {
return fs.SkipDir
}
pathFragments := make([]string, 0)
for _, fragment := range strings.Split(path, string(os.PathSeparator)) {
if fragment != "" {
pathFragments = append(pathFragments, fragment)
}
}
if isContentDetection {
if path != f {
return nil
}
contents, err := readFile(filepath.Join(ctx.PathToWorkFolder(workId), path))
if err != nil {
return fmt.Errorf("while reading contents of %s to check whether it contains one of %#v: %w", path, contentDetectionConditions[path], err)
}
for _, contentCondition := range contentDetectionConditions[path] {
if strings.Contains(contents, contentCondition) {
ll.Debug("Auto-detected %s in %s: condition %q in %q met", t, workId, contentCondition, path)
matched = true
return filepath.SkipAll
}
}
} else {
result := pat.Match(pathFragments, d.IsDir())
if result == gitignore.Exclude {
ll.Debug("Auto-detected %s in %s: filepattern %q matches %q", t, workId, f, path)
matched = true
return filepath.SkipAll
} else if result == gitignore.Include {
ll.Debug("Auto-detected %s in %s: filepattern %q matches %q", t, workId, f, path)
matched = false
return filepath.SkipAll
}
}
return nil
})
}
return
}
func (ctx *RunContext) DetectTechnologies(workId string) (detecteds []Technology, err error) {
results := make(chan Technology, len(ctx.TechnologiesRepository))
errs := make(chan error, len(ctx.TechnologiesRepository))
wg := sync.WaitGroup{}
for _, tech := range ctx.TechnologiesRepository {
wg.Add(1)
go func(tech Technology, results chan Technology, errors chan error, wg *sync.WaitGroup) {
matched, err := tech.Detect(ctx, workId)
if err != nil {
errors <- fmt.Errorf("while trying to detect %s: %w", tech, err)
}
if matched {
results <- tech
}
wg.Done()
}(tech, results, errs, &wg)
}
wg.Wait()
close(results)
close(errs)
for err := range errs {
if err != nil {
return detecteds, err
}
}
for tech := range results {
detecteds = append(detecteds, tech)
}
sort.Slice(detecteds, func(i, j int) bool {
return detecteds[i].Slug < detecteds[j].Slug
})
return
}
func (t Tag) ReferredToBy(name string) bool {
return stringsLooselyMatch(name, append(t.Aliases, t.Plural, t.Singular)...)
}
func (ctx *RunContext) FindTag(name string) (result Tag, ok bool) {
for _, tag := range ctx.TagsRepository {
if tag.ReferredToBy(name) {
return tag, true
}
}
return Tag{}, false
}
func (t Technology) ReferredToBy(name string) bool {
return stringsLooselyMatch(name, append(t.Aliases, t.Slug, t.Name)...)
}
func (ctx *RunContext) FindTechnology(name string) (result Technology, ok bool) {
for _, tech := range ctx.TechnologiesRepository {
if tech.ReferredToBy(name) {
return tech, true
}
}
return Technology{}, false
}
func (ctx *RunContext) DetectTags(workId string, techs []Technology) (detecteds []Tag, err error) {
results := make(chan Tag, len(ctx.TagsRepository))
errs := make(chan error, len(ctx.TagsRepository))
wg := sync.WaitGroup{}
for _, tag := range ctx.TagsRepository {
wg.Add(1)
go func(tag Tag, results chan Tag, errors chan error, wg *sync.WaitGroup) {
matched, err := tag.Detect(ctx, workId, techs)
if err != nil {
errors <- fmt.Errorf("while trying to detect %s: %w", tag, err)
}
if matched {
results <- tag
}
wg.Done()
}(tag, results, errs, &wg)
}
wg.Wait()
close(results)
close(errs)
for err := range errs {
if err != nil {
return detecteds, err
}
}
for tag := range results {
detecteds = append(detecteds, tag)
}
sort.Slice(detecteds, func(i, j int) bool {
return detecteds[i].Plural < detecteds[j].Plural
})
return
}
func (ctx *RunContext) LoadTagsRepository() ([]Tag, error) {
if len(ctx.TagsRepository) > 0 {
return ctx.TagsRepository, nil
}
var tags []Tag
if ctx.Config.Tags.Repository == "" {
ll.Warn("No tags repository specified in configuration at %s", ctx.Config.source)
return []Tag{}, nil
}
raw, err := readFileBytes(ctx.Config.Tags.Repository)
if err != nil {
return []Tag{}, fmt.Errorf("while reading %s: %w", ctx.Config.Tags.Repository, err)
}
err = yaml.Unmarshal(raw, &tags)
if err != nil {
return []Tag{}, fmt.Errorf("while decoding YAML: %w", err)
}
ctx.TagsRepository = tags
return tags, nil
}
func (ctx *RunContext) LoadTechnologiesRepository() ([]Technology, error) {
if len(ctx.TechnologiesRepository) > 0 {
return ctx.TechnologiesRepository, nil
}
var technologies []Technology
if ctx.Config.Technologies.Repository == "" {
ll.Warn("No technologies repository specified in configuration at %s", ctx.Config.source)
return []Technology{}, nil
}
raw, err := readFileBytes(ctx.Config.Technologies.Repository)
if err != nil {
return []Technology{}, fmt.Errorf("while reading %s: %w", ctx.Config.Technologies.Repository, err)
}
err = yaml.Unmarshal(raw, &technologies)
if err != nil {
return []Technology{}, fmt.Errorf("while decoding YAML: %w", err)
}
ctx.TechnologiesRepository = technologies
return technologies, nil
}