diff --git a/cmd/app/cmd.go b/cmd/app/cmd.go index 4399480a..512af7e5 100644 --- a/cmd/app/cmd.go +++ b/cmd/app/cmd.go @@ -6,6 +6,7 @@ import ( "io" "os" + "github.com/gardener/docforge/pkg/api" "github.com/gardener/docforge/pkg/hugo" "github.com/spf13/cobra" "k8s.io/klog/v2" @@ -37,13 +38,17 @@ func NewCommand(ctx context.Context, cancel context.CancelFunc) *cobra.Command { cmd := &cobra.Command{ Use: "docforge", Short: "Build documentation bundle", - Run: func(cmd *cobra.Command, args []string) { + RunE: func(cmd *cobra.Command, args []string) error { options := NewOptions(flags) doc := Manifest(flags.documentationManifestPath) - reactor := NewReactor(ctx, options) + if err := api.ValidateManifest(doc); err != nil { + return err + } + reactor := NewReactor(ctx, options, doc.Links) if err := reactor.Run(ctx, doc, flags.dryRun); err != nil { - klog.Errorf(err.Error()) + return err } + return nil }, } diff --git a/cmd/app/factory.go b/cmd/app/factory.go index 522217ef..3faba0ae 100644 --- a/cmd/app/factory.go +++ b/cmd/app/factory.go @@ -5,6 +5,7 @@ import ( "io" "path/filepath" + "github.com/gardener/docforge/pkg/api" "github.com/gardener/docforge/pkg/hugo" "github.com/gardener/docforge/pkg/metrics" "github.com/gardener/docforge/pkg/resourcehandlers" @@ -44,7 +45,7 @@ type Metering struct { } // NewReactor creates a Reactor from Options -func NewReactor(ctx context.Context, options *Options) *reactor.Reactor { +func NewReactor(ctx context.Context, options *Options, globalLinksCfg *api.Links) *reactor.Reactor { dryRunWriters := writers.NewDryRunWritersFactory(options.DryRunWriter) o := &reactor.Options{ MaxWorkersCount: options.MaxWorkersCount, @@ -59,6 +60,7 @@ func NewReactor(ctx context.Context, options *Options) *reactor.Reactor { ResourceHandlers: initResourceHandlers(ctx, options), DryRunWriter: dryRunWriters, Resolve: options.Resolve, + GlobalLinksConfig: globalLinksCfg, } if options.DryRunWriter != nil { o.Writer = dryRunWriters.GetWriter(options.DestinationPath) diff --git a/example/advanced/00.yaml b/example/advanced/00.yaml index abf6761b..6f1d75b9 100644 --- a/example/advanced/00.yaml +++ b/example/advanced/00.yaml @@ -1,69 +1,62 @@ -root: - name: doc +structure: + - name: doc nodes: - name: overview - contentSelectors: - - source: https://github.com/gardener/documentation/wiki/Architecture.md - - name: gardenlet - contentSelectors: - - source: https://github.com/gardener/gardener/blob/master/docs/concepts/gardenlet.md + source: https://github.com/gardener/documentation/wiki/Architecture.md + - source: https://github.com/gardener/gardener/blob/master/docs/concepts/gardenlet.md # linkSubstitutes define changes to links in documents.They apply to links and images # specified with markdown markup. - linksSubstitutes: + links: # The key in the mapping is an absolute form of a document link that will be # subject to transformation - "https://github.com/gardener/gardener/blob/master/docs/usage/shooted_seed.md": - # destination is the link reference URL. If it is empty string, - # the links markup is removed leaving only link text behind. - # For images, the entire markup is removed. - destination: "" - "https://kubernetes.io/docs/concepts/extend-kubernetes/operator/": - destination: "https://kubernetes.io/docs/concepts/extend-kubernetes/operator1111" - # text is a link text element (alt-text for images). Specifying text - # will change it to the new value. Empty string is valid only with - # `destination=""` - text: smooth operator - # title is the title element of a link or image. Specifying text - # will change it to the new value. - title: a title - # localityDomains can be specified on node level too. - # Node's localityDomain definitions override and amend global ones. - localityDomain: - github.com/gardener/gardener: - version: v1.11.1 - path: gardener/gardener - # exclude omits resources from path. You can - # also use include with the reverse semantics - exclude: - - example - # downloadSubstitutes is a list of regular expressions matching - # links to resources on documents that will be downloaded, mapped - # to name expressions tha define how the downloaded resources will - # named. - # There is a set of variables that can be used to construct the - # expressions: - # - $name: the original name of the resource - # - $path: the original path of the resource - # - $uuid: a UUID generated for the resource - # - $ext: a original resource extension - # The default expression applying to all resources is: $uuid.$ext - # Besides regular-expression-to-expression mappings it is possible - # to map exact URLs (escaped) to concrete names. - downloadSubstitutes: - "\\.(jpg|gif|png)": "$name-hires-$uuid.$ext" - - name: deploying-gardenlets - contentSelectors: - - source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet.md - - name: automatic-deployment - contentSelectors: - - source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet_automatically.md - - name: deploy-gardenlet-manually - contentSelectors: - - source: https://github.com/gardener/gardener/blob/2a33b26458dddd7ad09c4c3b2311d3391db890e7/docs/deployment/deploy_gardenlet_manually.md - - name: shooted-seeds - contentSelectors: - - source: https://github.com/gardener/gardener/blob/master/docs/usage/shooted_seed.md -localityDomain: - github.com/gardener/gardener: - version: v1.10.0 - path: gardener/gardener + rewrites: + github.com/gardener/gardener: + version: v1.11.1 + "https://github.com/gardener/gardener/blob/master/docs/usage/shooted_seed.md": + # destination is the link reference URL. If it is empty string, + # the links markup is removed leaving only link text behind. + # For images, the entire markup is removed. + destination: "" + "https://kubernetes.io/docs/concepts/extend-kubernetes/operator/": + destination: "https://kubernetes.io/docs/concepts/extend-kubernetes/operator1111" + # text is a link text element (alt-text for images). Specifying text + # will change it to the new value. Empty string is valid only with + # `destination=""` + text: smooth operator + # title is the title element of a link or image. Specifying text + # will change it to the new value. + title: a title + downloads: + # localityDomains can be specified on node level too. + # Node's localityDomain definitions override and amend global ones. + scope: + github.com/gardener/gardener: + version: v1.11.1 + # downloadSubstitutes is a list of regular expressions matching + # links to resources on documents that will be downloaded, mapped + # to name expressions tha define how the downloaded resources will + # named. + # There is a set of variables that can be used to construct the + # expressions: + # - $name: the original name of the resource + # - $path: the original path of the resource + # - $uuid: a UUID generated for the resource + # - $ext: a original resource extension + # The default expression applying to all resources is: $uuid.$ext + # Besides regular-expression-to-expression mappings it is possible + # to map exact URLs (escaped) to concrete names. + renames: + "\\.(jpg|gif|png)": "$name-hires-$uuid.$ext" + - source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet.md + - source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet_automatically.md + - source: https://github.com/gardener/gardener/blob/2a33b26458dddd7ad09c4c3b2311d3391db890e7/docs/deployment/deploy_gardenlet_manually.md + - source: https://github.com/gardener/gardener/blob/master/docs/usage/shooted_seed.md +links: + # The key in the mapping is an absolute form of a document link that will be + # subject to transformation + rewrites: + github.com/gardener/gardener: + version: v1.10.0 + downloads: + scope: + github.com/gardener/gardener: ~ \ No newline at end of file diff --git a/example/ns2.yaml b/example/ns2.yaml new file mode 100644 index 00000000..27b92968 --- /dev/null +++ b/example/ns2.yaml @@ -0,0 +1,35 @@ +structure: + - name: Deployments + nodes: + - name: 00-gardenlet_loioc60a1dffee014e2b89d30503cbcd6597.md + source: https://github.com/gardener/gardener/blob/master/docs/concepts/gardenlet.md + links: + rewrites: + gardener/gardener/(tree|blob): + version: v1.10.1 + downloads: + scope: + gardener/gardener/(tree|blob|raw)/v1.10.1/docs: + "gardenlet-architecture-detailed.png": "$name_loio7976e5f568284f2b9c5962f43052650d_LowRes$ext" + "gardenlet-architecture-similarities.png": "$name_loio1f6697e4b0b641e2a7ed438e949efe72_LowRes$ext" + - name: 00-10-deploying-gardenlets_loio694e6ebecdec48559b9dcfeef2a04cb8.md + source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet.md + - name: 00-20-automatic-deployment_loio43db0eed58974608a2f256959c95cd59.md + source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet_automatically.md + - name: 00-30-deploy-gardenlet-manually_loio40d2a0c019bf4ac986e237217f488f83.md + source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet_manually.md + - name: 10-shooted-seeds_loio16e32f722f284bc8ad77899c5b000779.md + source: https://github.com/gardener/gardener/blob/master/docs/usage/shooted_seed.md + - source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet_manually.md + - name: $name_$uuid$ext + source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet_manually.md +links: + rewrites: + gardener/gardener/(tree|blob): + version: v1.10.1 + (pulls|pull|issues|issue): + destination: "" + text: "" + downloads: + scope: + gardener/gardener/(tree|blob|raw)/v1.10.1/docs: ~ \ No newline at end of file diff --git a/example/simple/00.yaml b/example/simple/00.yaml index a41bb0ac..9d111f03 100644 --- a/example/simple/00.yaml +++ b/example/simple/00.yaml @@ -1,6 +1,6 @@ # The documentation structure root node. Mandatory. -root: - name: doc +structure: + - name: doc # nodeSelector is resolved to a node hierarchy, where nodes are selected # by criteria (criteria is not implemented yet, i.e no filters). nodesSelector: diff --git a/example/simple/01.yaml b/example/simple/01.yaml index 6b1be9bc..a1af9c8a 100644 --- a/example/simple/01.yaml +++ b/example/simple/01.yaml @@ -1,6 +1,6 @@ # The documentation structure root node. Mandatory. -root: - name: doc +structure: + - name: doc # nodeSelector is resolved to a node hierarchy, where nodes are selected # by criteria (criteria is not implemented yet, i.e no filters). nodesSelector: @@ -8,7 +8,7 @@ root: # generate a hierarchy. For GitHub paths that is a folder in a GitHub repo # and the generated nodes hierarchy corresponds ot the file/folder structure # available in the repository at that path. - path: https://github.com/gardener/gardener/tree/master/docs + path: https://github.com/gardener/gardener/tree/v1.11.1/docs # A list of child nodes to this structure node to form document structure hierarchy. # Note that if a nodeSelector is specified on this node, will be merged with other # existing nodes in `nodes`. Nodes with the same name will have their other properties @@ -16,26 +16,21 @@ root: # nodes. nodes: - name: aws_provider - # contentSelectors is a list of source selection specifications. - # Normally, there will be one but it is possible to specify several and - # they will be appended in that order. - contentSelectors: - # Source specifies location of document source. - # The supported sources as of now are GitHub repository documents and wiki pages. - - source: https://github.com/gardener/gardener-extension-provider-aws/blob/v1.13.0/docs/usage-as-end-user.md + # Source specifies location of document source. + # The supported sources as of now are GitHub repository documents and wiki pages. + source: https://github.com/gardener/gardener-extension-provider-aws/blob/v1.13.0/docs/usage-as-end-user.md # A localityDomain defines the scope of documentation structure "local" # resources that are downloaded along with structure's documents. -localityDomain: +links: # A locality domain. GFor GitHub it is in the form # // - github.com/gardener/gardener: - # The version, if specified, is applied to all links inside this domain. - # Document-local resources that will be downloaded (inside `path`), and - # links that will be absolute in this domain (github.com/gardener/gardener) - # will be rewritten with this version in their URLs. - version: v1.11.1 - # Path inside this domain that defines the scope of the "document-local" - # resources, which will be downloaded along with documents. - # If version is specified, the links used to download the resources are - # rewritten to match the version. - path: gardener/gardener/docs \ No newline at end of file + rewrites: + gardener/gardener/(blob|tree|raw): + # The version, if specified, is applied to all links inside this domain. + # Document-local resources that will be downloaded (inside `path`), and + # links that will be absolute in this domain (github.com/gardener/gardener) + # will be rewritten with this version in their URLs. + version: v1.11.1 + downloads: + scope: + gardener/gardener/(blob|raw)/v1.11.1/docs: ~ \ No newline at end of file diff --git a/pkg/api/nodes.go b/pkg/api/nodes.go index da87a61d..bebf05b1 100755 --- a/pkg/api/nodes.go +++ b/pkg/api/nodes.go @@ -142,38 +142,53 @@ func (n *Node) AddStats(s ...*Stat) { } } -// FindNodeByContentSource traverses up and then all around the +// FindNodeBySource traverses up and then all around the // tree paths in the node's documentation structure, looking for -// a node that has contentSource path nodeContentSource -func FindNodeByContentSource(nodeContentSource string, node *Node) *Node { +// a node that has the source string either in source, contentSelector +// or template +func FindNodeBySource(source string, node *Node) *Node { if node == nil { return nil } - - for _, contentSelector := range node.ContentSelectors { - if contentSelector.Source == nodeContentSource { - return node - } + if n := matchAnySource(source, node); n != nil { + return n } root := node.GetRootNode() if root == nil { root = node } - return withMatchinContentSelectorSource(nodeContentSource, root) + return withMatchinContentSelectorSource(source, root) } -func withMatchinContentSelectorSource(nodeContentSource string, node *Node) *Node { - if node == nil { - return nil +func matchAnySource(source string, node *Node) *Node { + if node.Source == source { + return node } for _, contentSelector := range node.ContentSelectors { - if contentSelector.Source == nodeContentSource { + if contentSelector.Source == source { return node } } + if t := node.Template; t != nil { + for _, contentSelector := range t.Sources { + if contentSelector.Source == source { + return node + } + } + } + return nil +} + +func withMatchinContentSelectorSource(source string, node *Node) *Node { + if node == nil { + return nil + } + if n := matchAnySource(source, node); n != nil { + return n + } for i := range node.Nodes { - foundNode := withMatchinContentSelectorSource(nodeContentSource, node.Nodes[i]) + foundNode := withMatchinContentSelectorSource(source, node.Nodes[i]) if foundNode != nil { return foundNode } diff --git a/pkg/api/parser_test.go b/pkg/api/parser_test.go index 643538a3..73df90e7 100755 --- a/pkg/api/parser_test.go +++ b/pkg/api/parser_test.go @@ -25,8 +25,8 @@ import ( ) var b = []byte(` -root: - name: root +structure: +- name: root nodes: - name: node_1 contentSelectors: @@ -36,20 +36,19 @@ root: - source: https://a.com properties: "custom_key": custom_value - localityDomain: - github.com/gardener/gardener: - exclude: - - a + links: + downloads: + scope: + github.com/gardener/gardener: ~ nodes: - name: subnode contentSelectors: - source: path/a -localityDomain: - github.com/gardener/gardener: - version: v1.10.0 - path: gardener/gardener/docs - LinkSubstitutes: - a: b +links: + rewrites: + github.com/gardener/gardener: + version: v1.10.0 + text: b `) func traverse(node *Node) { @@ -73,7 +72,9 @@ func TestParse(t *testing.T) { fmt.Println(err) return } - traverse(got.Root) + for _, n := range got.Structure { + traverse(n) + } // if got != c.want { // t.Errorf("Something(%q) == %q, want %q", c.in, got, c.want) // } @@ -87,23 +88,25 @@ func TestSerialize(t *testing.T) { }{ { &Documentation{ - Root: &Node{ - Title: "A Title", - Nodes: []*Node{ - { - Title: "node 1", - ContentSelectors: []ContentSelector{{Source: "path1/**"}}, - }, - { - Title: "path 2", - ContentSelectors: []ContentSelector{{Source: "https://a.com"}}, - Properties: map[string]interface{}{ - "custom_key": "custom_value", + Structure: []*Node{ + &Node{ + Name: "A Title", + Nodes: []*Node{ + { + Name: "node 1", + ContentSelectors: []ContentSelector{{Source: "path1/**"}}, }, - Nodes: []*Node{ - { - Title: "subnode", - ContentSelectors: []ContentSelector{{Source: "path/a"}}, + { + Name: "path 2", + ContentSelectors: []ContentSelector{{Source: "https://a.com"}}, + Properties: map[string]interface{}{ + "custom_key": "custom_value", + }, + Nodes: []*Node{ + { + Name: "subnode", + ContentSelectors: []ContentSelector{{Source: "path/a"}}, + }, }, }, }, @@ -128,22 +131,24 @@ func TestSerialize(t *testing.T) { func TestMe(t *testing.T) { d := &Documentation{ - Root: &Node{ - Name: "docs", - NodeSelector: &NodeSelector{ - Path: "https://github.com/gardener/gardener/tree/master/docs", - }, - Nodes: []*Node{ - { - Name: "calico", - NodeSelector: &NodeSelector{ - Path: "https://github.com/gardener/gardener-extension-networking-calico/tree/master/docs", - }, + Structure: []*Node{ + &Node{ + Name: "docs", + NodeSelector: &NodeSelector{ + Path: "https://github.com/gardener/gardener/tree/master/docs", }, - { - Name: "aws", - NodeSelector: &NodeSelector{ - Path: "https://github.com/gardener/gardener-extension-provider-aws/tree/master/docs", + Nodes: []*Node{ + { + Name: "calico", + NodeSelector: &NodeSelector{ + Path: "https://github.com/gardener/gardener-extension-networking-calico/tree/master/docs", + }, + }, + { + Name: "aws", + NodeSelector: &NodeSelector{ + Path: "https://github.com/gardener/gardener-extension-provider-aws/tree/master/docs", + }, }, }, }, @@ -164,45 +169,46 @@ func TestFile(t *testing.T) { got *Documentation ) expected := &Documentation{ - Root: &Node{ - Name: "00", - Nodes: []*Node{ - &Node{ - Name: "01", - ContentSelectors: []ContentSelector{ - ContentSelector{ - Source: "https://github.com/gardener/gardener/blob/master/docs/concepts/gardenlet.md", - }, - }, - LocalityDomain: &LocalityDomain{ - LocalityDomainMap: LocalityDomainMap{ - "github.com/gardener/gardener": &LocalityDomainValue{ - Version: "v1.11.1", - Path: "gardener/gardener", - LinksMatchers: LinksMatchers{ - Exclude: []string{ - "example", - }, + Structure: []*Node{ + &Node{ + Name: "00", + Nodes: []*Node{ + &Node{ + Name: "01", + Source: "https://github.com/gardener/gardener/blob/master/docs/concepts/gardenlet.md", + Links: &Links{ + Rewrites: map[string]*LinkRewriteRule{ + "github.com/gardener/gardener": &LinkRewriteRule{ + Version: "v1.11.1", + }, + }, + Downloads: &Downloads{ + Scope: map[string]ResourceRenameRules{ + "github.com/gardener/gardener": nil, }, }, }, }, - }, - &Node{ - Name: "02", - ContentSelectors: []ContentSelector{ - ContentSelector{ - Source: "https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet.md", + &Node{ + Name: "02", + ContentSelectors: []ContentSelector{ + ContentSelector{ + Source: "https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet.md", + }, }, }, }, }, }, - LocalityDomain: &LocalityDomain{ - LocalityDomainMap: LocalityDomainMap{ - "github.com/gardener/gardener": &LocalityDomainValue{ + Links: &Links{ + Rewrites: map[string]*LinkRewriteRule{ + "github.com/gardener/gardener": &LinkRewriteRule{ Version: "v1.10.0", - Path: "gardener/gardener", + }, + }, + Downloads: &Downloads{ + Scope: map[string]ResourceRenameRules{ + "github.com/gardener/gardener": nil, }, }, }, diff --git a/pkg/api/testdata/parse_test_00.yaml b/pkg/api/testdata/parse_test_00.yaml index 663f33d7..0b4d02f1 100644 --- a/pkg/api/testdata/parse_test_00.yaml +++ b/pkg/api/testdata/parse_test_00.yaml @@ -1,19 +1,22 @@ -root: - name: 00 +structure: +- name: 00 nodes: - name: 01 - contentSelectors: - - source: https://github.com/gardener/gardener/blob/master/docs/concepts/gardenlet.md - localityDomain: - github.com/gardener/gardener: - version: v1.11.1 - path: gardener/gardener - exclude: - - example + source: https://github.com/gardener/gardener/blob/master/docs/concepts/gardenlet.md + links: + rewrites: + "github.com/gardener/gardener": + version: v1.11.1 + downloads: + scope: + "github.com/gardener/gardener": ~ - name: 02 contentSelectors: - - source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet.md -localityDomain: - github.com/gardener/gardener: - version: v1.10.0 - path: gardener/gardener \ No newline at end of file + - source: https://github.com/gardener/gardener/blob/master/docs/deployment/deploy_gardenlet.md +links: + rewrites: + "github.com/gardener/gardener": + version: v1.10.0 + downloads: + scope: + "github.com/gardener/gardener": ~ \ No newline at end of file diff --git a/pkg/api/types.go b/pkg/api/types.go index 1dca0b84..1f9beef0 100644 --- a/pkg/api/types.go +++ b/pkg/api/types.go @@ -15,114 +15,123 @@ package api -// Documentation is a documentation structure that can be serialized and deserialized -// and parsed into a model supporting the tasks around building a concrete documentation -// bundle. +// Documentation models a manifest for building a documentation structure from various +// sources into a coherent bundle. type Documentation struct { - // Root is the root node of this documentation structure - Root *Node `yaml:"root"` - // Variables are a set of key-value entries, where the key is the variable name - // and the value is a node template. Nodes defined as variables can be resused - // by reference throughout the documentation structure to minimise duplicate - // node definitions. A reference to a variable is in the format `$variable-name`, - // where `variable-name` is a key in this Variables map structure. + // Structure defines a documentation structure hierarchy. // + // Optional, alternative to NodeSelector + Structure []*Node `yaml:"structure,omitempty"` + // NodesSelector is a specification for building a documentation structure hierarchy. + // The root of the hierarchy is a node generated for the resource at the nodeSelector's + // path. It is attached as single, direct descendant of this Documentation. + // NodesSelector on this level is useful in a scenario where the intended structure needs + // not to be modelled but complies with an existing hierarchy that can be resolved to + // a documentation structure. // Note: WiP - proposed, not implemented yet. - Variables map[string]*Node `yaml:"variables,omitempty"` - // LocalityDomain defines the scope of the downloadable resources - // for this structure - LocalityDomain *LocalityDomain `yaml:"localityDomain,omitempty"` + // + // Optional, alternative to Structure + NodeSelector *NodeSelector `yaml:"nodesSelector,omitempty"` + // Links defines global rules for processing document links + // + // Optional + Links *Links `yaml:"links,omitempty"` + // Variables are a set of key-value entries that allow manifests to be parameterized. + // When the manifest is resolved, variables values are interpolated throughout the text. + // + // Note: WiP - proposed, not implemented yet. + // Optional + Variables map[string]interface{} `yaml:"variables,omitempty"` } -// Node is a recursive, tree data structure representing documentation model. +// Node is a recursive, tree data structure representing documentation structure. +// A Node's descendents are its `nodes` array elements. +// A node without any of the options for content assignment - Source, ContentSlectors +// or Template is a container node, and is serialized as folder. If it has a content +// assignment property, it is a document node and is serialized as file. +// Document nodes have a nil Nodes property. type Node struct { - parent *Node - // Name is the name of this node. If omitted, the name is the resource name from - // Source as reported by an eligible ResourceHandler's Name() method. - // Node with multiple Source entries require name. + // Name is an identifying name for this node that will be used also for its serialization. + // Name cannot be omitted if this is a container node. + // Name can be omitted for document nodes only if the Source property is specified. In this + // case, the Name value is the resource name from the location specified in Source. + // A document node without Source requires Name. + // The Name value of a node with Source can be also an expression constructed from several + // variables: + // - $name: the original name of the resource provided by Source + // - $ext: the extension of the resource provided by Source. May be empty string if the + // resource has no extension. + // - $uuid: a UUID identifier generated and at disposal for each node. + // + // Mandatory if this is a container Node or Source is not specified, optional otherwise Name string `yaml:"name,omitempty"` - // A reference to the parent of this node, unless it is the root. Unexported and - // assigned internally when the node structure is resolved. Not marshalled. - // Title is the title for a node displayed to human users - Title string `yaml:"title,omitempty"` - // Source is a sequence of path specifications to locate the resources - // that represent this document node. There must be at minimum one. When - // they are multiple, the resulting document is an aggregation of the - // material located at each path. - // - // A source path specification entries are in the following format: - // `path[#{semantic-block-selector}]`, where: - // - `path` is a valid resource locator for a document. - // - `semantic-block-selector`is an expression that selects semantic block - // elements from the document similar to CSS selectors (Note: WiP - proposed, - // not implemented yet.). - // - // Examples: - // - A single file - // `source: ["path/a/b/c/file.md"]` - // - // - Two files in order to construct a new document - // `source: ["path1/a/b/c/file1.md", - // "path2/e/f/g/file2.md"]` - // - // - A file and the section under the first heading level 1 from another file - // in that order to construct a new document. - // Note: WiP - proposed, not implemented yet. - // `source: ["path1/a/b/c/file1.md", - // "path2/e/f/g/file2.md#{h1:first-of-type}"]` + // ContentSelectors is a sequence of specifications for selecting cotent for this node. + // The content provided by the list of ContentSelectors is aggregated into a single document. + // + // Mandatory when there is no Name property. Alternative to ContentSelectors and Template. Only + // one must be specified. + Source string `yaml:"source,omitempty"` + // ContentSelectors is a sequence of specifications for selecting cotent for this node. + // The content provided by the list of ContentSelectors is aggregated into a single document. + // Name is a required property when ContentSelectors are used to assign content to a node. + // + // Optional, alternative to ContentSelectors and Template. Only one of them must be specified. ContentSelectors []ContentSelector `yaml:"contentSelectors,omitempty"` - // Nodes is an array of nodes that are subnodes (children) of this node + // Template is a specification for content selection and its application to a template, the + // product of which is this document node's content. + // Name is a required property when Template are used to assign content to a node. + // + // Optional, alternative to ContentSelectors and Source. Only one of them must be specified. + Template *Template `yaml:"template,omitempty"` + // Nodes is a list of nodes that are descendants of this Node. This field is applicable + // only to container nodes and not to document nodes. + // A folder node must always have a Name. // // Note: For a non-strict alternative for specifying child nodes, refer to // `NodesSelector` + // Optional Nodes []*Node `yaml:"nodes,omitempty"` - // NodesSelector is a structure modeling an existing structure of documents at a - // location that can be further filtered by their metadata propertis and set as - // child nodes to this node. This is an alternative to explicitly setting child - // nodes structure resource paths with `Nodes`. + // NodesSelector is a specification for building a documentation structure hierarchy, + // descending from this node. The modelled structure is merged into this node's Nodes + // field, masshing it up with potentially explicitly defined descendants there. The merge + // strategy identifies identical nodes by their name and in this case performs a merge + // of their properties. Where there are conflicts, the explicitly defined node wins. + // A NodeSelector can coexist or be an alternative to an explicitly defined structure, + // depending on the goal. + // // Note: WiP - proposed, not implemented yet. + // Optional NodeSelector *NodeSelector `yaml:"nodesSelector,omitempty"` // Properties are a map of arbitrary, key-value pairs to model custom, - // untyped node properties. They could be used to instruct specific ResourceHandlers - // and the serialization of the Node. For example the properties member could be - // used to set the front-matter to markdowns for front-matter aware builders such - // as Hugo. + // untyped node properties. They can be used for various purposes. For example, + // specifying a "fronatmatter" property on a node will result in applying the value as + // front matter in the resulting document content. This si applicable only to document + // nodes. Properties map[string]interface{} `yaml:"properties,omitempty"` + // Links defines the rules for handling links in this node's content. Applicable only + // to document nodes. + Links *Links `yaml:"links,omitempty"` - *LocalityDomain `yaml:"localityDomain,omitempty"` - - // LinksSubstitutes is an optional map of links and their - // substitutions. Use it to override the default handling of those - // links in documents referenced by this node's contentSelector: - // - An empty substitution string ("") removes a link markdown. - // It leaves only its text component in the document for links - // and nothing for images. - // This applies only to markdown for links and images. - // - A fixed string that will replace the whole original link - // destination. - // The keys in the substitution map are matched against documents - // links as exact string matches. The document links are converted to - // their absolute form for the match - // TODO: update this doc - LinksSubstitutes LinkSubstitutes `yaml:"linksSubstitutes,omitempty"` - - stats []*Stat + // private fields + parent *Node + stats []*Stat } -// NodeSelector is an specification for selecting subnodes (children) for a node. +// NodeSelector is a specification for selecting a descending hierarchy for a node. // The order in which the documents are selected is not guaranteed. The interpreters // of NodeSelectors can make use of the resource metadata or other sources to construct -// and populate child Nodes dynamically. +// and populate descendent Nodes dynamically. // // Example: -// - Select all documents located at path/a/b/c that have front-matter property -// `type` with value `faq`: +// - Select recursively all documents located at path /a/b/c that have front-matter +// property `type` with value `faq`: +// ``` +// nodesSelector: { +// path: "path/a/b/c" +// frontMatter: +// "type:faq" +// } // ``` -// nodesSelector: { -// path: "path/a/b/c", -// annotation: "type:faq" -// } -// ``` // will select markdown documents located at path/a/b/c with front-matter: // --- // type: faq @@ -131,98 +140,202 @@ type Node struct { // Note: WiP - proposed, not implemented yet. type NodeSelector struct { // Path is a resource locator to a set of files, i.e. to a resource container. + // A node selector path defines the scope that will be used to + // generate a hierarchy. For GitHub paths that is a folder in a GitHub repo + // and the generated nodes hierarchy corresponds ot the file/folder structure + // available in the repository at that path. + // Without any further criteria, all nodes within path are included. + // + // Mandatory Path string `yaml:"path"` - // Depth a maximum depth of the recursion. If omitted or less than 0, the - // constraint is not considered - Depth int64 `yaml:"depth,omitempty"` - // Annotation is an optional expression, filtering documents located at `Path` + // ExcludePath is a set of exclusion rules for node candidates for the hierarchy. + // Each rule is a regular expression to match a node's path that is relative to the + // path element. + // Note: WiP - proposed, not implemented yet. + // + // Optional + ExcludePath []string `yaml:"excludePath,omitempty"` + // ExcludeFrontMatter is an optional expression, filtering documents located at `Path` // by their metadata properties. Markdown metadata is commonly provisioned as // `front-matter` block at the head of the document delimited by comment // tags (`---`). - Annotation string `yaml:"annotation,omitempty"` + // Documents with front matter that matches all map entries of this field + // are not selected. + // Note: WiP - proposed, not implemented yet. + // + // Optional + ExcludeFrontMatter map[string]interface{} `yaml:"excludeFrontMatter,omitempty"` + // FrontMatter is an optional expression, filtering documents located at `Path` + // by their metadata properties. Markdown metadata is commonly provisioned as + // `front-matter` block at the head of the document delimited by comment + // tags (`---`). + // Documents with front matter that matches all map entries of this field + // are selected. + // Note: WiP - proposed, not implemented yet. + // + // Optional + FrontMatter map[string]interface{} `yaml:"frontMatter,omitempty"` + // Depth a maximum depth of the recursion. If omitted or less than 0, the + // constraint is not considered + // + // Optional + Depth int64 `yaml:"depth,omitempty"` } // ContentSelector specifies a document node content target +// A ContentSelector specification +// that constitute this document node's content. There must be at minimum one. When +// they are multiple, the resulting document is an aggregation of the +// material located at each path. +// +// A ContentSelector specification entries are in the following format: +// `path[#{semantic-block-selector}]`, where: +// - `path` is a valid resource locator for a document. +// - `semantic-block-selector`is an expression that selects semantic block +// elements from the document similar to CSS selectors (Note: WiP - proposed, +// not implemented yet.). +// +// Examples: +// - A single file +// `source: ["path/a/b/c/file.md"]` +// +// - Two files in order to construct a new document +// `source: ["path1/a/b/c/file1.md", +// "path2/e/f/g/file2.md"]` +// +// - A file and the section under the first heading level 1 from another file +// in that order to construct a new document. +// Note: WiP - proposed, not implemented yet. +// `source: ["path1/a/b/c/file1.md", +// "path2/e/f/g/file2.md#{h1:first-of-type}"]` type ContentSelector struct { // URI of a document + // + // Mandatory Source string `yaml:"source,omitempty"` // Optional filtering expression that selects content from the document content - // Omiting this file will select the whole document content. + // Omiting this file will select the whole document content at Source. + // + // Optional Selector *string `yaml:"selector,omitempty"` } -// LinksMatchers defines links exclusion/inclusion patterns -type LinksMatchers struct { - // Include is a list of regular expressions that will be matched to every - // link that is candidate for download to determine whether it is - // eligible. The links to match are absolute. - // Include can be used in conjunction with Exclude when it is easier/ - // preferable to deny all resources and allow selectively. - // Include can be used in conjunction with localityDomain to add - // additional resources not in the domain. - Include []string `yaml:"include,omitempty"` - // Exclude is a list of regular expression that will be matched to every - // link that is candidate for download to determine whether it is - // not eligible. The links to match are absolute. - // Use Exclude to further constrain the set of downloaded resources - // that are in a locality domain. - Exclude []string `yaml:"exclude,omitempty"` +// Template specifies rules for selecting content and applying it +// to a template +type Template struct { + // Path to the template file. + // A template file content is valid Golang template content. + // See https://golang.org/pkg/text/template. + // The template will have at disposal the variables defined in + // this specification's Sources. Their values will be the content + // selected by the coresponding specifications. + // + // Mandatory + Path string `yaml:"path"` + // Sources maps variable names to ContentSelectors that will be + // used as specification for the content to fetch and assign ot that + // these variables + Sources map[string]*ContentSelector `yaml:"path,omitempty"` } -// LocalityDomain contains the entries defining a -// locality domain scope. Each entry is a mapping -// between a domain, such as github.com/gardener/gardener, -// and a path in it that defines "local" resources. -// Documents referenced by documentation node structure -// are always part of the locality domain. Other -// resources referenced by those documents are checked -// against the path hierarchy of locality domain -// entries to determine how they will be processed. -type LocalityDomain struct { - LocalityDomainMap `yaml:",inline"` - // DownloadSubstitutes is an optional map of resource names in this - // locality domain and their substitutions. Use it to override the - // default downloads naming: - // - An exact download name mapped to a download resource will be used - // to name that resources when downloaded. - // - An expression with substitution variables can be used - // to change the default pattern for generating downloaded resource - // names, which is $uuid. - // The supported variables are: - // - $name: the original name of the resource - // - $path: the original path of the resource in this domain (may be empty) - // - $uuid: the identifier generated f=or the downloaded resource - // - $ext: the extension of the original resource (may be "") - // Example expression: $name-$uuid - DownloadSubstitutes map[string]string `yaml:"downloadSubstitutes,omitempty"` +// Links defines how document links are processed. +type Links struct { + // Rewrites maps regular expressions matching a document links resolved to absolute, + // with link rewriting rules. + // A common use is to rewrite resources links versions, if they support that to have + // them downloaded at a particular state. + // A rewrite mapping an expression to nil rules (~) is interpreted as request to remove + // the links matching the expression. + Rewrites map[string]*LinkRewriteRule + // Downloads are definition for document referenced resources that will be downloaded + // in dedicated destination (__resources by default) and optionally renamed. + // Downloads are performed after rewrites. + Downloads *Downloads } -// LocalityDomainMap maps domains such as github.com/gardener/gardener -// to LocalityDomainValues -type LocalityDomainMap map[string]*LocalityDomainValue - -// LocalityDomainValue encapsulates the members of a -// LocalityDomain entry value -type LocalityDomainValue struct { - // Version sets the version of the resources that will - // be referenced in this domain. Download targets and - // absolute links in documents referenced by the structure - // will be rewritten to match this version - Version string `yaml:"version"` - // Path is the relative path inside a domain that contains - // resources considered 'local' that will be downloaded. - Path string `yaml:"path"` - LinksMatchers `yaml:",inline"` +// LinkRewriteRule si a rule definition specifying link properties to be rewritten. +type LinkRewriteRule struct { + // Rewrites the version of links matching this pattern, e.g. master -> v1.11.3. + // For GitHub links the version will rewrite the sha path segment in the URL + // right after organization, repository and resource type. + // Note that not every link supports version. For example GitHub issues + // links have different pattern and it has no sha segment. + // The version will be applied only where applicable. + Version string `yaml:"version,omitempty"` + // Rewrites the destination in a link|image markdown + // + // Example: + // with `destination: "github.tools.sap/kubernetes/gardener"` + // [a](github.com/gardener/gardener) -> [a](github.tools.sap/kubernetes/gardener) + // + // This setting overwrites a version setting if both exist so it makes little sense to use it + // with version. + // + // Note that destinations that are matched by a downloads specification will be converted to + // relative, using the result of the destination substitution. + // + // Setting destination to empty string leads to removing the link, leaving only the text element behind + // + // Example: + // with `destination: ""` [a](github.com/gardener/gardener) -> a + // + // Note that for images this will remove the image entirely: + // + // Example: + // with `destination: ""` ![alt-text-here](github.com/gardener/gardener/blob/master/images/b.png) -> + // + Destination *string `yaml:"destination,omitempty"` + // Rewrites or sets a matched link markdown's text component (alt-text for images) + // If used in combination with destination: "" and value "" this will effectively remove a link + // completely, leaving nothing behind in the document. + Text string `yaml:"text,omitempty"` + // Rewrites or sets a matched link markdown's title component. + // Note that this will have no effect with settings destination: "" and text: "" as the whole + // markdown together with tis title will be removed. + Title string `yaml:"title,omitempty"` } -// LinkSubstitutes is the mapping between absolute links -// and substitutions for them -type LinkSubstitutes map[string]*LinkSubstitute - -// LinkSubstitute comprises subtitutes for various link details -// commonly found in markup -type LinkSubstitute struct { - Text *string `yaml:"text,omitempty"` - Destination *string `yaml:"destination,omitempty"` - Title *string `yaml:"title,omitempty"` +// Downloads is a definition of the scope of downloadable resources and rules for renaming them. +type Downloads struct { + // Renames is a set of renaming rules that are globally applicable to all downloads + // regardless of scope. + // Example: + // renames: + // "\\.(jpg|gif|png)": "$name-hires-$uuid.$ext" + Renames ResourceRenameRules `yaml:"renames,omitempty"` + // Scope defines the scope for downloaded resources with a set of mappings between + // document links matching regular expressions and (optional) naming patterns. + // A scope map entry maps a regular expression that matches document links that will + // be downloaded to an optional rename specification or ~ for default. + // If no particular rename specification is supplied: + // 1. the globally supplied renames are tested to match and applied (if supplied) + // 2. a default rename expression `$uuid.$ext` will be applied to all matched targets. + // + // Example: define a download scope (only) that downloads every matching document. + // scope: + // gardener/gardener/(tree|blob|raw)/master/docs: ~ + // + // Example: define a download scope that downloads every matching document and + // renames it to a specific pattern if it is an jpg|gif|png image or uses the default + // naming pattern otherwise. + // scope: + // gardener/gardener/(tree|blob|raw)/master/docs: + // "\\.(jpg|gif|png)": "$name-image-$uuid.$ext" + Scope map[string]ResourceRenameRules `yaml:"scope,omitempty"` } + +// ResourceRenameRules defines a mapping between regular expressions matching +// resource locators and name pattern expressions or exact names. +// The name patter will be used to rename the downloaded resources matching the +// specified regular expression key. +// There is a set of variables that can be used to construct the +// naming expressions: +// - $name: the original name of the resource +// - $uuid: a UUID generated for the resource +// - $ext: a original resource extension +// The default expression applying to all resources is: $uuid.$ext +// +// Example: +// "\\.(jpg|gif|png)": "$name-image-$uuid.$ext" +// +type ResourceRenameRules map[string]string diff --git a/pkg/api/validate.go b/pkg/api/validate.go new file mode 100644 index 00000000..b50536b3 --- /dev/null +++ b/pkg/api/validate.go @@ -0,0 +1,66 @@ +package api + +import ( + "fmt" + "strings" + + "github.com/hashicorp/go-multierror" +) + +func ValidateManifest(manifest *Documentation) error { + var errs *multierror.Error + if manifest != nil { + if manifest.NodeSelector != nil && manifest.Structure != nil { + multierror.Append(errs, fmt.Errorf("nodeSelector and structure are mutually exclusive properties")) + } + if manifest.NodeSelector == nil && manifest.Structure == nil { + errs = multierror.Append(errs, fmt.Errorf("Either nodeSelector or structure must be present in a manifest")) + } + validateStructure(manifest.Structure, errs) + validateNodeSelector(manifest.NodeSelector, errs) + } + return errs.ErrorOrNil() +} + +func validateStructure(structure []*Node, errs *multierror.Error) { + for _, node := range structure { + validateNode(node, errs) + validateStructure(node.Nodes, errs) + } +} + +func validateNode(node *Node, errs *multierror.Error) { + if len(node.Name) == 0 { + if len(node.Nodes) != 0 || len(node.ContentSelectors) > 0 || node.Template != nil { + errs = multierror.Append(errs, fmt.Errorf("Expected property name != nil")) + } + } + if len(node.Name) > 0 && len(node.Source) > 0 { + if strings.Contains(node.Name, "$name") || strings.Contains(node.Name, "$uuid") || strings.Contains(node.Name, "$ext") { + multierror.Append(errs, fmt.Errorf("name variables are supported only together with source property: %s", node.Name)) + } + } + if len(node.Nodes) != 0 && len(node.ContentSelectors) > 0 { + multierror.Append(errs, fmt.Errorf("nodes and contentSelectors are mutually exclusive properties")) + } + if len(node.Nodes) != 0 && len(node.Source) > 0 { + multierror.Append(errs, fmt.Errorf("nodes and source are mutually exclusive properties")) + } + if len(node.Nodes) != 0 && node.Template != nil { + multierror.Append(errs, fmt.Errorf("nodes and template are mutually exclusive properties")) + } + validateNodeSelector(node.NodeSelector, errs) + validateLinks(node.Links, errs) +} + +func validateNodeSelector(ns *NodeSelector, errs *multierror.Error) { + if ns != nil { + // TODO: implement me + } +} + +func validateLinks(links *Links, errs *multierror.Error) { + if links != nil { + // TODO: implement me + } +} diff --git a/pkg/reactor/build.go b/pkg/reactor/build.go index 308e18f8..ddaf4306 100644 --- a/pkg/reactor/build.go +++ b/pkg/reactor/build.go @@ -8,21 +8,20 @@ import ( "k8s.io/klog/v2" ) -func tasks(node *api.Node, t *[]interface{}) { - n := node - *t = append(*t, &DocumentWorkTask{ - Node: n, - }) - if node.Nodes != nil { - for _, n := range node.Nodes { - tasks(n, t) +func tasks(nodes []*api.Node, t *[]interface{}) { + for _, node := range nodes { + *t = append(*t, &DocumentWorkTask{ + Node: node, + }) + if node.Nodes != nil { + tasks(node.Nodes, t) } } } // Build starts the build operation for a document structure root // in a locality domain -func (r *Reactor) Build(ctx context.Context, documentationRoot *api.Node, localityDomain *localityDomain) error { +func (r *Reactor) Build(ctx context.Context, documentationStructure []*api.Node) error { var errors *multierror.Error errCh := make(chan error) @@ -45,7 +44,7 @@ func (r *Reactor) Build(ctx context.Context, documentationRoot *api.Node, locali r.DownloadController.Start(ctx, errCh, downloadShutdownCh) }() // start document controller with download scope - r.DocController.SetDownloadScope(localityDomain) + // r.DocController.SetDownloadScope(localityDomain) go func() { klog.V(6).Infoln("Starting document controller") r.DocController.Start(ctx, errCh, documentShutdownCh) @@ -78,7 +77,7 @@ func (r *Reactor) Build(ctx context.Context, documentationRoot *api.Node, locali // to exit when ready go func() { documentPullTasks := make([]interface{}, 0) - tasks(documentationRoot, &documentPullTasks) + tasks(documentationStructure, &documentPullTasks) for _, task := range documentPullTasks { r.DocController.Enqueue(ctx, task) } diff --git a/pkg/reactor/build_test.go b/pkg/reactor/build_test.go index 0035f47e..2f1f353c 100644 --- a/pkg/reactor/build_test.go +++ b/pkg/reactor/build_test.go @@ -12,7 +12,7 @@ func Test_tasks(t *testing.T) { type args struct { node *api.Node tasks []interface{} - lds localityDomain + // lds localityDomain } tests := []struct { name string @@ -22,12 +22,12 @@ func Test_tasks(t *testing.T) { { name: "it creates tasks based on the provided doc", args: args{ - node: newDoc.Root, + node: newDoc.Structure[0], tasks: []interface{}{}, }, expectedTasks: []*DocumentWorkTask{ { - Node: newDoc.Root, + Node: newDoc.Structure[0], }, { Node: archNode, @@ -47,7 +47,7 @@ func Test_tasks(t *testing.T) { for _, tc := range tests { t.Run(tc.name, func(t *testing.T) { rhs := resourcehandlers.NewRegistry(&FakeResourceHandler{}) - tasks(tc.args.node, &tc.args.tasks) + tasks([]*api.Node{tc.args.node}, &tc.args.tasks) if len(tc.args.tasks) != len(tc.expectedTasks) { t.Errorf("expected number of tasks %d != %d", len(tc.expectedTasks), len(tc.args.tasks)) diff --git a/pkg/reactor/content_processor.go b/pkg/reactor/content_processor.go index 361d704e..a2259721 100644 --- a/pkg/reactor/content_processor.go +++ b/pkg/reactor/content_processor.go @@ -28,9 +28,10 @@ var ( // NodeContentProcessor operates on documents content to reconcile links and // schedule linked resources downloads type NodeContentProcessor struct { - resourceAbsLinks map[string]string - rwlock sync.RWMutex - localityDomain *localityDomain + resourceAbsLinks map[string]string + rwlock sync.RWMutex + globalLinksConfig *api.Links + // localityDomain *localityDomain // ResourcesRoot specifies the root location for downloaded resource. // It is used to rewrite resource links in documents to relative paths. resourcesRoot string @@ -42,15 +43,15 @@ type NodeContentProcessor struct { } // NewNodeContentProcessor creates NodeContentProcessor objects -func NewNodeContentProcessor(resourcesRoot string, ld *localityDomain, downloadJob DownloadController, failFast bool, markdownFmt bool, rewriteEmbedded bool, resourceHandlers resourcehandlers.Registry) *NodeContentProcessor { - if ld == nil { - ld = &localityDomain{ - mapping: map[string]*localityDomainValue{}, - } - } +func NewNodeContentProcessor(resourcesRoot string, globalLinksConfig *api.Links, downloadJob DownloadController, failFast bool, markdownFmt bool, rewriteEmbedded bool, resourceHandlers resourcehandlers.Registry) *NodeContentProcessor { + // if ld == nil { + // ld = &localityDomain{ + // mapping: map[string]*localityDomainValue{}, + // } + // } c := &NodeContentProcessor{ resourceAbsLinks: make(map[string]string), - localityDomain: ld, + globalLinksConfig: globalLinksConfig, resourcesRoot: resourcesRoot, DownloadController: downloadJob, failFast: failFast, @@ -100,10 +101,9 @@ func (c *NodeContentProcessor) reconcileMDLinks(ctx context.Context, docNode *ap var errors *multierror.Error contentBytes, _ = markdown.UpdateLinkRefs(contentBytes, func(markdownType markdown.Type, destination, text, title []byte) ([]byte, []byte, []byte, error) { var ( - _destination string - _text, _title *string - download *Download - err error + _destination, _text, _title string + download *Download + err error ) if _destination, _text, _title, download, err = c.resolveLink(ctx, docNode, string(destination), contentSourcePath); err != nil { errors = multierror.Append(err) @@ -128,11 +128,11 @@ func (c *NodeContentProcessor) reconcileMDLinks(ctx context.Context, docNode *ap if download != nil { c.schedule(ctx, download, contentSourcePath) } - if _text != nil { - text = []byte(*_text) + if len(_text) > 0 { + text = []byte(_text) } - if _title != nil { - title = []byte(*_title) + if len(_title) > 0 { + title = []byte(_title) } if len(_destination) < 1 { return nil, text, title, nil @@ -187,19 +187,19 @@ type Download struct { } // returns destination, text (alt-text for images), title, download(url, downloadName), err -func (c *NodeContentProcessor) resolveLink(ctx context.Context, node *api.Node, destination string, contentSourcePath string) (string, *string, *string, *Download, error) { +func (c *NodeContentProcessor) resolveLink(ctx context.Context, node *api.Node, destination string, contentSourcePath string) (string, string, string, *Download, error) { var ( - text, title, substituteDestination *string - hasSubstition bool - inLD bool - absLink string + substituteDestination *string + version, text, title, downloadResourceName, absLink string + ok bool + globalRewrites map[string]*api.LinkRewriteRule ) if strings.HasPrefix(destination, "#") || strings.HasPrefix(destination, "mailto:") { - return destination, nil, nil, nil, nil + return destination, "", "", nil, nil } // validate destination - u, err := url.Parse(destination) + u, err := urls.Parse(destination) if err != nil { return "", text, title, nil, err } @@ -208,7 +208,7 @@ func (c *NodeContentProcessor) resolveLink(ctx context.Context, node *api.Node, // It's a valid absolute link that is not in our scope. Leave it be. return destination, text, title, nil, err } - + //convert relative links to absolute handler := c.ResourceHandlers.Get(contentSourcePath) if handler == nil { return destination, text, title, nil, nil @@ -218,55 +218,64 @@ func (c *NodeContentProcessor) resolveLink(ctx context.Context, node *api.Node, return "", text, title, nil, err } - if hasSubstition, substituteDestination, text, title = substitute(absLink, node); hasSubstition && substituteDestination != nil { - if len(*substituteDestination) == 0 { - // quit early. substitution is a request to remove this link - return "", text, title, nil, nil + // rewrite link if required + if gLinks := c.globalLinksConfig; gLinks != nil { + globalRewrites = gLinks.Rewrites + } + _a := absLink + if version, substituteDestination, text, title, ok = MatchForLinkRewrite(absLink, node, globalRewrites); ok { + if substituteDestination != nil { + if len(*substituteDestination) == 0 { + // quit early. substitution is a request to remove this link + return "", text, title, nil, nil + } + absLink = *substituteDestination + } + if len(version) > 0 { + handler := c.ResourceHandlers.Get(absLink) + if handler == nil { + return absLink, text, title, nil, nil + } + if absLink, err = handler.SetVersion(absLink, version); err != nil { + klog.Warningf("Failed to set version %s to %s: %s\n", version, absLink, err.Error()) + return absLink, text, title, nil, nil + } } - absLink = *substituteDestination } - //TODO: this is URI-specific (URLs only) - fixme - u, err = url.Parse(absLink) + u, err = urls.Parse(absLink) if err != nil { return "", text, title, nil, err } - _a := absLink - - resolvedLD := c.localityDomain - if node != nil { - resolvedLD = resolveLocalityDomain(node, c.localityDomain) - } - if resolvedLD != nil { - absLink, inLD = resolvedLD.MatchPathInLocality(absLink, c.ResourceHandlers) - } if _a != absLink { - klog.V(6).Infof("[%s] Link converted %s -> %s\n", contentSourcePath, _a, absLink) + klog.V(6).Infof("[%s] Link rewritten %s -> %s\n", contentSourcePath, _a, absLink) } + // Links to other documents are enforced relative when // linking documents from the node structure. // Links to other documents are changed to match the linking // document version when appropriate or left untouched. - if strings.HasSuffix(u.Path, ".md") { - //TODO: this is URI-specific (URLs only) - fixme - l := strings.TrimSuffix(absLink, "?") - l = strings.TrimSuffix(l, "#") - if existingNode := api.FindNodeByContentSource(l, node); existingNode != nil { + if u.Extension == "md" { + if existingNode := api.FindNodeBySource(absLink, node); existingNode != nil { relPathBetweenNodes := node.RelativePath(existingNode) if destination != relPathBetweenNodes { klog.V(6).Infof("[%s] %s -> %s\n", contentSourcePath, destination, relPathBetweenNodes) } - destination = relPathBetweenNodes - return destination, text, title, nil, nil + return relPathBetweenNodes, text, title, nil, nil } return absLink, text, title, nil, nil } + // Note: ignores global rules for now // Links to resources are assessed for download eligibility // and if applicable their destination is updated as relative // path to predefined location for resources - if absLink != "" && inLD { - resourceName := c.generateResourceName(absLink, resolvedLD) + var globalDownloadsConfig *api.Downloads + if c.globalLinksConfig != nil { + globalDownloadsConfig = c.globalLinksConfig.Downloads + } + if ok, downloadResourceName = MatchForDownload(u, node, globalDownloadsConfig); ok { + resourceName := c.getResourceName(u, downloadResourceName) _d := destination destination = buildDestination(node, resourceName, c.resourcesRoot) if _d != destination { @@ -323,42 +332,39 @@ func buildDestination(node *api.Node, resourceName, root string) string { return resourceRelPath } -func (c *NodeContentProcessor) generateResourceName(absURL string, resolvedLD *localityDomain) string { - var ( - ok bool - resourceName string - ) - u, _ := urls.Parse(absURL) +// Check for cached resource name first and return that if found. Otherwise, +// return the downloadName +func (c *NodeContentProcessor) getResourceName(u *urls.URL, downloadName string) string { c.rwlock.Lock() defer c.rwlock.Unlock() - if resourceName, ok = c.resourceAbsLinks[u.Path]; !ok { - resourceName = u.ResourceName - if len(u.Extension) > 0 { - resourceName = fmt.Sprintf("%s.%s", u.ResourceName, u.Extension) - } - resourceName = resolvedLD.GetDownloadedResourceName(u) - c.resourceAbsLinks[absURL] = resourceName + if cachedDownloadName, ok := c.resourceAbsLinks[u.Path]; ok { + return cachedDownloadName } - return resourceName + return downloadName } // returns substitution found, destination, text, title -func substitute(absLink string, node *api.Node) (ok bool, destination *string, text *string, title *string) { - if node == nil { - return false, nil, nil, nil - } - if substitutes := node.LinksSubstitutes; substitutes != nil { - for substituteK, substituteV := range substitutes { - // remove trailing slashes to avoid inequality only due to that - l := strings.TrimSuffix(absLink, "/") - s := strings.TrimSuffix(substituteK, "/") - if s == l { - return true, substituteV.Destination, substituteV.Text, substituteV.Title - } - } - } - return false, nil, nil, nil -} +// func rewrite(absLink string, node *api.Node) (ok bool, version string, destination *string, text string, title string) { +// if node == nil { +// return false, "", nil, "", "" +// } +// if links := node.Links; links != nil && len(links.Rewrites) > 0 { +// for expr, rule := range links.Rewrites { +// var ( +// regex *regexp.Regexp +// err error +// ) +// if regex, err = regexp.Compile(expr); err != nil { +// klog.Warningf("invalid link rewrite expression: %s, %s", expr, err.Error()) +// continue +// } +// if regex.Match([]byte(absLink)) { +// return true, rule.Version, rule.Destination, rule.Text, rule.Title +// } +// } +// } +// return false, "", nil, "", "" +// } // recordLinkStats records link stats for a node func recordLinkStats(node *api.Node, title, details string) { diff --git a/pkg/reactor/content_processor_test.go b/pkg/reactor/content_processor_test.go index 4957aec2..772f9efc 100644 --- a/pkg/reactor/content_processor_test.go +++ b/pkg/reactor/content_processor_test.go @@ -8,7 +8,6 @@ import ( "github.com/gardener/docforge/pkg/api" "github.com/gardener/docforge/pkg/resourcehandlers" "github.com/gardener/docforge/pkg/resourcehandlers/github" - "github.com/stretchr/testify/assert" ) func Test_processLink(t *testing.T) { @@ -105,16 +104,16 @@ func Test_processLink(t *testing.T) { wantResourceName: "", wantErr: nil, mutate: func(c *NodeContentProcessor) { - c.localityDomain = &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/gardener/gardener": &localityDomainValue{ - "v1.10.0", - "gardener/gardener/docs", - nil, - nil, - }, - }, - } + // c.localityDomain = &localityDomain{ + // mapping: map[string]*localityDomainValue{ + // "github.com/gardener/gardener": &localityDomainValue{ + // "v1.10.0", + // "gardener/gardener/docs", + // nil, + // nil, + // }, + // }, + // } }, }, { @@ -159,16 +158,16 @@ func Test_processLink(t *testing.T) { wantResourceName: "", wantErr: nil, mutate: func(c *NodeContentProcessor) { - c.localityDomain = &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/gardener/gardener": &localityDomainValue{ - "v1.10.0", - "gardener/gardener/docs", - nil, - nil, - }, - }, - } + // c.localityDomain = &localityDomain{ + // mapping: map[string]*localityDomainValue{ + // "github.com/gardener/gardener": &localityDomainValue{ + // "v1.10.0", + // "gardener/gardener/docs", + // nil, + // nil, + // }, + // }, + // } }, }, // links to documents @@ -192,16 +191,16 @@ func Test_processLink(t *testing.T) { wantResourceName: "", wantErr: nil, mutate: func(c *NodeContentProcessor) { - c.localityDomain = &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/gardener/gardener": &localityDomainValue{ - "v1.10.0", - "gardener/gardener/docs", - nil, - nil, - }, - }, - } + // c.localityDomain = &localityDomain{ + // mapping: map[string]*localityDomainValue{ + // "github.com/gardener/gardener": &localityDomainValue{ + // "v1.10.0", + // "gardener/gardener/docs", + // nil, + // nil, + // }, + // }, + // } }, }, { @@ -224,16 +223,16 @@ func Test_processLink(t *testing.T) { wantResourceName: "", wantErr: nil, mutate: func(c *NodeContentProcessor) { - c.localityDomain = &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/gardener/gardener": &localityDomainValue{ - "v1.10.0", - "gardener/gardener/docs", - nil, - nil, - }, - }, - } + // c.localityDomain = &localityDomain{ + // mapping: map[string]*localityDomainValue{ + // "github.com/gardener/gardener": &localityDomainValue{ + // "v1.10.0", + // "gardener/gardener/docs", + // nil, + // nil, + // }, + // }, + // } }, }, // Version rewrite @@ -247,16 +246,16 @@ func Test_processLink(t *testing.T) { wantResourceName: "", wantErr: nil, mutate: func(c *NodeContentProcessor) { - c.localityDomain = &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/gardener/gardener": &localityDomainValue{ - "v1.10.0", - "gardener/gardener/docs", - nil, - nil, - }, - }, - } + // c.localityDomain = &localityDomain{ + // mapping: map[string]*localityDomainValue{ + // "github.com/gardener/gardener": &localityDomainValue{ + // "v1.10.0", + // "gardener/gardener/docs", + // nil, + // nil, + // }, + // }, + // } }, }, { @@ -269,16 +268,16 @@ func Test_processLink(t *testing.T) { wantResourceName: "", wantErr: nil, mutate: func(c *NodeContentProcessor) { - c.localityDomain = &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/gardener/gardener": &localityDomainValue{ - "v1.10.0", - "gardener/gardener/docs", - nil, - nil, - }, - }, - } + // c.localityDomain = &localityDomain{ + // mapping: map[string]*localityDomainValue{ + // "github.com/gardener/gardener": &localityDomainValue{ + // "v1.10.0", + // "gardener/gardener/docs", + // nil, + // nil, + // }, + // }, + // } }, }, } @@ -286,9 +285,9 @@ func Test_processLink(t *testing.T) { t.Run(tt.name, func(t *testing.T) { c := &NodeContentProcessor{ resourceAbsLinks: make(map[string]string), - localityDomain: &localityDomain{ - mapping: map[string]*localityDomainValue{}, - }, + // localityDomain: &localityDomain{ + // mapping: map[string]*localityDomainValue{}, + // }, resourcesRoot: "/__resources", ResourceHandlers: resourcehandlers.NewRegistry(github.NewResourceHandler(nil, []string{"github.com"})), rewriteEmbedded: true, @@ -329,69 +328,69 @@ func Test_processLink(t *testing.T) { } } -func Test_Substitute(t *testing.T) { - cda := "cda" - testCases := []struct { - link string - substitutes map[string]*api.LinkSubstitute - wantDestination string - wantOK bool - wantText *string - wantTitle *string - }{ - { - "abc", - map[string]*api.LinkSubstitute{ - "abc": &api.LinkSubstitute{ - Destination: &cda, - }, - }, - "cda", - true, - &cda, - &cda, - }, - { - "abc", - map[string]*api.LinkSubstitute{}, - "abc", - false, - &cda, - &cda, - }, - { - "", - map[string]*api.LinkSubstitute{ - "abc": &api.LinkSubstitute{ - Destination: &cda, - }, - }, - "", - false, - nil, - nil, - }, - } - for _, tc := range testCases { - t.Run("", func(t *testing.T) { - n := &api.Node{ - LinksSubstitutes: tc.substitutes, - } - var ( - gotOK bool - gotDestination, gotText, gotTitle *string - ) - gotOK, gotDestination, gotText, gotTitle = substitute(tc.link, n) - assert.Equal(t, tc.wantOK, gotOK) - if gotDestination != nil { - assert.Equal(t, tc.wantDestination, *gotDestination) - } - if gotText != nil { - assert.Equal(t, tc.wantText, *gotText) - } - if gotTitle != nil { - assert.Equal(t, tc.wantTitle, *gotTitle) - } - }) - } -} +// func Test_Substitute(t *testing.T) { +// cda := "cda" +// testCases := []struct { +// link string +// substitutes map[string]*api.LinkSubstitute +// wantDestination string +// wantOK bool +// wantText *string +// wantTitle *string +// }{ +// { +// "abc", +// map[string]*api.LinkSubstitute{ +// "abc": &api.LinkSubstitute{ +// Destination: &cda, +// }, +// }, +// "cda", +// true, +// &cda, +// &cda, +// }, +// { +// "abc", +// map[string]*api.LinkSubstitute{}, +// "abc", +// false, +// &cda, +// &cda, +// }, +// { +// "", +// map[string]*api.LinkSubstitute{ +// "abc": &api.LinkSubstitute{ +// Destination: &cda, +// }, +// }, +// "", +// false, +// nil, +// nil, +// }, +// } +// for _, tc := range testCases { +// t.Run("", func(t *testing.T) { +// n := &api.Node{ +// LinksSubstitutes: tc.substitutes, +// } +// var ( +// gotOK bool +// gotDestination, gotText, gotTitle *string +// ) +// gotOK, gotDestination, gotText, gotTitle = substitute(tc.link, n) +// assert.Equal(t, tc.wantOK, gotOK) +// if gotDestination != nil { +// assert.Equal(t, tc.wantDestination, *gotDestination) +// } +// if gotText != nil { +// assert.Equal(t, tc.wantText, *gotText) +// } +// if gotTitle != nil { +// assert.Equal(t, tc.wantTitle, *gotTitle) +// } +// }) +// } +// } diff --git a/pkg/reactor/document_controller.go b/pkg/reactor/document_controller.go index c65323e0..7486cf14 100644 --- a/pkg/reactor/document_controller.go +++ b/pkg/reactor/document_controller.go @@ -11,7 +11,7 @@ type DocumentController interface { jobs.Controller // SetDownloadScope sets the scope for resources considered "local" // and therefore downloaded and relatively linked - SetDownloadScope(scope *localityDomain) + // SetDownloadScope(scope *localityDomain) // GetDownloadController is accessor for the DownloadController // working with this DocumentController GetDownloadController() DownloadController @@ -43,9 +43,10 @@ func (d *docController) Shutdown() { // propagate the shutdown to the related download controller d.Worker.(*DocumentWorker).NodeContentProcessor.DownloadController.Shutdown() } -func (d *docController) SetDownloadScope(scope *localityDomain) { - d.Worker.(*DocumentWorker).NodeContentProcessor.localityDomain = scope -} + +// func (d *docController) SetDownloadScope(scope *localityDomain) { +// d.Worker.(*DocumentWorker).NodeContentProcessor.localityDomain = scope +// } func (d *docController) GetDownloadController() DownloadController { return d.Worker.(*DocumentWorker).NodeContentProcessor.DownloadController } diff --git a/pkg/reactor/document_worker.go b/pkg/reactor/document_worker.go index d35b5153..6b6c87e7 100644 --- a/pkg/reactor/document_worker.go +++ b/pkg/reactor/document_worker.go @@ -25,7 +25,7 @@ type DocumentWorker struct { Reader processors.Processor NodeContentProcessor *NodeContentProcessor - localityDomain localityDomain + // localityDomain localityDomain } // DocumentWorkTask implements jobs#Task @@ -53,14 +53,13 @@ func (w *DocumentWorker) Work(ctx context.Context, task interface{}, wq jobs.Wor if task, ok := task.(*DocumentWorkTask); ok { var ( - b bytes.Buffer - document []byte - err error + b bytes.Buffer + sourceBlob, document []byte + err error ) if len(task.Node.ContentSelectors) > 0 { for _, content := range task.Node.ContentSelectors { - var sourceBlob []byte if sourceBlob, err = w.Reader.Read(ctx, content.Source); err != nil { return jobs.NewWorkerError(err, 0) } @@ -72,18 +71,29 @@ func (w *DocumentWorker) Work(ctx context.Context, task interface{}, wq jobs.Wor } b.Write(sourceBlob) } - - if b.Len() == 0 { - return nil + } + // TODO: implement read by template + if len(task.Node.Source) > 0 { + if sourceBlob, err = w.Reader.Read(ctx, task.Node.Source); err != nil { + return jobs.NewWorkerError(err, 0) } - if document, err = ioutil.ReadAll(&b); err != nil { + b.Write(sourceBlob) + if sourceBlob, err = w.NodeContentProcessor.ReconcileLinks(ctx, task.Node, task.Node.Source, sourceBlob); err != nil { return jobs.NewWorkerError(err, 0) } + } - if w.Processor != nil { - if document, err = w.Processor.Process(document, task.Node); err != nil { - return jobs.NewWorkerError(err, 0) - } + if b.Len() == 0 { + return nil + } + + if document, err = ioutil.ReadAll(&b); err != nil { + return jobs.NewWorkerError(err, 0) + } + + if w.Processor != nil { + if document, err = w.Processor.Process(document, task.Node); err != nil { + return jobs.NewWorkerError(err, 0) } } diff --git a/pkg/reactor/document_worker_test.go b/pkg/reactor/document_worker_test.go index 25d83b17..26793976 100644 --- a/pkg/reactor/document_worker_test.go +++ b/pkg/reactor/document_worker_test.go @@ -61,14 +61,14 @@ func TestDocumentWorkerWork(t *testing.T) { }, &TestWriter{ make(map[string][]byte), }, 1, false, rhRegistry), - localityDomain: &localityDomain{ - mapping: map[string]*localityDomainValue{}, - }, + // localityDomain: &localityDomain{ + // mapping: map[string]*localityDomainValue{}, + // }, ResourceHandlers: rhRegistry, }, - localityDomain{ - mapping: map[string]*localityDomainValue{}, - }, + // localityDomain{ + // mapping: map[string]*localityDomainValue{}, + // }, } testCases := []struct { diff --git a/pkg/reactor/integration_test.go b/pkg/reactor/integration_test.go index 04cd60b9..38600acb 100644 --- a/pkg/reactor/integration_test.go +++ b/pkg/reactor/integration_test.go @@ -28,45 +28,51 @@ func init() { tests.SetKlogV(6) } -func _TestReactorWithGitHub(t *testing.T) { +func TestReactorWithGitHub(t *testing.T) { timeout := 300 * time.Second ctx, cancel := context.WithTimeout(context.Background(), timeout) defer cancel() docs := &api.Documentation{ - Root: &api.Node{ - Name: "docs", - NodeSelector: &api.NodeSelector{ - Path: "https://github.com/gardener/gardener/tree/v1.10.0/docs", - }, - Nodes: []*api.Node{ - { - Name: "calico", - NodeSelector: &api.NodeSelector{ - Path: "https://github.com/gardener/gardener-extension-networking-calico/tree/master/docs", - }, + Structure: []*api.Node{ + &api.Node{ + Name: "docs", + NodeSelector: &api.NodeSelector{ + Path: "https://github.com/gardener/gardener/tree/v1.10.0/docs", }, - { - Name: "aws", - NodeSelector: &api.NodeSelector{ - Path: "https://github.com/gardener/gardener-extension-provider-aws/tree/master/docs", + Nodes: []*api.Node{ + { + Name: "calico", + NodeSelector: &api.NodeSelector{ + Path: "https://github.com/gardener/gardener-extension-networking-calico/tree/master/docs", + }, + }, + { + Name: "aws", + NodeSelector: &api.NodeSelector{ + Path: "https://github.com/gardener/gardener-extension-provider-aws/tree/master/docs", + }, }, }, }, }, - LocalityDomain: &api.LocalityDomain{ - LocalityDomainMap: map[string]*api.LocalityDomainValue{ - "github.com/gardener/gardener": &api.LocalityDomainValue{ + Links: &api.Links{ + Rewrites: map[string]*api.LinkRewriteRule{ + "gardener/gardener/(blob|tree|raw)": &api.LinkRewriteRule{ Version: "v1.10.0", - Path: "gardener/gardener/docs", }, - "github.com/gardener/gardener-extension-provider-aws": &api.LocalityDomainValue{ - Version: "master", - Path: "gardener/gardener-extension-provider-aws/docs", + "gardener/gardener-extension-provider-aws/(blob|tree|raw)": &api.LinkRewriteRule{ + Version: "v1.15.3", }, - "github.com/gardener/gardener-extension-networking-calico": &api.LocalityDomainValue{ - Version: "master", - Path: "gardener/gardener-extension-networking-calico/docs", + "gardener/gardener-extension-networking-calico/(blob|tree|raw)": &api.LinkRewriteRule{ + Version: "v1.10.0", + }, + }, + Downloads: &api.Downloads{ + Scope: map[string]api.ResourceRenameRules{ + "gardener/gardener/(blob|tree|raw)/v1.10.0/docs": nil, + "gardener/gardener-extension-provider-aws/(blob|tree|raw)/v1.15.3/docs": nil, + "gardener/gardener-extension-networking-calico/(blob|tree|raw)/v1.10.0/docs": nil, }, }, }, diff --git a/pkg/reactor/localitydomain.go b/pkg/reactor/localitydomain.go index 239c86cb..87b4747b 100644 --- a/pkg/reactor/localitydomain.go +++ b/pkg/reactor/localitydomain.go @@ -2,12 +2,10 @@ package reactor import ( "fmt" - "reflect" "regexp" "strings" "github.com/gardener/docforge/pkg/api" - "github.com/gardener/docforge/pkg/resourcehandlers" "github.com/gardener/docforge/pkg/util/urls" "github.com/google/uuid" "k8s.io/klog/v2" @@ -22,321 +20,348 @@ import ( // resources referenced by those documents are checked // against the path hierarchy of locality domain // entries to determine hwo they will be processed. -type localityDomain struct { - mapping - downloadSubstitutes map[string]string -} -type mapping map[string]*localityDomainValue +// type localityDomain struct { +// mapping +// downloadSubstitutes map[string]string +// } -// LocalityDomainValue encapsulates the members of a -// localityDomain entry value -type localityDomainValue struct { - // Version is the version of the resources in this - // locality domain - Version string - // Path defines the scope of this locality domain - // and is relative to it - Path string - Include []string - Exclude []string -} +// type mapping map[string]*localityDomainValue -func copyMap(s map[string]string) map[string]string { - _s := make(map[string]string) - for k, v := range s { - _s[k] = v - } - return _s -} +// // LocalityDomainValue encapsulates the members of a +// // localityDomain entry value +// type localityDomainValue struct { +// // Version is the version of the resources in this +// // locality domain +// Version string +// // Path defines the scope of this locality domain +// // and is relative to it +// Path string +// Include []string +// Exclude []string +// } -// fromAPI creates new localityDomain copy object from -// api.LocalityDomain -func copyLocalityDomain(ld *api.LocalityDomain) *localityDomain { - localityDomain := &localityDomain{ - mapping: map[string]*localityDomainValue{}, - } - for k, v := range ld.LocalityDomainMap { - localityDomain.mapping[k] = &localityDomainValue{ - v.Version, - v.Path, - v.Include, - v.Exclude, - } - } - localityDomain.downloadSubstitutes = copyMap(ld.DownloadSubstitutes) - return localityDomain -} +// MatchPathInLocality determines if a given link is in the locality domain scope +// and returns the link with version matching the one of the matched locality +// domain. +// func (ld localityDomain) MatchPathInLocality(link string, rhs resourcehandlers.Registry) (string, bool) { +// if rh := rhs.Get(link); rh != nil { +// var ( +// key, path string +// err error +// ) +// if key, path, _, err = rh.GetLocalityDomainCandidate(link); err != nil { +// return link, false +// } +// localityDomain, ok := ld.mapping[key] +// if !ok { +// return link, false +// } -// Set creates or updates a locality domain entry -// with key and path. An update is performed when -// the path is ancestor оф the existing path for -// that key. -func (ld localityDomain) Set(key, path, version string) { +// var exclude, include bool +// // check if the link is not in locality scope by explicit exclude +// if len(localityDomain.Exclude) > 0 { +// for _, rx := range localityDomain.Exclude { +// if exclude, err = regexp.MatchString(rx, link); err != nil { +// klog.Warningf("exclude pattern match %s failed for %s\n", localityDomain.Exclude, link) +// } +// if exclude { +// break +// } +// } +// } +// // check if the link is in locality scope by explicit include +// if len(localityDomain.Include) > 0 { +// for _, rx := range localityDomain.Include { +// if include, err = regexp.MatchString(rx, link); err != nil { +// klog.Warningf("include pattern match %s failed for %s\n", localityDomain.Include, link) +// } +// if include { +// exclude = false +// break +// } +// } +// } +// if exclude { +// if link, err = rh.SetVersion(link, localityDomain.Version); err != nil { +// klog.Errorf("%v\n", err) +// return link, false +// } +// return link, false +// } + +// prefix := localityDomain.Path +// // FIXME: this is tmp valid only for github urls +// if strings.HasPrefix(path, prefix) { +// if link, err = rh.SetVersion(link, localityDomain.Version); err != nil { +// klog.Errorf("%v\n", err) +// return link, false +// } +// return link, true +// } +// // check if in the same repo and then enforce versions rewrite +// _s := strings.Split(prefix, "/") +// _s = _s[:len(_s)-1] +// repoPrefix := strings.Join(_s, "/") +// if strings.HasPrefix(path, repoPrefix) { +// if link, err = rh.SetVersion(link, localityDomain.Version); err != nil { +// klog.Errorf("%v\n", err) +// return link, false +// } +// } +// } +// return link, false +// } + +// // PathInLocality determines if a given link is in the locality domain scope +// func (ld localityDomain) PathInLocality(link string, rhs resourcehandlers.Registry) bool { +// if rh := rhs.Get(link); rh != nil { +// var ( +// key, path, version string +// err error +// ) +// if key, path, version, err = rh.GetLocalityDomainCandidate(link); err != nil { +// return false +// } +// localityDomain, ok := ld.mapping[key] +// if !ok { +// return false +// } +// klog.V(6).Infof("Path %s in locality domain %s: %v\n", path, localityDomain, strings.HasPrefix(path, localityDomain.Path)) +// // TODO: locality domain to be constructed from key for comparison +// return reflect.DeepEqual(localityDomain, &localityDomainValue{ +// version, +// path, +// localityDomain.Include, +// localityDomain.Exclude, +// }) +// } +// return false +// } + +// MatchForLinkRewrite tries recursively from this node +// up to the hierarchy root link rewrite rules attached +// to nodes and finally defined globally that match this +// URL to apply them and rewrite the link or return it +// untouched. +func MatchForLinkRewrite(absLink string, node *api.Node, globalRenameRules map[string]*api.LinkRewriteRule) (version string, destination *string, text string, title string, isMatched bool) { var ( - existingLD *localityDomainValue - ok bool + regex *regexp.Regexp + err error ) - if existingLD, ok = ld.mapping[key]; !ok { - ld.mapping[key] = &localityDomainValue{ - version, - path, - nil, - nil, - } - return - } - - localityDomain := strings.Split(existingLD.Path, "/") - localityDomainCandidate := strings.Split(path, "/") - for i := range localityDomain { - if len(localityDomainCandidate) <= i || localityDomain[i] != localityDomainCandidate[i] { - ld.mapping[key].Path = strings.Join(localityDomain[:i], "/") + nodes := node.Parents() + nodes = append(nodes, node) + for i := len(nodes) - 1; i >= 0; i-- { + p := nodes[i] + if destination == nil || len(version) == 0 || len(text) == 0 || len(title) == 0 { + if l := p.Links; l != nil { + if l.Rewrites != nil { + for expr, rule := range l.Rewrites { + if regex, err = regexp.Compile(expr); err != nil { + klog.Warningf("invalid link rewrite expression: %s, %s", expr, err.Error()) + continue + } + if regex.Match([]byte(absLink)) { + isMatched = true + if len(version) == 0 { + version = rule.Version + } + if destination == nil { + destination = rule.Destination + } + if len(text) == 0 { + text = rule.Text + } + if len(title) == 0 { + title = rule.Title + } + } + } + } + } + } else { return } } + return } -// MatchPathInLocality determines if a given link is in the locality domain scope -// and returns the link with version matching the one of the matched locality -// domain. -func (ld localityDomain) MatchPathInLocality(link string, rhs resourcehandlers.Registry) (string, bool) { - if rh := rhs.Get(link); rh != nil { - var ( - key, path string - err error - ) - if key, path, _, err = rh.GetLocalityDomainCandidate(link); err != nil { - return link, false - } - localityDomain, ok := ld.mapping[key] - if !ok { - return link, false - } +//TODO: implement node settings override parent/global ones - var exclude, include bool - // check if the link is not in locality scope by explicit exclude - if len(localityDomain.Exclude) > 0 { - for _, rx := range localityDomain.Exclude { - if exclude, err = regexp.MatchString(rx, link); err != nil { - klog.Warningf("exclude pattern match %s failed for %s\n", localityDomain.Exclude, link) - } - if exclude { - break - } - } - } - // check if the link is in locality scope by explicit include - if len(localityDomain.Include) > 0 { - for _, rx := range localityDomain.Include { - if include, err = regexp.MatchString(rx, link); err != nil { - klog.Warningf("include pattern match %s failed for %s\n", localityDomain.Include, link) - } - if include { - exclude = false - break - } +// MatchForDownload returns true if the provided URL is in the defined download scope +// for the node, and the resource name to use when serializing it. +func MatchForDownload(url *urls.URL, node *api.Node, globalDownloadRules *api.Downloads) (isMatched bool, downloadResourceName string) { + downloads := []*api.Downloads{} + if globalDownloadRules != nil { + downloads = append(downloads, globalDownloadRules) + } + nodes := node.Parents() + nodes = append(nodes, node) + for _, p := range nodes { + if l := p.Links; l != nil { + if l.Downloads != nil { + downloads = append(downloads, l.Downloads) } } - if exclude { - if link, err = rh.SetVersion(link, localityDomain.Version); err != nil { - klog.Errorf("%v\n", err) - return link, false - } - return link, false + } + for i := len(downloads) - 1; i >= 0; i-- { + d := downloads[i] + if isMatched, downloadResourceName = matchForDownload(url, d); isMatched { + return } + } + return false, "" +} - prefix := localityDomain.Path - // FIXME: this is tmp valid only for github urls - if strings.HasPrefix(path, prefix) { - if link, err = rh.SetVersion(link, localityDomain.Version); err != nil { - klog.Errorf("%v\n", err) - return link, false - } - return link, true +func matchForDownload(url *urls.URL, downloadRules *api.Downloads) (bool, string) { + var ( + regex *regexp.Regexp + downloadResourceName string + err error + ) + if downloadRules == nil { + return false, "" + } + link := url.String() + for linkMatchExpr, linkRenameRules := range downloadRules.Scope { + if regex, err = regexp.Compile(linkMatchExpr); err != nil { + klog.Warningf("invalid link rewrite expression: %s, %s", linkMatchExpr, err.Error()) + continue } - // check if in the same repo and then enforce versions rewrite - _s := strings.Split(prefix, "/") - _s = _s[:len(_s)-1] - repoPrefix := strings.Join(_s, "/") - if strings.HasPrefix(path, repoPrefix) { - if link, err = rh.SetVersion(link, localityDomain.Version); err != nil { - klog.Errorf("%v\n", err) - return link, false + if regex.Match([]byte(link)) { + // check for match scope-specific rules for renaming downloads first + if renameRule := matchDownloadRenameRule(link, linkRenameRules); len(renameRule) > 0 { + downloadResourceName = expandVariables(url, renameRule) + return true, downloadResourceName + } + // check for match scope-agnostic, global rules for renaming downloads + if renameRule := matchDownloadRenameRule(link, downloadRules.Renames); len(renameRule) > 0 { + downloadResourceName = expandVariables(url, renameRule) + return true, downloadResourceName } + // default download resource name + downloadResourceName := expandVariables(url, "$uuid$ext") + return true, downloadResourceName } } - return link, false + return false, "" } -// PathInLocality determines if a given link is in the locality domain scope -func (ld localityDomain) PathInLocality(link string, rhs resourcehandlers.Registry) bool { - if rh := rhs.Get(link); rh != nil { - var ( - key, path, version string - err error - ) - if key, path, version, err = rh.GetLocalityDomainCandidate(link); err != nil { - return false +func matchDownloadRenameRule(link string, rules map[string]string) string { + var ( + renameRegex *regexp.Regexp + err error + ) + for linkRenameMatchExpr, renameRule := range rules { + if renameRegex, err = regexp.Compile(linkRenameMatchExpr); err != nil { + klog.Warningf("invalid link rewrite expression: %s, %s", linkRenameMatchExpr, err.Error()) + continue } - localityDomain, ok := ld.mapping[key] - if !ok { - return false + if renameRegex.Match([]byte(link)) { + return renameRule } - klog.V(6).Infof("Path %s in locality domain %s: %v\n", path, localityDomain, strings.HasPrefix(path, localityDomain.Path)) - // TODO: locality domain to be constructed from key for comparison - return reflect.DeepEqual(localityDomain, &localityDomainValue{ - version, - path, - localityDomain.Include, - localityDomain.Exclude, - }) } - return false + return "" } -func (ld localityDomain) GetDownloadedResourceName(u *urls.URL) string { - k := strings.TrimPrefix(u.Path, "/") +func expandVariables(url *urls.URL, renameExpr string) string { id := uuid.New().String() - if len(ld.downloadSubstitutes) > 0 { - for substituteMatcher, s := range ld.downloadSubstitutes { - var ( - matched bool - err error - ) - if matched, err = regexp.MatchString(substituteMatcher, k); err != nil { - klog.Warningf("download substitution pattern match %s failed for %s\n", substituteMatcher, k) - break - } - if matched { - s = strings.ReplaceAll(s, "$name", u.ResourceName) - s = strings.ReplaceAll(s, "$uuid", id) - s = strings.ReplaceAll(s, "$path", u.ResourcePath) - s = strings.ReplaceAll(s, "$ext", u.Extension) - return s - } - } - } - if len(u.Extension) > 0 { - s := fmt.Sprintf("%s.%s", id, u.Extension) - return s - } - return id + s := renameExpr + s = strings.ReplaceAll(s, "$name", url.ResourceName) + s = strings.ReplaceAll(s, "$uuid", id) + s = strings.ReplaceAll(s, "$ext", fmt.Sprintf(".%s", url.Extension)) + return s } -// setLocalityDomainForNode visits all content selectors in the node and its -// descendants to build a localityDomain -func localityDomainFromNode(node *api.Node, rhs resourcehandlers.Registry) (*localityDomain, error) { - var localityDomains = &localityDomain{ - mapping: map[string]*localityDomainValue{}, - } - if err := csHandle(node.ContentSelectors, localityDomains, rhs); err != nil { - return nil, err +func resolveLinks(links *api.Links, nodes []*api.Node) { + for _, n := range nodes { + n.Links = mergeLinks(links, n.Links) + resolveLinks(n.Links, n.Nodes) + continue } - if node.Nodes != nil { - if err := fromNodes(node.Nodes, localityDomains, rhs); err != nil { - return nil, err - } - } - return localityDomains, nil } -func csHandle(contentSelectors []api.ContentSelector, localityDomains *localityDomain, rhs resourcehandlers.Registry) error { - for _, cs := range contentSelectors { - if rh := rhs.Get(cs.Source); rh != nil { - key, path, version, err := rh.GetLocalityDomainCandidate(cs.Source) - if err != nil { - return err - } - localityDomains.Set(key, path, version) - } +func mergeLinks(a, b *api.Links) *api.Links { + if b == nil { + return a } - return nil + if a == nil { + return b + } + a.Rewrites = mergeRewrites(a.Rewrites, b.Rewrites) + a.Downloads = mergeDownloads(a.Downloads, b.Downloads) + return a } -func fromNodes(nodes []*api.Node, localityDomains *localityDomain, rhs resourcehandlers.Registry) error { - for _, node := range nodes { - csHandle(node.ContentSelectors, localityDomains, rhs) - if err := fromNodes(node.Nodes, localityDomains, rhs); err != nil { - return err +func mergeRewrites(a, b map[string]*api.LinkRewriteRule) map[string]*api.LinkRewriteRule { + if len(b) == 0 { + return a + } + if len(a) == 0 { + return b + } + for k, v := range b { + if rule, ok := a[k]; ok { + a[k] = mergeLinkRewriteRule(rule, v) + continue } + a[k] = v } - return nil + return a } -// ResolveLocalityDomain resolves the actual locality domain for a node, -// considering the global one (if any) and locally defined one. -// If no localityDomain is defined on the node the function returns nil -func resolveLocalityDomain(node *api.Node, globalLD *localityDomain) *localityDomain { - if nodeLD := node.LocalityDomain; nodeLD != nil { - nodeLD := copyLocalityDomain(nodeLD) - if globalLD == nil { - return copyLocalityDomain(node.LocalityDomain) - } - ld := &localityDomain{ - mapping: map[string]*localityDomainValue{}, - } - for k, v := range globalLD.mapping { - ld.mapping[k] = &localityDomainValue{ - v.Version, - v.Path, - v.Exclude, - v.Include, - } - } - mergeLocalityDomain(ld, nodeLD) - return ld +func mergeLinkRewriteRule(a, b *api.LinkRewriteRule) *api.LinkRewriteRule { + if len(b.Version) > 0 { + a.Version = b.Version + } + if b.Destination != nil { + a.Destination = b.Destination } - return globalLD + if len(b.Text) > 0 { + a.Text = b.Text + } + if len(b.Title) > 0 { + a.Title = b.Title + } + return a } -func mergeLocalityDomain(a, b *localityDomain) *localityDomain { - if a == nil || b == nil { - panic("cannot merge nil localityDomain arguments") +func mergeDownloads(a, b *api.Downloads) *api.Downloads { + if b == nil { + return a } - a.downloadSubstitutes = mergeDownloadSubstitutes(a.downloadSubstitutes, b.downloadSubstitutes) - for k, v := range b.mapping { - v := mergeLocalityDomainValue(a.mapping[k], v) - a.mapping[k] = v + if a == nil { + return b } + a.Renames = mergeResourceRenameRule(a.Renames, b.Renames) + a.Scope = mergeDownloadScope(a.Scope, b.Scope) return a } -// replaces Version and Path from b in a if any -// merges Exclude and Include from b in a if any -// merges DownloadSubstitutes from b in a if any, -// replacing duplicate entries in a with entries from b. -func mergeLocalityDomainValue(a, b *localityDomainValue) *localityDomainValue { - if len(b.Version) > 0 { - a.Version = b.Version - } - if len(b.Path) > 0 { - a.Path = b.Path +func mergeResourceRenameRule(a, b api.ResourceRenameRules) api.ResourceRenameRules { + if len(b) == 0 { + return a } - if len(b.Exclude) > 0 { - _e := []string{} - if len(a.Exclude) > 0 { - _e = append(_e, a.Exclude...) - } - a.Exclude = append(_e, b.Exclude...) + if len(a) == 0 { + return b } - if len(b.Include) > 0 { - _e := []string{} - if len(a.Include) > 0 { - _e = append(_e, a.Include...) - } - a.Include = append(_e, b.Include...) + for k, v := range b { + a[k] = v } return a } -func mergeDownloadSubstitutes(a, b map[string]string) map[string]string { - if len(a) > 0 && len(b) < 1 { +func mergeDownloadScope(a, b map[string]api.ResourceRenameRules) map[string]api.ResourceRenameRules { + if len(b) == 0 { return a } - if len(a) < 1 && len(b) > 0 { + if len(a) == 0 { return b } for k, v := range b { + if rule, ok := a[k]; ok { + a[k] = mergeResourceRenameRule(rule, v) + continue + } a[k] = v } return a diff --git a/pkg/reactor/localitydomain_test.go b/pkg/reactor/localitydomain_test.go index 3977a73a..6f904c5d 100644 --- a/pkg/reactor/localitydomain_test.go +++ b/pkg/reactor/localitydomain_test.go @@ -1,223 +1,213 @@ package reactor -import ( - "reflect" - "testing" +// func TestGitHubLocalityDomain_Set(t *testing.T) { - "github.com/gardener/docforge/pkg/resourcehandlers" - "github.com/gardener/docforge/pkg/resourcehandlers/github" +// tests := []struct { +// name string +// localityDomain *localityDomain +// key string +// urls []string +// expected *localityDomainValue +// }{ +// { +// name: "Should return the same and already existing locality domain", +// localityDomain: &localityDomain{ +// mapping: map[string]*localityDomainValue{ +// "https://github.com/gardener/gardener": &localityDomainValue{ +// "master", +// "/gardener/gardener/master/docs", +// nil, +// nil, +// }, +// }, +// }, +// key: "https://github.com/gardener/gardener", +// urls: []string{"/gardener/gardener/master/docs"}, +// expected: &localityDomainValue{ +// "master", +// "/gardener/gardener/master/docs", +// nil, +// nil, +// }, +// }, +// { +// name: "Should return the candidate locality domain as it is higher in the hierarchy", +// localityDomain: &localityDomain{ +// mapping: map[string]*localityDomainValue{ +// "https://github.com/gardener/gardener": &localityDomainValue{ +// "master", +// "/gardener/gardener/master/docs", +// nil, +// nil, +// }, +// }, +// }, +// key: "github.com/gardener/gardener", +// urls: []string{"/gardener/gardener/master", "/gardener/gardener/master/docs/concepts", "/gardener/gardener/master/docs/concepts/apiserver.md"}, +// expected: &localityDomainValue{ +// "master", +// "/gardener/gardener/master", +// nil, +// nil, +// }, +// }, +// { +// name: "Should return one level higher because both are on the same level in the hierarchy", +// localityDomain: &localityDomain{ +// mapping: map[string]*localityDomainValue{}, +// }, +// key: "github.com/gardener/gardener", +// urls: []string{"/gardener/gardener/master/examples", "/gardener/gardener/master"}, +// expected: &localityDomainValue{ +// "master", +// "/gardener/gardener/master", +// nil, +// nil, +// }, +// }, +// } +// for _, tc := range tests { +// t.Run(tc.name, func(t *testing.T) { +// ld := tc.localityDomain +// for _, url := range tc.urls { +// ld.Set(tc.key, url, "master") +// } - "github.com/gardener/docforge/pkg/api" -) +// if !reflect.DeepEqual(ld.mapping[tc.key], tc.expected) { +// t.Errorf("test failed %s != %s", ld.mapping[tc.key], tc.expected) +// } +// }) +// } +// } -func TestGitHubLocalityDomain_Set(t *testing.T) { - - tests := []struct { - name string - localityDomain *localityDomain - key string - urls []string - expected *localityDomainValue - }{ - { - name: "Should return the same and already existing locality domain", - localityDomain: &localityDomain{ - mapping: map[string]*localityDomainValue{ - "https://github.com/gardener/gardener": &localityDomainValue{ - "master", - "/gardener/gardener/master/docs", - nil, - nil, - }, - }, - }, - key: "https://github.com/gardener/gardener", - urls: []string{"/gardener/gardener/master/docs"}, - expected: &localityDomainValue{ - "master", - "/gardener/gardener/master/docs", - nil, - nil, - }, - }, - { - name: "Should return the candidate locality domain as it is higher in the hierarchy", - localityDomain: &localityDomain{ - mapping: map[string]*localityDomainValue{ - "https://github.com/gardener/gardener": &localityDomainValue{ - "master", - "/gardener/gardener/master/docs", - nil, - nil, - }, - }, - }, - key: "github.com/gardener/gardener", - urls: []string{"/gardener/gardener/master", "/gardener/gardener/master/docs/concepts", "/gardener/gardener/master/docs/concepts/apiserver.md"}, - expected: &localityDomainValue{ - "master", - "/gardener/gardener/master", - nil, - nil, - }, - }, - { - name: "Should return one level higher because both are on the same level in the hierarchy", - localityDomain: &localityDomain{ - mapping: map[string]*localityDomainValue{}, - }, - key: "github.com/gardener/gardener", - urls: []string{"/gardener/gardener/master/examples", "/gardener/gardener/master"}, - expected: &localityDomainValue{ - "master", - "/gardener/gardener/master", - nil, - nil, - }, - }, - } - for _, tc := range tests { - t.Run(tc.name, func(t *testing.T) { - ld := tc.localityDomain - for _, url := range tc.urls { - ld.Set(tc.key, url, "master") - } - - if !reflect.DeepEqual(ld.mapping[tc.key], tc.expected) { - t.Errorf("test failed %s != %s", ld.mapping[tc.key], tc.expected) - } - }) - } -} - -func Test_SetLocalityDomainForNode(t *testing.T) { - tests := []struct { - name string - want *localityDomain - wantErr bool - mutate func(newDoc *api.Documentation) - }{ - { - name: "Should return the expected locality domain", - want: &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/org/repo": &localityDomainValue{ - "master", - "org/repo/docs", - nil, - nil, - }, - }, - }, - wantErr: false, - mutate: func(newDoc *api.Documentation) { - newDoc.Root.ContentSelectors = []api.ContentSelector{ - {Source: "https://github.com/org/repo/tree/master/docs/concepts"}, - {Source: "https://github.com/org/repo/tree/master/docs/architecture"}, - } - }, - }, - { - name: "Should return the expected locality domain", - want: &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/org/repo": &localityDomainValue{ - "master", - "org/repo/docs", - nil, - nil, - }, - }, - }, - wantErr: false, - mutate: func(newDoc *api.Documentation) { - newDoc.Root.ContentSelectors = []api.ContentSelector{ - {Source: "https://github.com/org/repo/tree/master/docs"}, - {Source: "https://github.com/org/repo/tree/master/docs/architecture"}, - } - }, - }, - { - name: "Should return the expected locality domain", - want: &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/org/repo": &localityDomainValue{ - "master", - "org/repo", - nil, - nil, - }, - }, - }, - wantErr: false, - mutate: func(newDoc *api.Documentation) { - newDoc.Root.ContentSelectors = []api.ContentSelector{ - {Source: "https://github.com/org/repo/tree/master/docs"}, - {Source: "https://github.com/org/repo/tree/master/example"}, - } - }, - }, - { - name: "Should return the expected locality domain", - want: &localityDomain{ - mapping: map[string]*localityDomainValue{ - "github.com/org/repo": &localityDomainValue{ - "master", - "org/repo", - nil, - nil, - }, - "github.com/org/repo2": &localityDomainValue{ - "master", - "org/repo2/example", - nil, - nil, - }, - }, - }, - wantErr: false, - mutate: func(newDoc *api.Documentation) { - newDoc.Root.ContentSelectors = []api.ContentSelector{ - {Source: "https://github.com/org/repo/tree/master/docs"}, - {Source: "https://github.com/org/repo/tree/master/example"}, - } - newDoc.Root.Nodes = []*api.Node{ - { - Name: "anotherrepo", - ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo2/tree/master/example"}}, - }, - } - }, - }, - } - for _, tc := range tests { - t.Run(tc.name, func(t *testing.T) { - newDoc := createNewDocumentation() - gh := github.NewResourceHandler(nil, []string{"github.com"}) - rhs := resourcehandlers.NewRegistry(gh) - tc.mutate(newDoc) - got, err := localityDomainFromNode(newDoc.Root, rhs) - if (err != nil) != tc.wantErr { - t.Errorf("SetLocalityDomainForNode() error = %v, wantErr %v", err, tc.wantErr) - return - } - for k, v := range tc.want.mapping { - var ( - _v *localityDomainValue - ok bool - ) - if _v, ok = got.mapping[k]; !ok { - t.Errorf("want %s:%v, got %s:%v", k, v, k, _v) - } else { - if _v.Path != v.Path { - t.Errorf("want path %s, got %s", v.Path, _v.Path) - } - if _v.Version != v.Version { - t.Errorf("want version %s, got %s", v.Version, _v.Version) - } - } - } - rhs.Remove() - }) - } -} +// func Test_SetLocalityDomainForNode(t *testing.T) { +// tests := []struct { +// name string +// want *localityDomain +// wantErr bool +// mutate func(newDoc *api.Documentation) +// }{ +// { +// name: "Should return the expected locality domain", +// want: &localityDomain{ +// mapping: map[string]*localityDomainValue{ +// "github.com/org/repo": &localityDomainValue{ +// "master", +// "org/repo/docs", +// nil, +// nil, +// }, +// }, +// }, +// wantErr: false, +// mutate: func(newDoc *api.Documentation) { +// newDoc.Root.ContentSelectors = []api.ContentSelector{ +// {Source: "https://github.com/org/repo/tree/master/docs/concepts"}, +// {Source: "https://github.com/org/repo/tree/master/docs/architecture"}, +// } +// }, +// }, +// { +// name: "Should return the expected locality domain", +// want: &localityDomain{ +// mapping: map[string]*localityDomainValue{ +// "github.com/org/repo": &localityDomainValue{ +// "master", +// "org/repo/docs", +// nil, +// nil, +// }, +// }, +// }, +// wantErr: false, +// mutate: func(newDoc *api.Documentation) { +// newDoc.Root.ContentSelectors = []api.ContentSelector{ +// {Source: "https://github.com/org/repo/tree/master/docs"}, +// {Source: "https://github.com/org/repo/tree/master/docs/architecture"}, +// } +// }, +// }, +// { +// name: "Should return the expected locality domain", +// want: &localityDomain{ +// mapping: map[string]*localityDomainValue{ +// "github.com/org/repo": &localityDomainValue{ +// "master", +// "org/repo", +// nil, +// nil, +// }, +// }, +// }, +// wantErr: false, +// mutate: func(newDoc *api.Documentation) { +// newDoc.Root.ContentSelectors = []api.ContentSelector{ +// {Source: "https://github.com/org/repo/tree/master/docs"}, +// {Source: "https://github.com/org/repo/tree/master/example"}, +// } +// }, +// }, +// { +// name: "Should return the expected locality domain", +// want: &localityDomain{ +// mapping: map[string]*localityDomainValue{ +// "github.com/org/repo": &localityDomainValue{ +// "master", +// "org/repo", +// nil, +// nil, +// }, +// "github.com/org/repo2": &localityDomainValue{ +// "master", +// "org/repo2/example", +// nil, +// nil, +// }, +// }, +// }, +// wantErr: false, +// mutate: func(newDoc *api.Documentation) { +// newDoc.Root.ContentSelectors = []api.ContentSelector{ +// {Source: "https://github.com/org/repo/tree/master/docs"}, +// {Source: "https://github.com/org/repo/tree/master/example"}, +// } +// newDoc.Root.Nodes = []*api.Node{ +// { +// Name: "anotherrepo", +// ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo2/tree/master/example"}}, +// }, +// } +// }, +// }, +// } +// for _, tc := range tests { +// t.Run(tc.name, func(t *testing.T) { +// newDoc := createNewDocumentation() +// gh := github.NewResourceHandler(nil, []string{"github.com"}) +// rhs := resourcehandlers.NewRegistry(gh) +// tc.mutate(newDoc) +// got, err := localityDomainFromNode(newDoc.Root, rhs) +// if (err != nil) != tc.wantErr { +// t.Errorf("SetLocalityDomainForNode() error = %v, wantErr %v", err, tc.wantErr) +// return +// } +// for k, v := range tc.want.mapping { +// var ( +// _v *localityDomainValue +// ok bool +// ) +// if _v, ok = got.mapping[k]; !ok { +// t.Errorf("want %s:%v, got %s:%v", k, v, k, _v) +// } else { +// if _v.Path != v.Path { +// t.Errorf("want path %s, got %s", v.Path, _v.Path) +// } +// if _v.Version != v.Version { +// t.Errorf("want version %s, got %s", v.Version, _v.Version) +// } +// } +// } +// rhs.Remove() +// }) +// } +// } diff --git a/pkg/reactor/reactor.go b/pkg/reactor/reactor.go index 12de2c26..f4fa2401 100644 --- a/pkg/reactor/reactor.go +++ b/pkg/reactor/reactor.go @@ -4,8 +4,10 @@ import ( "context" "fmt" "os" + "strings" "github.com/gardener/docforge/pkg/processors" + "github.com/google/uuid" "k8s.io/klog/v2" "github.com/gardener/docforge/pkg/api" @@ -30,6 +32,7 @@ type Options struct { ResourceHandlers []resourcehandlers.ResourceHandler DryRunWriter writers.DryRunWriter Resolve bool + GlobalLinksConfig *api.Links } // NewReactor creates a Reactor from Options @@ -39,7 +42,7 @@ func NewReactor(o *Options) *Reactor { worker := &DocumentWorker{ Writer: o.Writer, Reader: &GenericReader{rhRegistry}, - NodeContentProcessor: NewNodeContentProcessor(o.ResourcesPath, nil, downloadController, o.FailFast, o.MarkdownFmt, o.RewriteEmbedded, rhRegistry), + NodeContentProcessor: NewNodeContentProcessor(o.ResourcesPath, o.GlobalLinksConfig, downloadController, o.FailFast, o.MarkdownFmt, o.RewriteEmbedded, rhRegistry), Processor: o.Processor, } docController := NewDocumentController(worker, o.MaxWorkersCount, o.FailFast) @@ -56,21 +59,17 @@ func NewReactor(o *Options) *Reactor { // Reactor orchestrates the documentation build workflow type Reactor struct { - FailFast bool - ResourceHandlers resourcehandlers.Registry - localityDomain *localityDomain + FailFast bool + ResourceHandlers resourcehandlers.Registry + // localityDomain *localityDomain DocController DocumentController DownloadController DownloadController DryRunWriter writers.DryRunWriter Resolve bool } -// Run starts build operation on docStruct -func (r *Reactor) Run(ctx context.Context, docStruct *api.Documentation, dryRun bool) error { - var ( - err error - ld *localityDomain - ) +// Run starts build operation on documentation +func (r *Reactor) Run(ctx context.Context, documentation *api.Documentation, dryRun bool) error { ctx, cancel := context.WithCancel(ctx) defer func() { cancel() @@ -79,22 +78,12 @@ func (r *Reactor) Run(ctx context.Context, docStruct *api.Documentation, dryRun } }() - if err := r.ResolveStructure(ctx, docStruct.Root); err != nil { + if err := r.ResolveStructure(ctx, documentation.Structure); err != nil { return err } - if docStruct.LocalityDomain != nil { - ld = copyLocalityDomain(docStruct.LocalityDomain) - if ld == nil || len(ld.mapping) == 0 { - if ld, err = localityDomainFromNode(docStruct.Root, r.ResourceHandlers); err != nil { - return err - } - r.localityDomain = ld - } - } - if r.Resolve { - s, err := api.Serialize(docStruct) + s, err := api.Serialize(documentation) if err != nil { return err } @@ -102,35 +91,49 @@ func (r *Reactor) Run(ctx context.Context, docStruct *api.Documentation, dryRun os.Stdout.Write([]byte("\n\n")) } + resolveLinks(documentation.Links, documentation.Structure) + klog.V(4).Info("Building documentation structure\n\n") - if err = r.Build(ctx, docStruct.Root, ld); err != nil { + if err := r.Build(ctx, documentation.Structure); err != nil { return err } return nil } -// ResolveStructure builds the subnodes hierarchy of a node based on the natural nodes -// hierarchy and on rules such as those in NodeSelector. -// The node hierarchy is resolved by an appropriate handler selected based -// on the NodeSelector path URI +// ResolveStructure resolves the following in a structure model: +// - Node name variables +// - NodeSelectors // The resulting model is the actual flight plan for replicating resources. -func (r *Reactor) ResolveStructure(ctx context.Context, node *api.Node) error { - node.SetParentsDownwards() - if node.NodeSelector != nil { - var handler resourcehandlers.ResourceHandler - if handler = r.ResourceHandlers.Get(node.NodeSelector.Path); handler == nil { - return fmt.Errorf("No suitable handler registered for path %s", node.NodeSelector.Path) +func (r *Reactor) ResolveStructure(ctx context.Context, nodes []*api.Node) error { + var handler resourcehandlers.ResourceHandler + for _, node := range nodes { + node.SetParentsDownwards() + if len(node.Source) > 0 { + if handler = r.ResourceHandlers.Get(node.Source); handler == nil { + return fmt.Errorf("No suitable handler registered for URL %s", node.Source) + } + if len(node.Name) == 0 { + node.Name = "$name" + } + name, ext := handler.ResourceName(node.Source) + id := uuid.New().String() + node.Name = strings.ReplaceAll(node.Name, "$name", name) + node.Name = strings.ReplaceAll(node.Name, "$uuid", id) + node.Name = strings.ReplaceAll(node.Name, "$ext", fmt.Sprintf(".%s", ext)) } - if err := handler.ResolveNodeSelector(ctx, node); err != nil { - return err + if node.NodeSelector != nil { + if handler = r.ResourceHandlers.Get(node.NodeSelector.Path); handler == nil { + return fmt.Errorf("No suitable handler registered for path %s", node.NodeSelector.Path) + } + if err := handler.ResolveNodeSelector(ctx, node); err != nil { + return err + } + // remove node selectors after resolution + node.NodeSelector = nil } - // remove node selectors after resolution - node.NodeSelector = nil - } - if len(node.Nodes) > 0 { - for _, n := range node.Nodes { - if err := r.ResolveStructure(ctx, n); err != nil { + if len(node.Nodes) > 0 { + if err := r.ResolveStructure(ctx, node.Nodes); err != nil { return err } } diff --git a/pkg/reactor/reactor_test.go b/pkg/reactor/reactor_test.go index 1637331f..e1b7b8fe 100644 --- a/pkg/reactor/reactor_test.go +++ b/pkg/reactor/reactor_test.go @@ -15,14 +15,12 @@ func init() { var ( apiRefNode = &api.Node{ Name: "apiRef", - Title: "API Reference", ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo/tree/master/docs/architecture/apireference.md"}}, } archNode = &api.Node{ Name: "arch", ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo/tree/master/docs/architecture"}}, - Title: "Architecture", Nodes: []*api.Node{ apiRefNode, }, @@ -31,26 +29,25 @@ var ( blogNode = &api.Node{ Name: "blog", ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo/tree/master/docs/blog/blog-part1.md"}}, - Title: "Blog", } tasksNode = &api.Node{ Name: "tasks", - Title: "Tasks", ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo/tree/master/docs/tasks"}}, } ) func createNewDocumentation() *api.Documentation { return &api.Documentation{ - Root: &api.Node{ - Name: "rootNode", - Title: "Root node!", - ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo/tree/master/docs"}}, - Nodes: []*api.Node{ - archNode, - blogNode, - tasksNode, + Structure: []*api.Node{ + &api.Node{ + Name: "rootNode", + ContentSelectors: []api.ContentSelector{{Source: "https://github.com/org/repo/tree/master/docs"}}, + Nodes: []*api.Node{ + archNode, + blogNode, + tasksNode, + }, }, }, } @@ -74,6 +71,10 @@ func (f *FakeResourceHandler) Name(uri string) string { return uri } +func (f *FakeResourceHandler) ResourceName(uri string) (string, string) { + return "", "" +} + func (f *FakeResourceHandler) BuildAbsLink(source, relLink string) (string, error) { return relLink, nil } diff --git a/pkg/resourcehandlers/github/github_resource_handler.go b/pkg/resourcehandlers/github/github_resource_handler.go index b6b76278..8ce33054 100644 --- a/pkg/resourcehandlers/github/github_resource_handler.go +++ b/pkg/resourcehandlers/github/github_resource_handler.go @@ -15,6 +15,7 @@ import ( "github.com/gardener/docforge/pkg/api" "github.com/gardener/docforge/pkg/resourcehandlers" + "github.com/gardener/docforge/pkg/util/urls" "github.com/google/go-github/v32/github" ) @@ -76,8 +77,8 @@ func buildNodes(node *api.Node, childResourceLocators []*ResourceLocator, cache ) if node.NodeSelector != nil { nodePath = node.NodeSelector.Path - } else if len(node.ContentSelectors) > 0 { - nodePath = node.ContentSelectors[0].Source + } else if len(node.Source) > 0 { + nodePath = node.Source } if nodeResourceLocator = cache.Get(nodePath); nodeResourceLocator == nil { panic(fmt.Sprintf("Node is not available as ResourceLocator %v", nodePath)) @@ -97,8 +98,8 @@ func buildNodes(node *api.Node, childResourceLocators []*ResourceLocator, cache } childName := strings.TrimSuffix(childName, ".md") n := &api.Node{ - ContentSelectors: []api.ContentSelector{{Source: childResourceLocator.String()}}, - Name: childName, + Name: childName, + Source: childResourceLocator.String(), } n.SetParent(node) if node.Nodes == nil { @@ -123,13 +124,17 @@ func buildNodes(node *api.Node, childResourceLocators []*ResourceLocator, cache // containing for example images only adn thus irrelevant to the // documentation structure func cleanupNodeTree(node *api.Node) { - if len(node.ContentSelectors) > 0 { - source := node.ContentSelectors[0].Source + if len(node.Source) > 0 { + source := node.Source if rl, _ := parse(source); rl.Type == Tree { - node.ContentSelectors = nil + node.Source = "" } } for _, n := range node.Nodes { + // skip nested unresolved nodeSelector nodes from cleanup + if n.NodeSelector != nil && len(n.Nodes) == 0 { + continue + } cleanupNodeTree(n) } childrenCopy := make([]*api.Node, len(node.Nodes)) @@ -137,10 +142,15 @@ func cleanupNodeTree(node *api.Node) { copy(childrenCopy, node.Nodes) } for i, n := range node.Nodes { - if n.ContentSelectors == nil && len(n.Nodes) == 0 { - childrenCopy = removeNode(childrenCopy, i) + if len(n.Nodes) == 0 { + if n.NodeSelector != nil { + continue + } + if len(n.Source) == 0 && len(n.Nodes) == 0 { + childrenCopy = removeNode(childrenCopy, i) + } + node.Nodes = childrenCopy } - node.Nodes = childrenCopy } } @@ -362,6 +372,23 @@ func (gh *GitHub) Name(uri string) string { return "" } +// ResourceName implements resourcehandlers/ResourceHandler#ResourceName +func (gh *GitHub) ResourceName(uri string) (string, string) { + var ( + rl *ResourceLocator + err error + ) + if rl, err = gh.URLToGitHubLocator(nil, uri, false); err != nil { + panic(err) + } + if gh != nil { + if u, err := urls.Parse(rl.String()); err == nil { + return u.ResourceName, u.Extension + } + } + return "", "" +} + // BuildAbsLink builds the abs link from the source and the relative path // Implements resourcehandlers/ResourceHandler#BuildAbsLink func (gh *GitHub) BuildAbsLink(source, relPath string) (string, error) { diff --git a/pkg/resourcehandlers/github/github_resource_handler_test.go b/pkg/resourcehandlers/github/github_resource_handler_test.go index 105323b3..a789e328 100644 --- a/pkg/resourcehandlers/github/github_resource_handler_test.go +++ b/pkg/resourcehandlers/github/github_resource_handler_test.go @@ -262,12 +262,12 @@ func TestResolveNodeSelector(t *testing.T) { api.SortNodesByName(c.want) if !reflect.DeepEqual(c.inNode, c.want) { s, _ := api.Serialize(&api.Documentation{ - Root: c.inNode, + Structure: []*api.Node{c.inNode}, }) fmt.Printf(s) fmt.Printf("\n\n") s, _ = api.Serialize(&api.Documentation{ - Root: c.want, + Structure: []*api.Node{c.want}, }) fmt.Printf(s) t.Errorf("ResolveNodeSelector == %++v, want %++v", c.inNode, c.want) diff --git a/pkg/resourcehandlers/resource_handlers.go b/pkg/resourcehandlers/resource_handlers.go index 705227da..4f3a8263 100644 --- a/pkg/resourcehandlers/resource_handlers.go +++ b/pkg/resourcehandlers/resource_handlers.go @@ -21,6 +21,9 @@ type ResourceHandler interface { // Name resolves the name of the resource from a URI // Example: https://github.com/owner/repo/tree/master/a/b/c.md -> c.md Name(uri string) string + // ResourceName returns a breakdown of a resource name in the link, consisting + // of name and potentially and extention without the dot. + ResourceName(link string) (string, string) // BuildAbsLink should return an absolute path of a relative link in regards of the provided // source BuildAbsLink(source, link string) (string, error) diff --git a/pkg/resourcehandlers/resource_handlers_test.go b/pkg/resourcehandlers/resource_handlers_test.go index bf5bb4fa..7729612b 100644 --- a/pkg/resourcehandlers/resource_handlers_test.go +++ b/pkg/resourcehandlers/resource_handlers_test.go @@ -27,9 +27,11 @@ func (rh *TestResourceHandler) Read(ctx context.Context, uri string) ([]byte, er return nil, nil } func (rh *TestResourceHandler) Name(uri string) string { - return string("") + return "" +} +func (rh *TestResourceHandler) ResourceName(uri string) (string, string) { + return "", "" } - func (rh *TestResourceHandler) BuildAbsLink(source, relLink string) (string, error) { return relLink, nil } diff --git a/pkg/writers/dryRunWriter.go b/pkg/writers/dryRunWriter.go index 265bc58b..238352f0 100644 --- a/pkg/writers/dryRunWriter.go +++ b/pkg/writers/dryRunWriter.go @@ -131,6 +131,7 @@ func format(files []*file, b *bytes.Buffer) { b.WriteString(fmt.Sprintf("%s\n", s)) if i < len(dd)-1 { b.Write(bytes.Repeat([]byte(" "), i)) + continue } for _, st := range f.stats { b.Write([]byte(" ")) diff --git a/pkg/writers/dryRunWriter_test.go b/pkg/writers/dryRunWriter_test.go index 52fa6399..e2e86836 100644 --- a/pkg/writers/dryRunWriter_test.go +++ b/pkg/writers/dryRunWriter_test.go @@ -17,6 +17,7 @@ func TestFormat(t *testing.T) { in := []string{ "dev/__resources/015ec383-3c1b-487b-acff-4d7f4f8a1b14.png", "dev/__resources/173a7246-e1d5-40d5-b981-8cff293e177a.png", + "dev/doc/README.md", "dev/doc/aws_provider.md", "dev/doc/gardener", "dev/doc/gardener/_index.md", @@ -41,6 +42,7 @@ func TestFormat(t *testing.T) { 015ec383-3c1b-487b-acff-4d7f4f8a1b14.png 173a7246-e1d5-40d5-b981-8cff293e177a.png doc + README.md aws_provider.md gardener _index.md