Leeres Fossil Repo

Check-in [bd5b945d3b]
Login

Check-in [bd5b945d3b]

Many hyperlinks are disabled.
Use anonymous login to enable hyperlinks.

Overview
Comment:Draft implementation in literate style
Timelines: family | ancestors | descendants | both | trunk
Files: files | file ages | folders
SHA1: bd5b945d3bb51c866475efb3df55db007a3c3e19
User & Date: nsa 2013-04-08 11:35:45.845
Context
2013-04-08
12:10
It finally works check-in: 2141176eb1 user: nsa tags: trunk
11:35
Draft implementation in literate style check-in: bd5b945d3b user: nsa tags: trunk
08:48
Initial commit check-in: 1aa4e3e7c1 user: nsa tags: trunk
Changes
Unified Diff Ignore Whitespace Patch
Added bootlit.go.










































































































































































































































































































>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
package main

import (
	"regexp"
	"flag"
	"bufio"
	"fmt"
	"os"
	"io"
	"strings"
)

// main is the entry point of lit. It parses the literate source file named
// by the first positional argument, expands chunk references, and writes the
// requested outputs.
//
// Flags:
//   - --default-chunk: name of the root chunk written to --src-out ("*" by default)
//   - --src-out: file that receives the expanded root chunk
//   - --doc-out: file that receives the documentation text
//
// When no input file is given, or neither output flag is set, usage is
// printed and the process exits with status 2 so that callers can detect the
// misuse. Failures to create, write, or close an output file panic.
func main() {
	var sourceFile string
	var docFile string
	var defaultChunk string

	flag.Usage = func() {
		fmt.Fprintf(os.Stderr, "Usage of lit: lit [options] file-to-parse.w\n")
		flag.PrintDefaults()
	}

	flag.StringVar(&defaultChunk, "default-chunk", "*", "Default program chunk")
	flag.StringVar(&sourceFile, "src-out", "", "File to write source code")
	flag.StringVar(&docFile, "doc-out", "", "File to write document")
	flag.Parse()

	// flag.Arg returns "" when the positional argument is absent.
	parsingFile := flag.Arg(0)

	if parsingFile == "" || (sourceFile == "" && docFile == "") {
		flag.Usage()
		os.Exit(2)
	}

	chunks, document := parseFile(parsingFile)
	chunks = expandChunks(chunks)

	// writeOutput creates path and stores content in it. The file is only
	// touched after os.Create succeeded, and both the write and the close
	// are checked so that a truncated output never goes unnoticed.
	writeOutput := func(path, content string) {
		out, err := os.Create(path)
		if err != nil {
			panic(err)
		}
		if _, err := out.WriteString(content); err != nil {
			// Best-effort close; the write error is the one worth reporting.
			out.Close()
			panic(err)
		}
		if err := out.Close(); err != nil {
			panic(err)
		}
	}

	if sourceFile != "" {
		writeOutput(sourceFile, chunks[defaultChunk])
	}

	if docFile != "" {
		writeOutput(docFile, document)
	}
}


// parseFile reads the literate source file fileName line by line and splits
// it into code chunks and documentation text.
//
// A line containing "<<name>>=" opens the chunk called name. A line that
// starts (after optional indentation) with "@" followed by whitespace or the
// end of the line closes the current chunk. Marker lines themselves are
// dropped. Every other line is appended to the open chunk, or to the
// documentation when no chunk is open.
//
// It returns the map from chunk name to raw (unexpanded) chunk body and the
// documentation text. Opening a chunk name a second time resets its body.
// parseFile panics if the file cannot be opened or read.
func parseFile(fileName string) (map[string]string, string) {
	f, err := os.Open(fileName)
	if err != nil {
		panic(err)
	}
	defer f.Close()

	fileBuf := bufio.NewReader(f)

	chunkMatcher := regexp.MustCompile("<<([^>]+)>>=")
	// The terminator must be anchored: an unanchored "@" would end the chunk
	// on any code line that merely contains the character (string literals,
	// e-mail addresses, annotations) and silently drop that line.
	endOfChunkMatcher := regexp.MustCompile(`^\s*@(\s|$)`)

	var document string
	var chunkName string
	chunks := make(map[string]string)

	// processLine classifies one line: chunk start, chunk end, chunk body or
	// documentation.
	processLine := func(line string) {
		if matches := chunkMatcher.FindStringSubmatch(line); matches != nil {
			chunkName = matches[1]
			chunks[chunkName] = ""
			return
		}
		if endOfChunkMatcher.MatchString(line) {
			chunkName = ""
			return
		}
		if chunkName != "" {
			chunks[chunkName] += line
		} else {
			document += line
		}
	}

	for {
		line, err := fileBuf.ReadString('\n')
		if err != nil && err != io.EOF {
			panic(err)
		}
		// The last line may lack a trailing newline; it still has to go
		// through marker detection, otherwise a final "@" ends up in the
		// chunk body.
		processLine(line)
		if err == io.EOF {
			break
		}
	}
	return chunks, document
}


// expandChunks resolves chunk references. Every "<<name>>" occurring in a
// chunk body is replaced by the fully expanded body of the chunk called
// name. References to chunks that are undefined or empty are left in the
// text unchanged.
//
// It returns a new map holding the expanded body for every key of chunks;
// the input map is not modified. expandChunks panics with a descriptive
// message when chunks reference each other cyclically, since such a
// definition has no finite expansion.
func expandChunks(chunks map[string]string) map[string]string {
	chunkMatcher := regexp.MustCompile("<<([^>]+)>>")

	expandedChunks := make(map[string]string, len(chunks))
	// inProgress holds the names currently being expanded; meeting one of
	// them again means the definitions form a cycle.
	inProgress := make(map[string]bool)

	var expandChunk func(name string) string

	// expandBody substitutes every reference in b in a single pass, so text
	// that was already expanded is never scanned again.
	expandBody := func(b string) string {
		return chunkMatcher.ReplaceAllStringFunc(b, func(ref string) string {
			name := strings.TrimSuffix(strings.TrimPrefix(ref, "<<"), ">>")
			if chunks[name] == "" {
				return ref
			}
			return expandChunk(name)
		})
	}

	// expandChunk returns the expanded body of the named chunk, computing
	// it at most once.
	expandChunk = func(name string) string {
		if done, ok := expandedChunks[name]; ok {
			return done
		}
		if inProgress[name] {
			panic("lit: cyclic chunk reference involving <<" + name + ">>")
		}
		inProgress[name] = true
		result := expandBody(chunks[name])
		delete(inProgress, name)
		expandedChunks[name] = result
		return result
	}

	for name := range chunks {
		expandChunk(name)
	}

	return expandedChunks
}
Deleted lit.go.
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
package main

import (
	"regexp"
	"flag"
	"bufio"
	"fmt"
	"os"
	"io"
	"strings"
)

// main is the entry point of lit. It parses the literate source file named
// by the first positional argument, expands chunk references, and writes the
// requested outputs.
//
// Flags:
//   - --default-chunk: name of the root chunk written to --src-out ("*" by default)
//   - --src-out: file that receives the expanded root chunk
//   - --doc-out: file that receives the documentation text
//
// When no input file is given, or neither output flag is set, usage is
// printed and the process exits with status 2 so that callers can detect the
// misuse. Failures to create, write, or close an output file panic.
func main() {
	var sourceFile string
	var docFile string
	var defaultChunk string

	flag.Usage = func() {
		fmt.Fprintf(os.Stderr, "Usage of lit: lit [options] file-to-parse.w\n")
		flag.PrintDefaults()
	}

	flag.StringVar(&defaultChunk, "default-chunk", "*", "Default program chunk")
	flag.StringVar(&sourceFile, "src-out", "", "File to write source code")
	flag.StringVar(&docFile, "doc-out", "", "File to write document")
	flag.Parse()

	// flag.Arg returns "" when the positional argument is absent.
	parsingFile := flag.Arg(0)

	if parsingFile == "" || (sourceFile == "" && docFile == "") {
		flag.Usage()
		os.Exit(2)
	}

	chunks, document := parseFile(parsingFile)
	chunks = expandChunks(chunks)

	// writeOutput creates path and stores content in it. The file is only
	// touched after os.Create succeeded, and both the write and the close
	// are checked so that a truncated output never goes unnoticed.
	writeOutput := func(path, content string) {
		out, err := os.Create(path)
		if err != nil {
			panic(err)
		}
		if _, err := out.WriteString(content); err != nil {
			// Best-effort close; the write error is the one worth reporting.
			out.Close()
			panic(err)
		}
		if err := out.Close(); err != nil {
			panic(err)
		}
	}

	if sourceFile != "" {
		writeOutput(sourceFile, chunks[defaultChunk])
	}

	if docFile != "" {
		writeOutput(docFile, document)
	}
}


// parseFile reads the literate source file fileName line by line and splits
// it into code chunks and documentation text.
//
// A line containing "<<name>>=" opens the chunk called name. A line that
// starts (after optional indentation) with "@" followed by whitespace or the
// end of the line closes the current chunk. Marker lines themselves are
// dropped. Every other line is appended to the open chunk, or to the
// documentation when no chunk is open.
//
// It returns the map from chunk name to raw (unexpanded) chunk body and the
// documentation text. Opening a chunk name a second time resets its body.
// parseFile panics if the file cannot be opened or read.
func parseFile(fileName string) (map[string]string, string) {
	f, err := os.Open(fileName)
	if err != nil {
		panic(err)
	}
	defer f.Close()

	fileBuf := bufio.NewReader(f)

	chunkMatcher := regexp.MustCompile("<<([^>]+)>>=")
	// The terminator must be anchored: an unanchored "@" would end the chunk
	// on any code line that merely contains the character (string literals,
	// e-mail addresses, annotations) and silently drop that line.
	endOfChunkMatcher := regexp.MustCompile(`^\s*@(\s|$)`)

	var document string
	var chunkName string
	chunks := make(map[string]string)

	// processLine classifies one line: chunk start, chunk end, chunk body or
	// documentation.
	processLine := func(line string) {
		if matches := chunkMatcher.FindStringSubmatch(line); matches != nil {
			chunkName = matches[1]
			chunks[chunkName] = ""
			return
		}
		if endOfChunkMatcher.MatchString(line) {
			chunkName = ""
			return
		}
		if chunkName != "" {
			chunks[chunkName] += line
		} else {
			document += line
		}
	}

	for {
		line, err := fileBuf.ReadString('\n')
		if err != nil && err != io.EOF {
			panic(err)
		}
		// The last line may lack a trailing newline; it still has to go
		// through marker detection, otherwise a final "@" ends up in the
		// chunk body.
		processLine(line)
		if err == io.EOF {
			break
		}
	}
	return chunks, document
}


// expandChunks resolves chunk references. Every "<<name>>" occurring in a
// chunk body is replaced by the fully expanded body of the chunk called
// name. References to chunks that are undefined or empty are left in the
// text unchanged.
//
// It returns a new map holding the expanded body for every key of chunks;
// the input map is not modified. expandChunks panics with a descriptive
// message when chunks reference each other cyclically, since such a
// definition has no finite expansion.
func expandChunks(chunks map[string]string) map[string]string {
	chunkMatcher := regexp.MustCompile("<<([^>]+)>>")

	expandedChunks := make(map[string]string, len(chunks))
	// inProgress holds the names currently being expanded; meeting one of
	// them again means the definitions form a cycle.
	inProgress := make(map[string]bool)

	var expandChunk func(name string) string

	// expandBody substitutes every reference in b in a single pass, so text
	// that was already expanded is never scanned again.
	expandBody := func(b string) string {
		return chunkMatcher.ReplaceAllStringFunc(b, func(ref string) string {
			name := strings.TrimSuffix(strings.TrimPrefix(ref, "<<"), ">>")
			if chunks[name] == "" {
				return ref
			}
			return expandChunk(name)
		})
	}

	// expandChunk returns the expanded body of the named chunk, computing
	// it at most once.
	expandChunk = func(name string) string {
		if done, ok := expandedChunks[name]; ok {
			return done
		}
		if inProgress[name] {
			panic("lit: cyclic chunk reference involving <<" + name + ">>")
		}
		inProgress[name] = true
		result := expandBody(chunks[name])
		delete(inProgress, name)
		expandedChunks[name] = result
		return result
	}

	for name := range chunks {
		expandChunk(name)
	}

	return expandedChunks
}
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<
<










































































































































































































































































































Added lit.go.w.










































































































































































































































































































































































































































































































































































>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
# Lit, simple tool for language agnostic literate programming

Literate programming is a technique introduced by Donald Knuth many years ago.
Nowadays literate programming is almost dead, which is really sad in my opinion. This little application is designed to bring
the literate programming approach to almost any programming language.

I strongly recommend reading Knuth's original paper on literate programming (http://www.literateprogramming.com/knuthweb.pdf).

Noweb.py by Jonathan Aquino was the inspiration for this humble piece of code.

## Main idea
It was surprisingly easy to implement this tool. The main idea is to parse the file in a single pass, line by line, detecting
chunks and using a `Map` to store their names and bodies.
The second stage of processing recursively 'expands' the chunk bodies, replacing references to other chunks with their contents to obtain the full program.

## Used packages
To process files this application uses the os, io, bufio and regexp packages. The flag package is used to parse command line parameters. It's a bit shitty, but it's ok.

<<Used packages>>=
	"regexp"
	"flag"
	"bufio"
	"fmt"
	"os"
	"io"
	"strings"
@

# Run flow
## Parsing command line parameters

Right after start the application tries to parse the command line parameters. If some vital data is not defined, the application shows usage and exits.
There are 4 parameters overall:
* --src-out: File name for code output (tangle output)
* --doc-out: File name for document output (weave output)
* --default-chunk: Default chunk name. The chunk with this name is considered to hold the main program code. By default its name is "*"
* The first argument after all options is taken as the name of the file to parse

As mentioned above, we use the `flag` package to parse the command line. A variable is defined for every command line argument. The default value of the src-out and doc-out parameters is the empty string.
In Go this is the "zero value" of a string, so we can detect when the user omits one or the other parameter. The default value of default-chunk is always "*".

<<Command line parsing>>=
	var sourceFile string
	var docFile string
	var parsingFile string
	var defaultChunk string

	flag.Usage = func() {
		fmt.Fprintf(os.Stderr, "Usage of lit: lit [options] file-to-parse.w\n")
		flag.PrintDefaults()
	}

	flag.StringVar(&defaultChunk, "default-chunk", "*", "Default program chunk")
	flag.StringVar(&sourceFile, "src-out", "", "File to write source code")
	flag.StringVar(&docFile, "doc-out", "", "File to write document")
	flag.Parse()
@


# Check command line options validity
If there is no file to parse we can't do anything except show usage. Another case is when both src-out and doc-out are missing. In this situation the application shows usage too, because
it can't do anything useful with the given file.

<<Parameters check>>=
	if len(flag.Args()) > 0 {
		parsingFile = flag.Arg(0)
	}

	if parsingFile == "" || (sourceFile == "" && docFile == "") {
		flag.Usage()
		os.Exit(0)
	}
@

But if /only one/ of them is missing, the application can dump the source code or the documentation without dumping the other part.

For example, if you want to generate both documentation and source from some file `source.w`, you should run:
	
	lit --src-out source.c --doc-out source.tex source.w

But if you need only source, you can omit doc-out parameter:
	
	lit --src-out source.c source.w

Same works for doc-out.

<<Processing command line>>=
	if sourceFile != "" {
		sourceOutput, err := os.Create(sourceFile)
		defer sourceOutput.Close()

		if err != nil {
			panic(err)
		}
		sourceOutput.WriteString(chunks[defaultChunk])
	}

	if docFile != "" {
		docOutput, err := os.Create(docFile)
		defer docOutput.Close()	

		if err != nil {
			panic(err)
		}
		docOutput.WriteString(document)	
	}
@


## File parsing

The file parsing process is extremely straightforward. After the file is opened we read it line by line, trying to match each line against one of the regular expressions defined below.

<<Open file and buf reader>>=
	f, err := os.Open(fileName)
	if err != nil {
		panic(err)
	}
	defer f.Close()

	fileBuf := bufio.NewReader(f)
@

Expression "<<([^>]+)>>=" is used to match beginning of chunk, "@" for end of chunk.

<<Define regular expressions>>=
	var (
		endOfChunkMatcher *regexp.Regexp
		chunkMatcher *regexp.Regexp
		regexpError error
	)

	chunkMatcher, regexpError = regexp.Compile("<<([^>]+)>>=")
	if regexpError != nil {
		panic(regexpError)
	}
	endOfChunkMatcher, regexpError = regexp.Compile("@")
	if regexpError != nil {
		panic(regexpError)
	}
@

After a chunk beginning is found we extract its name from the submatches and store it in the variable `chunkName`; after that, any line not matched by either regular expression is appended to the entry of the Map named `chunks`
with the value of `chunkName` as the key.
If a line matches the end-of-chunk expression, `chunkName` is reset to its zero value. If neither expression matches a line and `chunkName` holds its zero value, that line is appended to the `document` string variable.

<<Reading and processing lines>>=
	for {
		line, err := fileBuf.ReadString('\n')
		if err == io.EOF {
			processLine(line)
			break
		} else if err != nil {
			panic(err)
		}
		var matches = chunkMatcher.FindStringSubmatch(line)
		if matches != nil {
			chunkName = matches[1]
			chunks[chunkName] = ""
		} else if matches = endOfChunkMatcher.FindStringSubmatch(line); matches != nil {
			chunkName = ""
		} else {
			processLine(line)
		}
	}
@

As its result, the `parseFile` function returns the `document` string and the `chunks` map.

<<File parsing definition>>=
func parseFile(fileName string) (map[string]string, string) {

	<<Open file and buf reader>>

	<<Define regular expressions>>
	
	var document string
	var chunkName string
	var chunks = make(map[string]string)

	<<Proc line closure>>
	<<Reading and processing lines>>

	return chunks, document
}
@

To simplify the processing of every line, a closure `processLine` is defined. This closure decides where the line being processed goes: to the chunk body or to the documentation.

<<Proc line closure>>=
	var processLine = func(line string) {
		if chunkName != "" {
			chunks[chunkName] += line
		} else {
			document += line
		}
	}
@


# Expanding chunks

Every chunk body can contain any number of links to other chunks. To build the whole program from the literate source we need to "expand" every chunk body by replacing links to other chunks with their bodies.
First of all we define the data structure for the "final" expanded chunks, `expandedChunks`. After that we define the regular expression which matches "links" to other chunks.

<<Define expanded chunks and regexp>>=
	var expandedChunks = make(map[string]string)
	chunkMatcher, err := regexp.Compile("<<([^>]+)>>")
	if err != nil {
		panic(err)
	}
@

The expand-body closure defined inside the `expandChunks` function takes a body as an argument and searches it for links to other chunks. It then takes every linked chunk name and replaces the link with
the result of a recursive self-invocation on the linked chunk's body.
If there are no linked chunks the closure just returns the given body. Maybe I should check whether `expandedChunks` already has an expanded body for the linked chunk to avoid extra work.

<<Define expand body closure>>=
	var expandBody func(b string) string
	expandBody = func(b string) string {
		var newBody = b
		submatches := chunkMatcher.FindAllStringSubmatch(b, -1)
		if submatches != nil {
			for _, matches := range submatches {
				fullChunk, chunkName := matches[0], matches[1]
				if chunks[chunkName] != "" {
					newBody = strings.Replace(newBody, fullChunk, expandBody(chunks[chunkName]), -1)
				}
			}
		}
		return newBody
	}
@

<<Expanding chunks definition>>=
func expandChunks(chunks map[string]string) map[string]string {

	<<Define expanded chunks and regexp>>

	<<Define expand body closure>>

	for name, body := range chunks {
		expandedChunks[name] = expandBody(body)
	}

	return expandedChunks
}
@

# Main program structure

<<*>>=
package main

import (
<<Used packages>>
)

func main() {
	<<Command line parsing>>
	<<Parameters check>>

	chunks, document := parseFile(parsingFile)
	chunks = expandChunks(chunks)

	<<Processing command line>>
}

<<File parsing definition>>
<<Expanding chunks definition>>

@