Merge branch 'dev'

input.block 被抽象成一个接口，方便一些特殊语言的实现；新的语言支持：pascal/delphi；
caixw · Jul 11, 2016 · 59c225e · 59c225e
2 parents cd87c66 + b57c0d6
commit 59c225e
Show file tree

Hide file tree

Showing 18 changed files with 690 additions and 330 deletions.
diff --git a/README.md b/README.md
@@ -2,7 +2,7 @@ apidoc [![Build Status](https://travis-ci.org/caixw/apidoc.svg?branch=master)](h
 ======
 
 apidoc 是一个简单的 RESTful API 文档生成工具，它从代码注释中提取特定格式的内容，生成文档。
-目前支持支持以下语言：C#、C/C++、Go、Java、Javascript、Perl、PHP、Python、Ruby、Rust 和 Swift
+目前支持以下语言：C#、C/C++、Go、Java、Javascript、Pascal、Perl、PHP、Python、Ruby、Rust 和 Swift
 
 具体文档可参考：http://apidoc.tools
 
@@ -45,6 +45,12 @@ go get github.com/caixw/apidoc
 
 
 
+### 添加新语言
+
+若需要添加对新语言的支持，可以在 `input/lang.go` 中，根据要求添加新语言的定义即可。
+
+
+
 ### 集成
 
 若需要将 apidoc 当作包集成到其它 Go 程序中，可分别引用 `input` 和 `output` 的相关函数：

diff --git a/app/app.go b/app/app.go
@@ -17,7 +17,7 @@ const (
 	// 版本号
 	//
 	// 版本号按照 http://semver.org 中的规则
-	Version = "2.15.5+20160708"
+	Version = "2.16.6+20160712"
 
 	// 程序的正式名称
 	Name = "apidoc"
@@ -43,6 +43,9 @@ const (
 
 	// 输出的 profile 文件的名称
 	Profile = "apidoc.prof"
+
+	// 需要解析的最小代码块，小于此值，将不作解析
+	MiniSize = len("@api ")
 )
 
 // Message 向终端输出不同颜色的提示信息

diff --git a/app/app_test.go b/app/app_test.go
@@ -5,6 +5,7 @@
 package app
 
 import (
+	"strings"
 	"testing"
 
 	"github.com/issue9/assert"
@@ -16,8 +17,13 @@ import (
 func TestConsts(t *testing.T) {
 	a := assert.New(t)
 
+	a.True(version.SemVerValid(Version))
+	a.True(len(Name) > 0)
 	a.True(is.URL(RepoURL))
 	a.True(is.URL(OfficialURL))
-
-	a.True(version.SemVerValid(Version))
+	a.True(len(ConfigFilename) > 0).True(strings.IndexAny(ConfigFilename, "/\\") < 0)
+	a.True(len(DefaultTitle) > 0)
+	a.True(len(DefaultGroupName) > 0).True(strings.IndexAny(DefaultGroupName, "/\\") < 0)
+	a.True(len(Profile) > 0).True(strings.IndexAny(Profile, "/\\") < 0)
+	a.True(MiniSize >= 0)
 }
diff --git a/input/block.go b/input/block.go
@@ -0,0 +1,166 @@
+// Copyright 2016 by caixw, All rights reserved.
+// Use of this source code is governed by a MIT
+// license that can be found in the LICENSE file.
+
+package input
+
+import (
+	"strings"
+	"unicode"
+	"unicode/utf8"
+)
+
+// Possible values of block.Type.
+const (
+	blockTypeNone     int8 = iota
+	blockTypeString        // String literal; it is ignored.
+	blockTypeSComment      // Single-line comment.
+	blockTypeMComment      // Multi-line comment.
+)
+
+// blocker defines every operation needed to parse one kind of code block.
+// BeginFunc locates a matching start position, and
+// EndFunc locates the end position and returns the content of the block.
+type blocker interface {
+	BeginFunc(l *lexer) bool         // Reports whether l's current position matches the start of this blocker.
+	EndFunc(l *lexer) ([]rune, bool) // Reports whether the end of this blocker was found; on a match it returns the text in between.
+}
+
+// block describes the three language-dependent kinds of code block: single-line comment, multi-line comment and string.
+type block struct {
+	Type   int8   // Kind of block: string, single-line comment or multi-line comment.
+	Begin  string // Text that opens the block.
+	End    string // Text that closes the block; not needed for single-line comments.
+	Escape string // Escape sequence, used only when Type is blockTypeString; meaningless for other types.
+}
+
+func (b *block) BeginFunc(l *lexer) bool {
+	return l.match(b.Begin) // Result of matching b.Begin against the lexer; match is defined outside this file.
+}
+
+// EndFunc returns the characters from the current position to the end of the block, dispatching on b.Type.
+// The bool reports whether the end marker was found; an unrecognised Type yields (nil, false).
+func (b *block) EndFunc(l *lexer) ([]rune, bool) {
+	switch b.Type {
+	case blockTypeString:
+		return b.endString(l)
+	case blockTypeMComment:
+		return b.endMComments(l)
+	case blockTypeSComment:
+		return b.endSComments(l)
+	}
+
+	return nil, false
+}
+
+// endString scans forward from l's current position until the end string defined in b is matched,
+// leaving l's pointer at that position. The string content is never returned (the rune slice is always nil).
+// It returns true when the terminator was found and false when end of input was reached first.
+func (b *block) endString(l *lexer) ([]rune, bool) {
+LOOP:
+	for {
+		switch {
+		case l.atEOF():
+			break LOOP
+		case (len(b.Escape) > 0) && l.match(b.Escape):
+			l.next() // NOTE(review): presumably skips the escaped character, assuming match consumes b.Escape — confirm.
+		case l.match(b.End):
+			return nil, true
+		default:
+			l.next()
+		}
+	} // end for
+	return nil, false
+}
+
+// endSComments collects consecutive single-line comments of the same kind, starting at l's current position; the bool is always true.
+func (b *block) endSComments(l *lexer) ([]rune, bool) {
+	// Skip every whitespace character except the newline.
+	skipSpace := func() {
+		for {
+			r, w := utf8.DecodeRune(l.data[l.pos:])
+			if !unicode.IsSpace(r) || r == '\n' {
+				break
+			}
+			l.pos += w
+		}
+	} // end skipSpace
+
+	ret := make([]rune, 0, 1000)
+	for {
+		for { // Read the content of one line into ret.
+			r := l.next()
+			ret = append(ret, r)
+
+			if l.atEOF() || r == '\n' {
+				break
+			}
+		}
+
+		skipSpace()            // Drop the leading whitespace of the new line, if there is any.
+		if !l.match(b.Begin) { // The next line is not an adjoining comment, so stop matching here.
+			break
+		}
+	}
+
+	if len(ret) > 0 { // Hand the final newline back to the lexer. NOTE(review): ret is never empty here, so this also steps back one byte when the last rune read was not '\n' — confirm intended.
+		l.pos--
+	}
+
+	return ret, true
+}
+
+// endMComments returns every character between l's current position and the b.End marker.
+// filterSymbols is applied to each line; reaching end of input before b.End yields (nil, false).
+func (b *block) endMComments(l *lexer) ([]rune, bool) {
+	lines := make([][]rune, 0, 20)
+	line := make([]rune, 0, 100)
+
+LOOP:
+	for {
+		switch {
+		case l.atEOF():
+			return nil, false
+		case l.match(b.End):
+			lines = append(lines, filterSymbols(line, b.Begin))
+			break LOOP
+		default:
+			r := l.next()
+			line = append(line, r)
+			if r == '\n' {
+				lines = append(lines, filterSymbols(line, b.Begin))
+				line = make([]rune, 0, 100)
+			}
+		}
+	}
+
+	ret := make([]rune, 0, 1000)
+	for _, v := range lines {
+		ret = append(ret, v...)
+	}
+	return ret, true
+}
+
+// filterSymbols removes a leading `whitespace + symbol + whitespace` run from the start of line, if present.
+// symbol is any single character contained in charset.
+func filterSymbols(line []rune, charset string) []rune {
+	for k, v := range line {
+		if unicode.IsSpace(v) { // Skip whitespace at the start of the line.
+			continue
+		}
+
+		// The first non-space character is not one of the symbols: return the data unchanged.
+		if strings.IndexRune(charset, v) < 0 {
+			return line
+		}
+
+		// The character right after the symbol is whitespace: drop everything up to and including it.
+		if len(line) > k+1 && unicode.IsSpace(line[k+1]) {
+			return line[k+2:]
+		} else {
+			return line
+		}
+	}
+
+	return line
+}