Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat(utils): Add parser for wiki #54

Merged
merged 12 commits into from
Mar 18, 2022
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions .github/workflows/unit-test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,8 @@ jobs:
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v2
with:
submodules: recursive
- uses: pnpm/[email protected]
with:
version: '6'
Expand Down
3 changes: 3 additions & 0 deletions .gitmodules
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
[submodule "packages/utils/wiki/__test__/wiki-syntax-spec"]
path = packages/utils/wiki/__test__/wiki-syntax-spec
url = https://github.com/bangumi/wiki-syntax-spec
1 change: 1 addition & 0 deletions packages/utils/index.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
export { default as parseWiki } from './wiki/parser'
7 changes: 6 additions & 1 deletion packages/utils/package.json
Original file line number Diff line number Diff line change
@@ -1,5 +1,10 @@
{
"name": "@bangumi/utils",
"version": "0.0.0",
"private": true
"private": true,
"main": "index.ts",
"devDependencies": {
"@types/js-yaml": "^4.0.5",
"js-yaml": "^4.1.0"
}
}
45 changes: 45 additions & 0 deletions packages/utils/wiki/__test__/parser.test.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,45 @@
import path from 'path'
import fs from 'fs'
import parse from '../parser'
import yaml from 'js-yaml'

const testsDir = path.resolve(__dirname, './wiki-syntax-spec/tests/')
const validTestDir = path.resolve(testsDir, 'valid')
const invalidTestDir = path.resolve(testsDir, 'invalid')

const validTestFiles = fs.readdirSync(validTestDir)
const inValidTestFiles = fs.readdirSync(invalidTestDir)

describe('Wiki syntax parser expected to be valid', () => {
validTestFiles.forEach(file => {
const prefix = file.split('.')[0]
const suffix = file.split('.')[1]
if (suffix !== 'wiki') {
return
}
it(`${prefix} should be valid`, () => {
const testFilePath = path.resolve(validTestDir, file)
const expectedFilePath = path.resolve(validTestDir, `${prefix}.yaml`)

const testContent = fs.readFileSync(testFilePath, 'utf8')
const expectedContent = fs.readFileSync(expectedFilePath, 'utf8')

const result = parse(testContent)
const expected = yaml.load(expectedContent)

expect(result).toEqual(expected)
})
})
})

describe('Wiki syntax parser expected to be inValid', () => {
inValidTestFiles.forEach(file => {
const prefix = file.split('.')[0]
it(`${prefix} should be invalid`, () => {
const testFilePath = path.resolve(invalidTestDir, file)
const testContent = fs.readFileSync(testFilePath, 'utf8')

expect(() => parse(testContent)).toThrowError()
})
})
})
1 change: 1 addition & 0 deletions packages/utils/wiki/__test__/wiki-syntax-spec
Submodule wiki-syntax-spec added at fe7435
17 changes: 17 additions & 0 deletions packages/utils/wiki/error.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
export const GlobalPrefixError = 'missing prefix \'{{Infobox\' at the start'
export const GlobalSuffixError = 'missing suffix \'}}\' at the end'
export const ArrayNoCloseError = 'array should be closed by \'}\''
export const ArrayItemWrappedError = 'array item should be wrapped by \'[]\''
export const ExpectingNewFieldError = 'missing \'|\' to start a new field'
export const ExpectingSignEqualError = 'missing \'=\' to separate field name and value'

export class WikiSyntaxError extends Error {
line: string | null
lino: number | null

constructor (lino: number | null, line: string | null, message: string) {
super(message)
this.line = line
this.lino = lino
}
}
108 changes: 108 additions & 0 deletions packages/utils/wiki/parser.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,108 @@
import { Wiki, WikiArrayItem, WikiItem, WikiItemType } from './types'
import {
ArrayItemWrappedError,
ArrayNoCloseError,
ExpectingNewFieldError,
ExpectingSignEqualError,
GlobalPrefixError,
GlobalSuffixError,
WikiSyntaxError
} from './error'

/* should start with `{{Infobox` and end with `}}` */
const prefix = '{{Infobox'
const suffix = '}}'

export default function parse (s: string): Wiki {
const wiki: Wiki = { type: '', data: [] }

const strTrim = s.trim().replace(/\r\n/g, '\n')

if (strTrim === '') {
return wiki
}

if (!strTrim.startsWith(prefix)) {
throw new WikiSyntaxError(null, null, GlobalPrefixError)
}
if (!strTrim.endsWith(suffix)) {
throw new WikiSyntaxError(null, null, GlobalSuffixError)
}

const arr = strTrim.split('\n')
wiki.type = parseType(arr[0])

/* split content between {{Infobox xxx and }} */
const fields = arr.slice(1, -1)

let inArray = false
for (let i = 0; i < fields.length; ++i) {
const line = fields[i].trim()
const lino = i + 2

if (line === '') {
continue
}
/* new field */
if (line[0] === '|') {
if (inArray) {
throw new WikiSyntaxError(lino, line, ArrayNoCloseError)
}
const meta = parseNewField(lino, line)
inArray = meta[2] === 'array'
const field = new WikiItem(...meta)
wiki.data.push(field)
/* is Array item */
} else if (inArray) {
if (line[0] === '}') {
inArray = false
continue
}
if (i === fields.length - 1) {
throw new WikiSyntaxError(lino, line, ArrayNoCloseError)
}
wiki.data[wiki.data.length - 1]!.values!.push(
new WikiArrayItem(
...parseArrayItem(lino, line)
)
)
} else {
throw new WikiSyntaxError(lino, line, ExpectingNewFieldError)
}
}
return wiki
}

const parseType = (line: string): string => {
return line.slice(prefix.length, !line.includes('}}') ? undefined : line.indexOf('}}')).trim()
}

const parseNewField = (lino: number, line: string): [string, string, WikiItemType] => {
const str = line.slice(1)
const index = str.indexOf('=')

if (index === -1) {
throw new WikiSyntaxError(lino, line, ExpectingSignEqualError)
}

const key = str.slice(0, index).trim()
const value = str.slice(index + 1).trim()
switch (value) {
case '{':
return [key, '', 'array']
default :
return [key, value, 'object']
}
}

const parseArrayItem = (lino: number, line: string): [string, string] => {
if (line[0] !== '[' || line[line.length - 1] !== ']') {
throw new WikiSyntaxError(lino, line, ArrayItemWrappedError)
}
const content = line.slice(1, line.length - 1)
const index = content.indexOf('|')
if (index === -1) {
return ['', content.trim()]
}
return [content.slice(0, index).trim(), content.slice(index + 1).trim()]
}
36 changes: 36 additions & 0 deletions packages/utils/wiki/types.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
export interface Wiki {
type: string
data: WikiItem[]
}

export type WikiItemType = 'array' | 'object'

export class WikiArrayItem {
k?: string
v?: string

constructor (k: string, v: string) {
k && (this.k = k)
this.v = v
}
}

export class WikiItem {
key?: string
value?: string
array?: boolean
values?: WikiArrayItem[]

constructor (key: string, value: string, type: WikiItemType) {
this.key = key
switch (type) {
case 'array':
this.array = true
this.values = []
break
case 'object':
this.value = value
break
}
}
}
22 changes: 21 additions & 1 deletion pnpm-lock.yaml

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.