92 lines
3.1 KiB
Swift
92 lines
3.1 KiB
Swift
/**
|
|
* Splash
|
|
* Copyright (c) John Sundell 2018
|
|
* MIT license - see LICENSE.md
|
|
*/
|
|
|
|
import Foundation
|
|
|
|
/// This class acts as the main API entry point for Splash. Using it,
|
|
/// any code string can be highlighted to any desired format, using
|
|
/// any language grammar. Per default, Swift's langauge grammar is used.
|
|
/// To initialize this class, pass the desired output format, such as
|
|
/// `AttributedStringOutputFormat` or `HTMLOutputFormat`, or a custom
|
|
/// implementation. One syntax highlighter may be reused multiple times.
|
|
public struct SyntaxHighlighter<Format: OutputFormat> {
|
|
private let format: Format
|
|
private let grammar: Grammar
|
|
private let tokenizer = Tokenizer()
|
|
|
|
/// Initialize an instance with the desired output format.
|
|
/// If no grammar is passed, then Swift's grammar is used.
|
|
public init(format: Format, grammar: Grammar = SwiftGrammar()) {
|
|
self.format = format
|
|
self.grammar = grammar
|
|
}
|
|
|
|
/// Highlight the given code, returning output as specified by the
|
|
/// syntax highlighter's `Format`.
|
|
public func highlight(_ code: String) -> Format.Builder.Output {
|
|
var builder = format.makeBuilder()
|
|
var state: (token: String, tokenType: TokenType?)?
|
|
|
|
func handle(_ token: String, ofType type: TokenType?, trailingWhitespace: String?) {
|
|
guard let whitespace = trailingWhitespace else {
|
|
state = (token, type)
|
|
return
|
|
}
|
|
|
|
builder.addToken(token, ofType: type)
|
|
builder.addWhitespace(whitespace)
|
|
state = nil
|
|
}
|
|
|
|
for segment in tokenizer.segmentsByTokenizing(code, delimiters: grammar.delimiters) {
|
|
let token = segment.tokens.current
|
|
let whitespace = segment.trailingWhitespace
|
|
|
|
guard !token.isEmpty else {
|
|
whitespace.map { builder.addWhitespace($0) }
|
|
continue
|
|
}
|
|
|
|
let tokenType = typeOfToken(in: segment)
|
|
|
|
guard var currentState = state else {
|
|
handle(token, ofType: tokenType, trailingWhitespace: whitespace)
|
|
continue
|
|
}
|
|
|
|
guard currentState.tokenType == tokenType else {
|
|
builder.addToken(currentState.token, ofType: currentState.tokenType)
|
|
handle(token, ofType: tokenType, trailingWhitespace: whitespace)
|
|
continue
|
|
}
|
|
|
|
currentState.token.append(token)
|
|
handle(currentState.token, ofType: tokenType, trailingWhitespace: whitespace)
|
|
}
|
|
|
|
if let lastState = state {
|
|
builder.addToken(lastState.token, ofType: lastState.tokenType)
|
|
}
|
|
|
|
return builder.build()
|
|
}
|
|
|
|
private func typeOfToken(in segment: Segment) -> TokenType? {
|
|
let rule = grammar.syntaxRules.first { $0.matches(segment) }
|
|
return rule?.tokenType
|
|
}
|
|
}
|
|
|
|
private extension OutputBuilder {
|
|
mutating func addToken(_ token: String, ofType type: TokenType?) {
|
|
if let type = type {
|
|
addToken(token, ofType: type)
|
|
} else {
|
|
addPlainText(token)
|
|
}
|
|
}
|
|
}
|