/** * Splash * Copyright (c) John Sundell 2018 * MIT license - see LICENSE.md */ import Foundation /// This class acts as the main API entry point for Splash. Using it, /// any code string can be highlighted to any desired format, using /// any language grammar. Per default, Swift's langauge grammar is used. /// To initialize this class, pass the desired output format, such as /// `AttributedStringOutputFormat` or `HTMLOutputFormat`, or a custom /// implementation. One syntax highlighter may be reused multiple times. public struct SyntaxHighlighter { private let format: Format private let grammar: Grammar private let tokenizer = Tokenizer() /// Initialize an instance with the desired output format. /// If no grammar is passed, then Swift's grammar is used. public init(format: Format, grammar: Grammar = SwiftGrammar()) { self.format = format self.grammar = grammar } /// Highlight the given code, returning output as specified by the /// syntax highlighter's `Format`. public func highlight(_ code: String) -> Format.Builder.Output { var builder = format.makeBuilder() var state: (token: String, tokenType: TokenType?)? func handle(_ token: String, ofType type: TokenType?, trailingWhitespace: String?) { guard let whitespace = trailingWhitespace else { state = (token, type) return } builder.addToken(token, ofType: type) builder.addWhitespace(whitespace) state = nil } for segment in tokenizer.segmentsByTokenizing(code, using: grammar) { let token = segment.tokens.current let whitespace = segment.trailingWhitespace guard !token.isEmpty else { whitespace.map { builder.addWhitespace($0) } continue } let tokenType = typeOfToken(in: segment) guard var currentState = state else { handle(token, ofType: tokenType, trailingWhitespace: whitespace) continue } guard currentState.tokenType == tokenType else { builder.addToken(currentState.token, ofType: currentState.tokenType) handle(token, ofType: tokenType, trailingWhitespace: whitespace) continue } currentState.token.append(token) handle(currentState.token, ofType: tokenType, trailingWhitespace: whitespace) } if let lastState = state { builder.addToken(lastState.token, ofType: lastState.tokenType) } return builder.build() } private func typeOfToken(in segment: Segment) -> TokenType? { let rule = grammar.syntaxRules.first { $0.matches(segment) } return rule?.tokenType } } private extension OutputBuilder { mutating func addToken(_ token: String, ofType type: TokenType?) { if let type = type { addToken(token, ofType: type) } else { addPlainText(token) } } }