rf-web/vendor/bundle/gems/rouge-3.12.0/lib/rouge/lexers/cython.rb
2019-10-21 10:18:17 +02:00

152 lines
4.1 KiB
Ruby

# -*- coding: utf-8 -*- #
# frozen_string_literal: true
module Rouge
module Lexers
load_lexer 'python.rb'
class Cython < Python
title "Cython"
desc "Cython and Pyrex source code (cython.org)"
tag 'cython'
aliases 'pyx', 'pyrex'
filenames '*.pyx', '*.pxd', '*.pxi'
mimetypes 'text/x-cython', 'application/x-cython'
def initialize(opts = {})
super opts
@indentation = nil
end
def self.keywords
@keywords ||= super + %w(
by except? fused gil nogil
)
end
def self.c_keywords
@ckeywords ||= %w(
public readonly extern api inline enum union
)
end
identifier = /[a-z_]\w*/i
dotted_identifier = /[a-z_.][\w.]*/i
prepend :root do
rule %r/cp?def|ctypedef/ do
token Keyword
push :c_definitions
push :c_start
end
rule %r/(from)((?:\\\s|\s)+)(#{dotted_identifier})((?:\\\s|\s)+)(cimport)/ do
groups Keyword::Namespace,
Text,
Name::Namespace,
Text,
Keyword::Namespace
end
rule %r/(cimport)(\s+)(#{dotted_identifier})/ do
groups Keyword::Namespace, Text, Name::Namespace
end
rule %r/(struct)((?:\\\s|\s)+)/ do
groups Keyword, Text
push :classname
end
mixin :func_call_fix
rule %r/[(,]/, Punctuation, :c_start
end
prepend :classname do
rule %r/(?:\\\s|\s)+/, Text
end
prepend :funcname do
rule %r/(?:\\\s|\s)+/, Text
end
# This is a fix for the way that function calls are lexed in the Python
# lexer. This should be moved to the Python lexer once confirmed that it
# does not cause any regressions.
state :func_call_fix do
rule %r/#{identifier}(?=\()/ do |m|
if self.class.keywords.include? m[0]
token Keyword
elsif self.class.exceptions.include? m[0]
token Name::Builtin
elsif self.class.builtins.include? m[0]
token Name::Builtin
elsif self.class.builtins_pseudo.include? m[0]
token Name::Builtin::Pseudo
else
token Name::Function
end
end
end
# The Cython lexer adds three states to those already in the Python lexer.
# Calls to `cdef`, `cpdef` and `ctypedef` move the lexer into the :c_start
# state. The primary purpose of this state is to highlight datatypes. Once
# this has been done, the lexer moves to the :c_definitions state where
# the majority of text in a definition is lexed. Finally, newlines cause
# the lexer to move to :c_indent. This state is used to check whether we
# have moved out of a C block.
state :c_start do
rule %r/[^\S\n]+/, Text
rule %r/cp?def|ctypedef/, Keyword
rule %r/(?:un)?signed/, Keyword::Type
# This rule matches identifiers that could be type declarations. The
# lookahead matches (1) pointers, (2) arrays and (3) variable names.
rule %r/#{identifier}(?=(?:\*+)|(?:[ \t]*\[)|(?:[ \t]+\w))/ do |m|
if self.class.keywords.include? m[0]
token Keyword
pop!
elsif %w(def).include? m[0]
token Keyword
goto :funcname
elsif %w(struct class).include? m[0]
token Keyword::Reserved
goto :classname
elsif self.class.c_keywords.include? m[0]
token Keyword::Reserved
else
token Keyword::Type
pop!
end
end
rule(//) { pop! }
end
state :c_definitions do
rule %r/\n/, Text, :c_indent
mixin :root
end
state :c_indent do
rule %r/[ \t]+/ do |m|
token Text
goto :c_start
if @indentation.nil?
@indentation = m[0]
elsif @indentation.length > m[0].length
@indentation = nil
pop! 2 # Pop :c_start and :c_definitions
end
end
rule(//) { @indentation = nil; reset_stack }
end
end
end
end