1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83
|
# encoding: utf-8
# frozen_string_literal: true
require 'open-uri'
# TODO: Newer versions require parsing Attributes.td separately.
LLVM_SYNTAX_URI = "https://raw.githubusercontent.com/llvm/llvm-project/9de7b93bc00804585a8e36fc35f6449329d8225a/llvm/lib/AsmParser/LLLexer.cpp"
LLVM_KEYWORDS_FILE = "./lib/rouge/lexers/llvm/keywords.rb"
namespace :builtins do
task :llvm do
input = URI.open(LLVM_SYNTAX_URI) { |f| f.read }
generator = Rouge::Tasks::Builtins::LLVM.new
keywords = generator.extract_keywords(input)
output = generator.render_output(keywords)
File.write(LLVM_KEYWORDS_FILE, output)
end
end
module Rouge
module Tasks
module Builtins
class LLVM
def extract_keywords(input)
keywords = Hash.new { |h,k| h[k] = Array.new }
kind = nil
input.each_line(";") do |line|
if line =~ /#define (.*?)\(/
case $1
when "KEYWORD"
kind = "keywords"
when "TYPEKEYWORD"
kind = "types"
when "INSTKEYWORD"
kind = "instructions"
else
kind = nil
end
next
end
next unless kind && line =~ /KEYWORD\("?([^)",]+)/
keywords[kind].push $1
end
# Does not use TYPEKEYWORD() due to special handling.
keywords["types"].push "ptr"
keywords.transform_values! { |v| v.sort }
end
def render_output(keywords, &b)
return enum_for(:render_output, keywords).to_a.join("\n") unless b
yield "# encoding: utf-8"
yield "# frozen_string_literal: true"
yield ""
yield "# DO NOT EDIT"
yield "# This file is automatically generated by `rake builtins:llvm`."
yield "# See tasks/builtins/llvm.rake for more info."
yield ""
yield "module Rouge"
yield " module Lexers"
yield " class LLVM"
keywords.each do |k,v|
yield " def self.#{k}"
yield " @#{k} ||= Set.new #{v.inspect}"
yield " end"
yield ""
end
yield " end"
yield " end"
yield "end"
yield ""
end
end
end
end
end
|