Emacs settings.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 

276 lines
8.1 KiB

;;; language-id.el --- Library to work with programming language identifiers -*- lexical-binding: t -*-
;; Author: Lassi Kortela <lassi@lassi.io>
;; URL: https://github.com/lassik/emacs-language-id
;; Package-Version: 20220613.1156
;; Package-Commit: cbd5b8fffa8c09f86d8b77f8d3f5e6f4ccd82bc4
;; Version: 0.19
;; Package-Requires: ((emacs "24.3"))
;; Keywords: languages util
;; SPDX-License-Identifier: ISC
;; This file is not part of GNU Emacs.
;;; Commentary:
;; language-id is a small, focused library that helps other Emacs
;; packages identify the programming languages and markup languages
;; used in Emacs buffers. The main point is that it contains an
;; evolving table of language definitions that doesn't need to be
;; replicated in other packages.
;; Right now there is only one public function, `language-id-buffer'.
;; It looks at the major mode and other variables and returns the
;; language's GitHub Linguist identifier. We can add support for
;; other kinds of identifiers if there is demand.
;; This library does not do any statistical text matching to guess the
;; language.
;;; Code:
(require 'cl-lib)
(defvar language-id--file-name-extension nil
"Internal variable for file name extension during lookup.")
;; <https://raw.githubusercontent.com/github/linguist/master/lib/linguist/languages.yml>
(defconst language-id--definitions
'(
;;; Definitions that need special attention to precedence order.
;; It is not uncommon for C++ mode to be used when writing Cuda.
;; In this case, the only way to correctly identify Cuda is by
;; looking at the extension.
("Cuda"
(c++-mode
(language-id--file-name-extension ".cu"))
(c++-mode
(language-id--file-name-extension ".cuh")))
;; json-mode is derived from javascript-mode.
("JSON5"
(json-mode
(language-id--file-name-extension ".json5"))
(web-mode
(web-mode-content-type "json")
(web-mode-engine "none")
(language-id--file-name-extension ".json5")))
("JSON"
json-mode
jsonian-mode
(web-mode
(web-mode-content-type "json")
(web-mode-engine "none")))
;; php-mode is derived from c-mode.
("PHP" php-mode)
;; scss-mode is derived from css-mode.
("SCSS" scss-mode)
;; solidity-mode is derived from c-mode.
("Solidity" solidity-mode)
;; svelte-mode is derived from html-mode.
("Svelte"
svelte-mode
(web-mode
(web-mode-content-type "html")
(web-mode-engine "svelte")))
;; terraform-mode is derived from hcl-mode.
("Terraform" terraform-mode)
;; TypeScript/TSX need to come before JavaScript/JSX because in
;; web-mode we can tell them apart by file name extension only.
;;
;; This implies that we inconsistently classify unsaved temp
;; buffers using TypeScript/TSX as JavaScript/JSX.
("TSX"
typescript-tsx-mode
(web-mode
(web-mode-content-type "jsx")
(web-mode-engine "none")
(language-id--file-name-extension ".tsx")))
("TypeScript"
typescript-mode
(web-mode
(web-mode-content-type "javascript")
(web-mode-engine "none")
(language-id--file-name-extension ".ts")))
;; ReScript needs to come before Reason because in reason-mode
;; we can tell them apart by file name extension only.
("ReScript"
(reason-mode
(language-id--file-name-extension ".res")))
("ReScript"
(reason-mode
(language-id--file-name-extension ".resi")))
("Reason" reason-mode)
;; vue-html-mode is derived from html-mode.
("Vue"
vue-mode
vue-html-mode
(web-mode
(web-mode-content-type "html")
(web-mode-engine "vue")))
;;; The rest of the definitions are in alphabetical order.
("Assembly" asm-mode nasm-mode)
("ATS" ats-mode)
("Awk" awk-mode)
("Bazel" bazel-mode)
("BibTeX" bibtex-mode)
("C" c-mode)
("C#" csharp-mode)
("C++" c++-mode)
("Cabal Config" haskell-cabal-mode)
("Clojure" clojurescript-mode clojurec-mode clojure-mode)
("CMake" cmake-mode)
("Common Lisp" lisp-mode)
("Crystal" crystal-mode)
("CSS"
css-mode
(web-mode
(web-mode-content-type "css")
(web-mode-engine "none")))
("Cuda" cuda-mode)
("D" d-mode)
("Dart" dart-mode)
("Dhall" dhall-mode)
("Dockerfile" dockerfile-mode)
("EJS"
(web-mode
(web-mode-content-type "html")
(web-mode-engine "ejs")))
("Elixir" elixir-mode)
("Elm" elm-mode)
("Emacs Lisp" emacs-lisp-mode)
("Erlang" erlang-mode)
("F#" fsharp-mode)
("Fish" fish-mode)
("Fortran" fortran-mode)
("Fortran Free Form" f90-mode)
("GLSL" glsl-mode)
("Go" go-mode)
("GraphQL" graphql-mode)
("Haskell" haskell-mode)
("HCL" hcl-mode)
("HTML"
html-helper-mode
mhtml-mode
html-mode
nxhtml-mode
(web-mode
(web-mode-content-type "html")
(web-mode-engine "none")))
("Java" java-mode)
("JavaScript"
(js-mode
(flow-minor-mode nil))
(js2-mode
(flow-minor-mode nil))
(js3-mode
(flow-minor-mode nil))
(web-mode
(web-mode-content-type "javascript")
(web-mode-engine "none")))
("JSON"
json-mode
(web-mode
(web-mode-content-type "json")
(web-mode-engine "none")))
("Jsonnet" jsonnet-mode)
("JSX"
js2-jsx-mode
jsx-mode
rjsx-mode
react-mode
(web-mode
(web-mode-content-type "jsx")
(web-mode-engine "none")))
("Kotlin" kotlin-mode)
("LaTeX" latex-mode)
("Less" less-css-mode)
("Literate Haskell" literate-haskell-mode)
("Lua" lua-mode)
("Markdown" gfm-mode markdown-mode)
("Nix" nix-mode)
("Objective-C" objc-mode)
("OCaml" caml-mode tuareg-mode)
("Perl" cperl-mode perl-mode)
("Protocol Buffer" protobuf-mode)
("PureScript" purescript-mode)
("Python" python-mode)
("R"
ess-r-mode
(ess-mode
(ess-dialect "R")))
("Racket" racket-mode)
("Ruby" enh-ruby-mode ruby-mode)
("Rust" rust-mode rustic-mode)
("Scala" scala-mode)
("Scheme" scheme-mode)
("Shell" sh-mode)
("SQL" sql-mode)
("Swift" swift-mode swift3-mode)
("TOML" toml-mode conf-toml-mode)
("V" v-mode)
("Verilog" verilog-mode)
("XML"
nxml-mode
xml-mode
(web-mode
(web-mode-content-type "xml")
(web-mode-engine "none")))
("YAML" yaml-mode)
("Zig" zig-mode))
"Internal table of programming language definitions.")
(defun language-id--mode-match-p (mode)
"Interal helper to match current buffer against MODE."
(let ((mode (if (listp mode) mode (list mode))))
(cl-destructuring-bind (wanted-major-mode &rest variables) mode
(and (derived-mode-p wanted-major-mode)
(cl-every
(lambda (variable)
(cl-destructuring-bind (symbol wanted-value) variable
(equal wanted-value
(if (boundp symbol) (symbol-value symbol) nil))))
variables)))))
(defun language-id-buffer ()
"Get GitHub Linguist language name for current buffer.
Return the name of the programming language or markup language
used in the current buffer. The name is a string from the GitHub
Linguist language list. The language is determined by looking at
the active `major-mode'. Some major modes support more than one
language. In that case minor modes and possibly other variables
are consulted to disambiguate the language.
In addition to the modes bundled with GNU Emacs, many third-party
modes are recognized. No statistical text matching or other
heuristics are used in detecting the language.
The language definitions live inside the language-id library and
are updated in new releases of the library.
If the language is not unambiguously recognized, the function
returns nil."
(let ((language-id--file-name-extension
(downcase (file-name-extension (or (buffer-file-name) "") t))))
(cl-some (lambda (definition)
(cl-destructuring-bind (language-id &rest modes) definition
(when (cl-some #'language-id--mode-match-p modes)
language-id)))
language-id--definitions)))
(provide 'language-id)
;;; language-id.el ends here