rust/crates/libsyntax2/src/lib.rs

253 lines
7.6 KiB
Rust
Raw Normal View History

//! An experimental implementation of [Rust RFC#2256 libsyntax2.0][rfc#2256].
//!
//! The intent is to be an IDE-ready parser, i.e. one that offers
//!
//! - easy and fast incremental re-parsing,
//! - graceful handling of errors, and
//! - full preservation of all information in the source file.
//!
//! For more information, see [the RFC][rfc#2256], or [the working draft][RFC.md].
//!
//! [rfc#2256]: <https://github.com/rust-lang/rfcs/pull/2256>
//! [RFC.md]: <https://github.com/matklad/libsyntax2/blob/master/docs/RFC.md>
2018-07-30 13:08:06 +02:00
#![forbid(
missing_debug_implementations,
unconditional_recursion,
future_incompatible
)]
2018-07-29 12:51:55 +02:00
#![deny(bad_style, missing_docs)]
#![allow(missing_docs)]
//#![warn(unreachable_pub)] // rust-lang/rust#47816
2018-07-31 14:40:40 +02:00
extern crate itertools;
2018-07-30 13:08:06 +02:00
extern crate unicode_xid;
2018-08-01 13:55:37 +02:00
extern crate drop_bomb;
2018-08-01 21:07:09 +02:00
extern crate parking_lot;
2018-08-13 13:24:22 +02:00
extern crate smol_str;
extern crate text_unit;
2017-12-29 21:33:04 +01:00
2018-07-31 14:40:40 +02:00
pub mod algo;
pub mod ast;
2017-12-28 22:56:36 +01:00
mod lexer;
2018-07-31 22:38:19 +02:00
#[macro_use]
2018-09-06 15:54:54 +02:00
mod token_set;
2018-07-31 22:38:19 +02:00
mod parser_api;
mod grammar;
mod parser_impl;
2018-07-29 14:16:07 +02:00
mod syntax_kinds;
2018-08-08 18:44:16 +02:00
mod yellow;
2018-07-30 14:25:52 +02:00
/// Utilities for simple uses of the parser.
pub mod utils;
2018-08-24 12:41:25 +02:00
pub mod text_utils;
2018-07-29 14:16:07 +02:00
pub use {
2018-08-18 11:42:28 +02:00
text_unit::{TextRange, TextUnit},
smol_str::SmolStr,
2018-08-25 10:40:17 +02:00
ast::AstNode,
2018-07-30 13:08:06 +02:00
lexer::{tokenize, Token},
2018-07-29 14:16:07 +02:00
syntax_kinds::SyntaxKind,
2018-08-17 20:10:55 +02:00
yellow::{SyntaxNode, SyntaxNodeRef, OwnedRoot, RefRoot, TreeRoot, SyntaxError},
2018-07-29 14:16:07 +02:00
};
2018-08-25 12:17:54 +02:00
use {
SyntaxKind::*,
yellow::{GreenNode, SyntaxRoot},
parser_api::Parser,
};
2018-08-25 11:10:35 +02:00
2018-08-25 10:40:17 +02:00
#[derive(Clone, Debug)]
2018-08-25 10:44:58 +02:00
pub struct File {
2018-08-25 10:40:17 +02:00
root: SyntaxNode
}
2018-08-25 10:44:58 +02:00
impl File {
2018-08-25 12:57:13 +02:00
fn new(green: GreenNode, errors: Vec<SyntaxError>) -> File {
let root = SyntaxRoot::new(green, errors);
2018-08-25 11:10:35 +02:00
let root = SyntaxNode::new_owned(root);
2018-09-08 17:34:41 +02:00
if cfg!(debug_assertions) {
utils::validate_block_structure(root.borrowed());
}
2018-08-25 10:44:58 +02:00
File { root }
2018-08-25 10:40:17 +02:00
}
2018-08-25 11:44:26 +02:00
pub fn parse(text: &str) -> File {
2018-08-25 11:10:35 +02:00
let tokens = tokenize(&text);
2018-08-25 13:45:17 +02:00
let (green, errors) = parser_impl::parse_with::<yellow::GreenBuilder>(
text, &tokens, grammar::root,
);
2018-08-25 12:57:13 +02:00
File::new(green, errors)
2018-08-25 11:10:35 +02:00
}
2018-08-25 12:17:54 +02:00
pub fn reparse(&self, edit: &AtomEdit) -> File {
2018-08-25 12:42:40 +02:00
self.incremental_reparse(edit).unwrap_or_else(|| self.full_reparse(edit))
2018-08-25 12:17:54 +02:00
}
2018-08-25 13:45:17 +02:00
pub fn incremental_reparse(&self, edit: &AtomEdit) -> Option<File> {
let (node, green, new_errors) =
self.reparse_leaf(&edit).or_else(|| self.reparse_block(&edit))?;
let green_root = node.replace_with(green);
let errors = merge_errors(self.errors(), new_errors, node, edit);
Some(File::new(green_root, errors))
}
fn reparse_leaf(&self, edit: &AtomEdit) -> Option<(SyntaxNodeRef, GreenNode, Vec<SyntaxError>)> {
let node = algo::find_covering_node(self.syntax(), edit.delete);
match node.kind() {
| WHITESPACE
| COMMENT
| DOC_COMMENT
| IDENT
| STRING
| RAW_STRING => {
let text = get_text_after_edit(node, &edit);
let tokens = tokenize(&text);
if tokens.len() != 1 || tokens[0].kind != node.kind() {
return None;
}
let green = GreenNode::new_leaf(node.kind(), &text);
let new_errors = vec![];
Some((node, green, new_errors))
},
_ => None,
}
}
fn reparse_block(&self, edit: &AtomEdit) -> Option<(SyntaxNodeRef, GreenNode, Vec<SyntaxError>)> {
2018-08-25 12:17:54 +02:00
let (node, reparser) = find_reparsable_node(self.syntax(), edit.delete)?;
let text = get_text_after_edit(node, &edit);
2018-08-25 12:57:13 +02:00
let tokens = tokenize(&text);
if !is_balanced(&tokens) {
return None;
}
let (green, new_errors) =
parser_impl::parse_with::<yellow::GreenBuilder>(
&text, &tokens, reparser,
);
Some((node, green, new_errors))
2018-08-25 12:17:54 +02:00
}
fn full_reparse(&self, edit: &AtomEdit) -> File {
2018-08-28 13:06:30 +02:00
let text = replace_range(self.syntax().text().to_string(), edit.delete, &edit.insert);
2018-08-25 12:17:54 +02:00
File::parse(&text)
}
2018-08-25 10:44:17 +02:00
pub fn ast(&self) -> ast::Root {
ast::Root::cast(self.syntax()).unwrap()
2018-08-25 10:40:17 +02:00
}
pub fn syntax(&self) -> SyntaxNodeRef {
self.root.borrowed()
}
pub fn errors(&self) -> Vec<SyntaxError> {
self.syntax().root.syntax_root().errors.clone()
}
2018-08-24 18:27:30 +02:00
}
2018-08-25 11:44:26 +02:00
/// A single text edit: remove the `delete` range, then put `insert` in its place.
#[derive(Clone, Debug)]
pub struct AtomEdit {
    /// Range of the original text that is removed.
    pub delete: TextRange,
    /// Text that is inserted where the removed range started.
    pub insert: String,
}
impl AtomEdit {
    /// Creates an edit that replaces `range` with `replace_with`.
    pub fn replace(range: TextRange, replace_with: String) -> AtomEdit {
        let (delete, insert) = (range, replace_with);
        AtomEdit { delete, insert }
    }

    /// Creates an edit that removes `range` and inserts nothing.
    pub fn delete(range: TextRange) -> AtomEdit {
        AtomEdit { delete: range, insert: String::new() }
    }

    /// Creates an edit that inserts `text` at `offset` without removing anything.
    pub fn insert(offset: TextUnit, text: String) -> AtomEdit {
        // A zero-length range at `offset` means "delete nothing here".
        let empty_at_offset = TextRange::offset_len(offset, 0.into());
        AtomEdit { delete: empty_at_offset, insert: text }
    }
}
2018-08-25 12:17:54 +02:00
/// Returns the text of `node` as it would look after applying `edit`.
///
/// `edit.delete` is expressed in file coordinates, so it is shifted by the
/// start offset of `node` before being applied to the node's own text.
fn get_text_after_edit(node: SyntaxNodeRef, edit: &AtomEdit) -> String {
    let node_text = node.text().to_string();
    let range_in_node = edit.delete - node.range().start();
    replace_range(node_text, range_in_node, &edit.insert)
}
2018-08-25 12:17:54 +02:00
/// Finds the innermost node that covers `range` and can be re-parsed on its own.
///
/// Starts from the node covering `range` and walks the sequence produced by
/// `algo::ancestors`, returning the first node for which a dedicated grammar
/// entry point exists, together with that entry point.
fn find_reparsable_node(node: SyntaxNodeRef, range: TextRange) -> Option<(SyntaxNodeRef, fn(&mut Parser))> {
    /// Maps a node to the grammar function able to reparse it, if any.
    fn reparser(node: SyntaxNodeRef) -> Option<fn(&mut Parser)> {
        let parse_fn = match node.kind() {
            BLOCK => grammar::block,
            NAMED_FIELD_DEF_LIST => grammar::named_field_def_list,
            NAMED_FIELD_LIST => grammar::named_field_list,
            ENUM_VARIANT_LIST => grammar::enum_variant_list,
            MATCH_ARM_LIST => grammar::match_arm_list,
            USE_TREE_LIST => grammar::use_tree_list,
            EXTERN_ITEM_LIST => grammar::extern_item_list,
            // Only curly-delimited token trees are reparsable.
            TOKEN_TREE if node.first_child().unwrap().kind() == L_CURLY => grammar::token_tree,
            // The entry point for an item list depends on what contains it.
            ITEM_LIST => match node.parent().unwrap().kind() {
                IMPL_ITEM => grammar::impl_item_list,
                TRAIT_DEF => grammar::trait_item_list,
                MODULE => grammar::mod_item_list,
                _ => return None,
            },
            _ => return None,
        };
        Some(parse_fn)
    }

    let covering = algo::find_covering_node(node, range);
    for candidate in algo::ancestors(covering) {
        if let Some(parse_fn) = reparser(candidate) {
            return Some((candidate, parse_fn));
        }
    }
    None
}
2018-08-25 12:57:13 +02:00
2018-08-25 13:45:17 +02:00
pub /*(meh)*/ fn replace_range(mut text: String, range: TextRange, replace_with: &str) -> String {
2018-08-25 12:57:13 +02:00
let start = u32::from(range.start()) as usize;
let end = u32::from(range.end()) as usize;
text.replace_range(start..end, replace_with);
text
}
/// Checks that `tokens` form exactly one curly-brace-delimited group.
///
/// Returns `true` only if the first token is `L_CURLY`, the last token is
/// `R_CURLY`, and the curly braces *between* them are balanced on their own.
/// The outer pair is deliberately left out of the count: counting it would
/// accept a sequence such as `{ } { }`, where the opening brace is closed
/// before the end and the final `}` belongs to a different group.
fn is_balanced(tokens: &[Token]) -> bool {
    match (tokens.first(), tokens.last()) {
        (Some(first), Some(last)) if first.kind == L_CURLY && last.kind == R_CURLY => (),
        _ => return false,
    }
    // A single token cannot be both `{` and `}`, so there are at least two
    // tokens here and the inner slice below is always in bounds.
    let mut balance = 0usize;
    for t in &tokens[1..tokens.len() - 1] {
        match t.kind {
            L_CURLY => balance += 1,
            R_CURLY => {
                balance = match balance.checked_sub(1) {
                    Some(b) => b,
                    // An inner `}` with nothing to close would terminate the
                    // outer group early.
                    None => return false,
                }
            }
            _ => (),
        }
    }
    balance == 0
}
2018-08-25 13:45:17 +02:00
fn merge_errors(
old_errors: Vec<SyntaxError>,
new_errors: Vec<SyntaxError>,
2018-08-25 14:12:17 +02:00
old_node: SyntaxNodeRef,
2018-08-25 13:45:17 +02:00
edit: &AtomEdit,
) -> Vec<SyntaxError> {
let mut res = Vec::new();
for e in old_errors {
if e.offset <= old_node.range().start() {
2018-08-25 13:45:17 +02:00
res.push(e)
} else if e.offset >= old_node.range().end() {
2018-08-25 13:45:17 +02:00
res.push(SyntaxError {
msg: e.msg,
offset: e.offset + TextUnit::of_str(&edit.insert) - edit.delete.len(),
})
}
}
for e in new_errors {
res.push(SyntaxError {
msg: e.msg,
2018-08-25 14:12:17 +02:00
offset: e.offset + old_node.range().start(),
2018-08-25 13:45:17 +02:00
})
}
res
}