mirror of
https://github.com/github/codeql.git
synced 2026-03-10 01:26:47 +01:00
205 lines
7.0 KiB
Rust
205 lines
7.0 KiB
Rust
use itertools::Itertools;
|
|
use log::{debug, info};
|
|
use ra_ap_base_db::SourceDatabase;
|
|
use ra_ap_hir::Semantics;
|
|
use ra_ap_ide_db::RootDatabase;
|
|
use ra_ap_load_cargo::{load_workspace_at, LoadCargoConfig, ProcMacroServerChoice};
|
|
use ra_ap_paths::Utf8PathBuf;
|
|
use ra_ap_project_model::CargoConfig;
|
|
use ra_ap_project_model::ProjectManifest;
|
|
use ra_ap_project_model::RustLibSource;
|
|
use ra_ap_span::Edition;
|
|
use ra_ap_span::EditionedFileId;
|
|
use ra_ap_span::TextRange;
|
|
use ra_ap_span::TextSize;
|
|
use ra_ap_syntax::SourceFile;
|
|
use ra_ap_syntax::SyntaxError;
|
|
use ra_ap_vfs::Vfs;
|
|
use ra_ap_vfs::VfsPath;
|
|
use ra_ap_vfs::{AbsPathBuf, FileId};
|
|
use std::borrow::Cow;
|
|
use std::path::{Path, PathBuf};
|
|
use triomphe::Arc;
|
|
pub enum RustAnalyzer<'a> {
|
|
WithSemantics {
|
|
vfs: &'a Vfs,
|
|
semantics: &'a Semantics<'a, RootDatabase>,
|
|
},
|
|
WithoutSemantics {
|
|
reason: &'a str,
|
|
},
|
|
}
|
|
|
|
pub struct FileSemanticInformation<'a> {
|
|
pub file_id: EditionedFileId,
|
|
pub semantics: &'a Semantics<'a, RootDatabase>,
|
|
}
|
|
|
|
pub struct ParseResult<'a> {
|
|
pub ast: SourceFile,
|
|
pub text: Arc<str>,
|
|
pub errors: Vec<SyntaxError>,
|
|
pub semantics_info: Result<FileSemanticInformation<'a>, &'a str>,
|
|
}
|
|
|
|
impl<'a> RustAnalyzer<'a> {
|
|
pub fn load_workspace(
|
|
project: &ProjectManifest,
|
|
scratch_dir: &Path,
|
|
) -> Option<(RootDatabase, Vfs)> {
|
|
let config = CargoConfig {
|
|
sysroot: Some(RustLibSource::Discover),
|
|
target_dir: ra_ap_paths::Utf8PathBuf::from_path_buf(scratch_dir.to_path_buf())
|
|
.map(|x| x.join("target"))
|
|
.ok(),
|
|
..Default::default()
|
|
};
|
|
let progress = |t| (log::trace!("progress: {}", t));
|
|
let load_config = LoadCargoConfig {
|
|
load_out_dirs_from_check: true,
|
|
with_proc_macro_server: ProcMacroServerChoice::Sysroot,
|
|
prefill_caches: false,
|
|
};
|
|
let manifest = project.manifest_path();
|
|
|
|
match load_workspace_at(manifest.as_ref(), &config, &load_config, &progress) {
|
|
Ok((db, vfs, _macro_server)) => Some((db, vfs)),
|
|
Err(err) => {
|
|
log::error!("failed to load workspace for {}: {}", manifest, err);
|
|
None
|
|
}
|
|
}
|
|
}
|
|
pub fn new(vfs: &'a Vfs, semantics: &'a Semantics<'a, RootDatabase>) -> Self {
|
|
RustAnalyzer::WithSemantics { vfs, semantics }
|
|
}
|
|
pub fn parse(&self, path: &Path) -> ParseResult {
|
|
let no_semantics_reason;
|
|
match self {
|
|
RustAnalyzer::WithSemantics { vfs, semantics } => {
|
|
if let Some(file_id) = path_to_file_id(path, vfs) {
|
|
if let Ok(input) = std::panic::catch_unwind(|| semantics.db.file_text(file_id))
|
|
{
|
|
let file_id = EditionedFileId::current_edition(file_id);
|
|
let source_file = semantics.parse(file_id);
|
|
let errors = semantics
|
|
.db
|
|
.parse_errors(file_id)
|
|
.into_iter()
|
|
.flat_map(|x| x.to_vec())
|
|
.collect();
|
|
|
|
return ParseResult {
|
|
ast: source_file,
|
|
text: input,
|
|
errors,
|
|
semantics_info: Ok(FileSemanticInformation { file_id, semantics }),
|
|
};
|
|
}
|
|
debug!(
|
|
"No text available for file_id '{:?}', falling back to loading file '{}' from disk.",
|
|
file_id,
|
|
path.to_string_lossy()
|
|
);
|
|
no_semantics_reason = "no text available for the file in the project";
|
|
} else {
|
|
no_semantics_reason = "file not found in project";
|
|
}
|
|
}
|
|
RustAnalyzer::WithoutSemantics { reason } => {
|
|
no_semantics_reason = reason;
|
|
}
|
|
}
|
|
let mut errors = Vec::new();
|
|
let input = match std::fs::read(path) {
|
|
Ok(data) => data,
|
|
Err(e) => {
|
|
errors.push(SyntaxError::new(
|
|
format!("Could not read {}: {}", path.to_string_lossy(), e),
|
|
TextRange::empty(TextSize::default()),
|
|
));
|
|
vec![]
|
|
}
|
|
};
|
|
let (input, err) = from_utf8_lossy(&input);
|
|
|
|
let parse = ra_ap_syntax::ast::SourceFile::parse(&input, Edition::CURRENT);
|
|
errors.extend(parse.errors());
|
|
errors.extend(err);
|
|
ParseResult {
|
|
ast: parse.tree(),
|
|
text: input.as_ref().into(),
|
|
errors,
|
|
semantics_info: Err(no_semantics_reason),
|
|
}
|
|
}
|
|
}
|
|
|
|
pub fn find_project_manifests(
|
|
files: &[PathBuf],
|
|
) -> anyhow::Result<Vec<ra_ap_project_model::ProjectManifest>> {
|
|
let current = std::env::current_dir()?;
|
|
let abs_files: Vec<_> = files
|
|
.iter()
|
|
.map(|path| AbsPathBuf::assert_utf8(current.join(path)))
|
|
.collect();
|
|
let ret = ra_ap_project_model::ProjectManifest::discover_all(&abs_files);
|
|
let iter = || ret.iter().map(|m| format!(" {m}"));
|
|
const LOG_LIMIT: usize = 10;
|
|
if ret.len() <= LOG_LIMIT {
|
|
info!("found manifests:\n{}", iter().join("\n"));
|
|
} else {
|
|
info!(
|
|
"found manifests:\n{}\nand {} more",
|
|
iter().take(LOG_LIMIT).join("\n"),
|
|
ret.len() - LOG_LIMIT
|
|
);
|
|
debug!(
|
|
"rest of the manifests found:\n{}",
|
|
iter().dropping(LOG_LIMIT).join("\n")
|
|
);
|
|
}
|
|
Ok(ret)
|
|
}
|
|
fn from_utf8_lossy(v: &[u8]) -> (Cow<'_, str>, Option<SyntaxError>) {
|
|
let mut iter = v.utf8_chunks();
|
|
let (first_valid, first_invalid) = if let Some(chunk) = iter.next() {
|
|
let valid = chunk.valid();
|
|
let invalid = chunk.invalid();
|
|
if invalid.is_empty() {
|
|
debug_assert_eq!(valid.len(), v.len());
|
|
return (Cow::Borrowed(valid), None);
|
|
}
|
|
(valid, invalid)
|
|
} else {
|
|
return (Cow::Borrowed(""), None);
|
|
};
|
|
|
|
const REPLACEMENT: &str = "\u{FFFD}";
|
|
let error_start = first_valid.len() as u32;
|
|
let error_end = error_start + first_invalid.len() as u32;
|
|
let error_range = TextRange::new(TextSize::new(error_start), TextSize::new(error_end));
|
|
let error = SyntaxError::new("invalid utf-8 sequence".to_owned(), error_range);
|
|
let mut res = String::with_capacity(v.len());
|
|
res.push_str(first_valid);
|
|
|
|
res.push_str(REPLACEMENT);
|
|
|
|
for chunk in iter {
|
|
res.push_str(chunk.valid());
|
|
if !chunk.invalid().is_empty() {
|
|
res.push_str(REPLACEMENT);
|
|
}
|
|
}
|
|
|
|
(Cow::Owned(res), Some(error))
|
|
}
|
|
|
|
pub(crate) fn path_to_file_id(path: &Path, vfs: &Vfs) -> Option<FileId> {
|
|
Utf8PathBuf::from_path_buf(path.to_path_buf())
|
|
.ok()
|
|
.and_then(|x| AbsPathBuf::try_from(x).ok())
|
|
.map(VfsPath::from)
|
|
.and_then(|x| vfs.file_id(&x))
|
|
}
|