use crate::{codegen::Target, Objects, Reporter};
#[derive(Debug, Clone, Default)]
pub struct Docs {
lines: Vec<(String, String)>,
}
impl Docs {
pub fn from_raw_docs(
reporter: &Reporter,
virtpath: &str,
fqname: &str,
docs: Option<flatbuffers::Vector<'_, flatbuffers::ForwardsUOffset<&'_ str>>>,
) -> Self {
Self::from_lines(
reporter,
virtpath,
fqname,
docs.into_iter().flat_map(|doc| doc.into_iter()),
)
}
pub fn from_lines<'a>(
reporter: &Reporter,
virtpath: &str,
fqname: &str,
lines: impl Iterator<Item = &'a str>,
) -> Self {
let lines: Vec<(String, String)> = lines.map(parse_line).collect();
for (tag, comment) in &lines {
assert!(is_known_tag(tag), "Unknown tag: '\\{tag} {comment}'");
if tag.is_empty() {
find_and_recommend_doclinks(reporter, virtpath, fqname, comment);
}
}
Self { lines }
}
pub fn first_line(
&self,
reporter: &Reporter,
objects: &Objects,
target: Target,
) -> Option<String> {
let (tag, line) = self.lines.first()?;
assert!(
tag.is_empty(),
"Expected no tag on first line of docstring. Found: /// \\{tag} {line}"
);
Some(translate_doc_line(reporter, objects, line, target))
}
pub fn only_lines_tagged(&self, tag: &str) -> Vec<&str> {
assert!(is_known_tag(tag), "Unknown tag: '{tag}'");
self.lines
.iter()
.filter_map(
|(t, line)| {
if t == tag {
Some(line.as_str())
} else {
None
}
},
)
.collect()
}
pub(super) fn lines_for(
&self,
reporter: &Reporter,
objects: &Objects,
target: Target,
) -> Vec<String> {
let target_tag = match target {
Target::Cpp => "cpp",
Target::Python => "py",
Target::Rust => "rs",
Target::WebDocsMarkdown => "md",
};
assert!(
is_known_tag(target_tag),
"Unknown target tag: '{target_tag}'"
);
remove_extra_newlines(self.lines.iter().filter_map(|(tag, line)| {
if tag.is_empty() {
Some(translate_doc_line(reporter, objects, line, target))
} else if tag == target_tag {
Some(line.to_owned())
} else {
None
}
}))
}
}
fn remove_extra_newlines(lines: impl Iterator<Item = String>) -> Vec<String> {
let mut lines: Vec<String> = lines.collect();
lines.dedup();
while let Some(line) = lines.last() {
if line.is_empty() {
lines.pop();
} else {
break;
}
}
lines
}
fn is_known_tag(tag: &str) -> bool {
matches!(tag, "" | "example" | "cpp" | "py" | "rs" | "md")
}
fn parse_line(line: &str) -> (String, String) {
if let Some(line) = line.strip_prefix(" \\") {
let tag = line.split_whitespace().next().unwrap().to_owned();
let line = &line[tag.len()..];
if let Some(line) = line.strip_prefix(' ') {
(tag, line.to_owned())
} else {
assert!(line.is_empty());
(tag, String::new())
}
} else if let Some(line) = line.strip_prefix(' ') {
(String::new(), line.to_owned())
} else {
assert!(
line.is_empty(),
"Comments should start with a single space; found {line:?}"
);
(String::new(), String::new())
}
}
fn find_and_recommend_doclinks(
reporter: &Reporter,
virtpath: &str,
fqname: &str,
full_comment: &str,
) {
let mut comment = full_comment;
while let Some(start) = comment.find('`') {
comment = &comment[start + 1..];
if let Some(end) = comment.find('`') {
let content = &comment[..end];
let looks_like_type_name = content.len() > 5
&& content.chars().all(|c| c.is_ascii_alphanumeric())
&& content.chars().next().unwrap().is_ascii_uppercase()
&& !matches!(content, "ViewContents" | "VisibleTimeRanges" | "QueryExpression")
&& !matches!(content, "ChunkStore" | "ContainerId" | "EntityPathFilter" | "Spatial2DView" | "ViewId" | "View")
&& !matches!(content, "OpenStreetMap");
if looks_like_type_name {
reporter.warn(virtpath, fqname, format!("`{content}` can be written as a doclink, e.g. [archetypes.{content}] in comment: /// {full_comment}"));
}
comment = &comment[end + 1..];
} else {
return;
}
}
}
use doclink_translation::translate_doc_line;
mod doclink_translation {
use crate::{ObjectKind, Objects, Reporter};
use super::Target;
pub fn translate_doc_line(
reporter: &Reporter,
objects: &Objects,
input: &str,
target: Target,
) -> String {
let mut out_tokens: Vec<String> = vec![];
let mut within_backticks = false;
let mut tokens = tokenize(input).into_iter().peekable();
while let Some(token) = tokens.next() {
if token == "`" {
within_backticks = !within_backticks;
out_tokens.push(token.to_owned());
continue;
}
if within_backticks {
out_tokens.push(token.to_owned());
continue;
}
if token == "[" {
let mut doclink_tokens = vec![token];
for token in &mut tokens {
doclink_tokens.push(token);
if token == "]" {
break;
}
}
if tokens
.peek()
.is_some_and(|next_token| next_token.starts_with('('))
{
out_tokens.extend(doclink_tokens.iter().map(|&s| s.to_owned()));
continue;
}
out_tokens.push(translate_doclink(
reporter,
objects,
&doclink_tokens,
target,
));
continue;
}
out_tokens.push(token.to_owned());
}
out_tokens.into_iter().collect()
}
fn translate_doclink(
reporter: &Reporter,
objects: &Objects,
doclink_tokens: &[&str],
target: Target,
) -> String {
try_translate_doclink(objects, doclink_tokens, target).unwrap_or_else(|err| {
let original_doclink: String = doclink_tokens.join("");
let looks_like_rerun_doclink =
!original_doclink.contains(' ') && original_doclink.len() > 6;
if looks_like_rerun_doclink {
reporter.warn_no_context(format!(
"Looks like a Rerun doclink, but fails to parse: {original_doclink} - {err}"
));
}
original_doclink
})
}
fn try_translate_doclink(
objects: &Objects,
doclink_tokens: &[&str],
target: Target,
) -> Result<String, String> {
let has_type_or_enum = doclink_tokens.iter().filter(|t| t == &&".").count() == 2;
let mut tokens = doclink_tokens.iter();
if tokens.next() != Some(&"[") {
return Err("Missing opening bracket".to_owned());
}
let kind = *tokens.next().ok_or("Missing kind")?;
if kind == "`" {
return Err("Do not use backticks inside doclinks".to_owned());
}
if tokens.next() != Some(&".") {
return Err("Missing dot".to_owned());
}
let type_name = *tokens.next().ok_or("Missing type name")?;
let field_or_enum_name = if has_type_or_enum {
if tokens.next() != Some(&".") {
return Err("Missing dot".to_owned());
}
tokens.next()
} else {
None
};
if tokens.next() != Some(&"]") {
return Err("Missing closing bracket".to_owned());
}
if tokens.next().is_some() {
return Err("Trailing tokens".to_owned());
}
if ObjectKind::ALL
.iter()
.all(|object_kind| object_kind.plural_snake_case() != kind)
{
return Err(format!(
"Invalid kind {kind:?}. Valid are: {}",
ObjectKind::ALL
.map(|object_kind| object_kind.plural_snake_case())
.join(", ")
));
}
let is_unreleased;
let scope;
{
let mut candidates = vec![];
for obj in objects.values() {
if obj.kind.plural_snake_case() == kind && obj.name == type_name {
candidates.push(obj);
}
}
let Some(object) = candidates.first() else {
return Err("No object found for doclink".to_owned());
};
if candidates.len() > 2 {
use itertools::Itertools as _;
return Err(format!(
"Multiple objects found for doclink: {}",
candidates.iter().map(|obj| &obj.fqname).format(", ")
));
}
scope = object.scope().unwrap_or_default();
is_unreleased = object.is_attr_set(crate::ATTR_DOCS_UNRELEASED);
}
Ok(match target {
Target::Cpp => {
if let Some(field_or_enum_name) = field_or_enum_name {
format!("`{kind}::{type_name}::{field_or_enum_name}`")
} else {
format!("`{kind}::{type_name}`")
}
}
Target::Rust => {
let kind_and_type = format!("{kind}::{type_name}");
let object_path = if scope.is_empty() {
kind_and_type.clone()
} else {
format!("{scope}::{kind_and_type}")
};
if let Some(field_or_enum_name) = field_or_enum_name {
format!(
"[`{kind_and_type}::{field_or_enum_name}`][crate::{object_path}::{field_or_enum_name}]"
)
} else {
format!("[`{kind_and_type}`][crate::{object_path}]")
}
}
Target::Python => {
let kind_and_type = format!("{kind}.{type_name}");
let object_path = if scope.is_empty() {
format!("rerun.{kind_and_type}")
} else {
format!("rerun.{scope}.{kind_and_type}")
};
if let Some(field_or_enum_name) = field_or_enum_name {
format!("[`{kind_and_type}.{field_or_enum_name}`][{object_path}.{field_or_enum_name}]")
} else {
format!("[`{kind_and_type}`][{object_path}]")
}
}
Target::WebDocsMarkdown => {
let kind_and_type = format!("{kind}.{type_name}");
if scope == "blueprint" && (kind == "components" || kind == "archetypes") {
return Ok(kind_and_type);
}
let type_name_snake_case = re_case::to_snake_case(type_name);
let query = if is_unreleased {
"?speculative-link" } else {
""
};
let url = format!(
"https://rerun.io/docs/reference/types/{kind}/{type_name_snake_case}{query}"
);
if let Some(field_or_enum_name) = field_or_enum_name {
format!("[`{kind_and_type}#{field_or_enum_name}`]({url})")
} else {
format!("[`{kind_and_type}`]({url})")
}
}
})
}
pub(super) fn tokenize(input: &str) -> Vec<&str> {
tokenize_with(input, &['[', ']', '`', '.'])
}
fn tokenize_with<'input>(mut input: &'input str, special_chars: &[char]) -> Vec<&'input str> {
let mut tokens = vec![];
while !input.is_empty() {
if let Some(index) = input.find(|c| special_chars.contains(&c)) {
if 0 < index {
tokens.push(&input[..index]);
}
tokens.push(&input[index..index + 1]);
input = &input[index + 1..];
} else {
tokens.push(input);
break;
}
}
tokens
}
}
#[cfg(test)]
mod tests {
use crate::{
codegen::Target,
docs::doclink_translation::{tokenize, translate_doc_line},
Attributes, Docs, Object, ObjectKind, Objects,
};
fn test_objects() -> Objects {
Objects {
objects: std::iter::once((
"rerun.views.Spatial2DView".to_owned(),
Object {
virtpath: "path".to_owned(),
filepath: "path".into(),
fqname: "rerun.views.Spatial2DView".to_owned(),
pkg_name: "test".to_owned(),
name: "Spatial2DView".to_owned(),
docs: Docs::default(),
kind: ObjectKind::View,
attrs: Attributes::default(),
fields: Vec::new(),
class: crate::ObjectClass::Struct,
datatype: None,
},
))
.collect(),
}
}
#[test]
fn test_tokenize() {
assert_eq!(tokenize("This is a comment"), vec!["This is a comment"]);
assert_eq!(
tokenize("A vector `[1, 2, 3]` and a doclink [archetype.Image]."),
vec![
"A vector ",
"`",
"[",
"1, 2, 3",
"]",
"`",
" and a doclink ",
"[",
"archetype",
".",
"Image",
"]",
"."
]
);
}
#[test]
fn test_translate_doclinks() {
let objects = test_objects();
let (_report, reporter) = crate::report::init();
let input =
"A vector `[1, 2, 3]` and a doclink [views.Spatial2DView] and a [url](www.rerun.io).";
assert_eq!(
translate_doc_line(&reporter, &objects, input, Target::Cpp),
"A vector `[1, 2, 3]` and a doclink `views::Spatial2DView` and a [url](www.rerun.io)."
);
assert_eq!(
translate_doc_line(
&reporter,
&objects,
input,
Target::Python
),
"A vector `[1, 2, 3]` and a doclink [`views.Spatial2DView`][rerun.blueprint.views.Spatial2DView] and a [url](www.rerun.io)."
);
assert_eq!(
translate_doc_line(
&reporter,
&objects,
input,
Target::Rust
),
"A vector `[1, 2, 3]` and a doclink [`views::Spatial2DView`][crate::blueprint::views::Spatial2DView] and a [url](www.rerun.io)."
);
assert_eq!(
translate_doc_line(
&reporter,
&objects,
input,
Target::WebDocsMarkdown
),
"A vector `[1, 2, 3]` and a doclink [`views.Spatial2DView`](https://rerun.io/docs/reference/types/views/spatial2d_view) and a [url](www.rerun.io)."
);
}
#[test]
fn test_translate_doclinks_with_field() {
let objects = test_objects();
let (_report, reporter) = crate::report::init();
let input =
"A vector `[1, 2, 3]` and a doclink [views.Spatial2DView.position] and a [url](www.rerun.io).";
assert_eq!(
translate_doc_line(
&reporter,
&objects,
input,
Target::Cpp
),
"A vector `[1, 2, 3]` and a doclink `views::Spatial2DView::position` and a [url](www.rerun.io)."
);
assert_eq!(
translate_doc_line(
&reporter,
&objects,
input,
Target::Python
),
"A vector `[1, 2, 3]` and a doclink [`views.Spatial2DView.position`][rerun.blueprint.views.Spatial2DView.position] and a [url](www.rerun.io)."
);
assert_eq!(
translate_doc_line(
&reporter,
&objects,
input,
Target::Rust
),
"A vector `[1, 2, 3]` and a doclink [`views::Spatial2DView::position`][crate::blueprint::views::Spatial2DView::position] and a [url](www.rerun.io)."
);
assert_eq!(
translate_doc_line(
&reporter,
&objects,
input,
Target::WebDocsMarkdown
),
"A vector `[1, 2, 3]` and a doclink [`views.Spatial2DView#position`](https://rerun.io/docs/reference/types/views/spatial2d_view) and a [url](www.rerun.io)."
);
}
#[test]
fn test_docs() {
let objects = test_objects();
let (_report, reporter) = crate::report::init();
let docs = Docs::from_lines(
&reporter,
"testpath",
"testfqname",
[
r" Doclink to [views.Spatial2DView].",
r" ",
r" The second line.",
r" ",
r" \py Only for Python.",
r" ",
r" The third line.",
r" ",
r" \cpp Only for C++.",
]
.into_iter(),
);
assert_eq!(docs.only_lines_tagged("py"), vec!["Only for Python.",]);
assert_eq!(docs.only_lines_tagged("cpp"), vec!["Only for C++.",]);
assert_eq!(
docs.lines_for(&reporter, &objects, Target::Python),
vec![
"Doclink to [`views.Spatial2DView`][rerun.blueprint.views.Spatial2DView].",
"",
"The second line.",
"",
"Only for Python.",
"",
"The third line.",
]
);
assert_eq!(
docs.lines_for(&reporter, &objects, Target::Cpp),
vec![
"Doclink to `views::Spatial2DView`.",
"",
"The second line.",
"",
"The third line.",
"",
"Only for C++.",
]
);
assert_eq!(
docs.first_line(&reporter, &objects, Target::Rust),
Some(
"Doclink to [`views::Spatial2DView`][crate::blueprint::views::Spatial2DView]."
.to_owned()
)
);
}
}