expanded embeddable context to accomodate for struct context and file paths
This commit is contained in:
parent
dd0dbdc5bd
commit
02f523094b
1 changed files with 31 additions and 15 deletions
|
@ -20,6 +20,9 @@ pub struct ParsedFile {
|
||||||
pub documents: Vec<Document>,
|
pub documents: Vec<Document>,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
const CODE_CONTEXT_TEMPLATE: &str =
|
||||||
|
"The below code snippet is from file '<path>'\n\n```<language>\n<item>\n```";
|
||||||
|
|
||||||
pub struct CodeContextRetriever {
|
pub struct CodeContextRetriever {
|
||||||
pub parser: Parser,
|
pub parser: Parser,
|
||||||
pub cursor: QueryCursor,
|
pub cursor: QueryCursor,
|
||||||
|
@ -58,27 +61,40 @@ impl CodeContextRetriever {
|
||||||
tree.root_node(),
|
tree.root_node(),
|
||||||
content.as_bytes(),
|
content.as_bytes(),
|
||||||
) {
|
) {
|
||||||
let mut item_range: Option<Range<usize>> = None;
|
let mut name: Vec<&str> = vec![];
|
||||||
let mut name_range: Option<Range<usize>> = None;
|
let mut item: Option<&str> = None;
|
||||||
|
let mut offset: Option<usize> = None;
|
||||||
for capture in mat.captures {
|
for capture in mat.captures {
|
||||||
if capture.index == embedding_config.item_capture_ix {
|
if capture.index == embedding_config.item_capture_ix {
|
||||||
item_range = Some(capture.node.byte_range());
|
offset = Some(capture.node.byte_range().start);
|
||||||
|
item = content.get(capture.node.byte_range());
|
||||||
} else if capture.index == embedding_config.name_capture_ix {
|
} else if capture.index == embedding_config.name_capture_ix {
|
||||||
name_range = Some(capture.node.byte_range());
|
if let Some(name_content) = content.get(capture.node.byte_range()) {
|
||||||
|
name.push(name_content);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if let Some(context_capture_ix) = embedding_config.context_capture_ix {
|
||||||
|
if capture.index == context_capture_ix {
|
||||||
|
if let Some(context) = content.get(capture.node.byte_range()) {
|
||||||
|
name.push(context);
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if let Some((item_range, name_range)) = item_range.zip(name_range) {
|
if item.is_some() && offset.is_some() && name.len() > 0 {
|
||||||
if let Some((item, name)) =
|
let context_span = CODE_CONTEXT_TEMPLATE
|
||||||
content.get(item_range.clone()).zip(content.get(name_range))
|
.replace("<path>", pending_file.relative_path.to_str().unwrap())
|
||||||
{
|
.replace("<language>", &pending_file.language.name().to_lowercase())
|
||||||
context_spans.push(item.to_string());
|
.replace("<item>", item.unwrap());
|
||||||
documents.push(Document {
|
|
||||||
name: name.to_string(),
|
context_spans.push(context_span);
|
||||||
offset: item_range.start,
|
documents.push(Document {
|
||||||
embedding: Vec::new(),
|
name: name.join(" "),
|
||||||
});
|
offset: offset.unwrap(),
|
||||||
}
|
embedding: Vec::new(),
|
||||||
|
})
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue