
This PR makes it so the `/fetch` slash command will display an error when the URL does not have any textual content: <img width="308" alt="Screenshot 2024-08-08 at 4 51 55 PM" src="https://github.com/user-attachments/assets/bf4cbc18-c65b-48a2-aedd-26b50f47f018"> Release Notes: - N/A
169 lines
5.5 KiB
Rust
169 lines
5.5 KiB
Rust
use std::cell::RefCell;
|
|
use std::rc::Rc;
|
|
use std::sync::atomic::AtomicBool;
|
|
use std::sync::Arc;
|
|
|
|
use anyhow::{anyhow, bail, Context, Result};
|
|
use assistant_slash_command::{
|
|
ArgumentCompletion, SlashCommand, SlashCommandOutput, SlashCommandOutputSection,
|
|
};
|
|
use futures::AsyncReadExt;
|
|
use gpui::{AppContext, Task, WeakView};
|
|
use html_to_markdown::{convert_html_to_markdown, markdown, TagHandler};
|
|
use http_client::{AsyncBody, HttpClient, HttpClientWithUrl};
|
|
use language::LspAdapterDelegate;
|
|
use ui::prelude::*;
|
|
use workspace::Workspace;
|
|
|
|
#[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Copy)]
|
|
enum ContentType {
|
|
Html,
|
|
Plaintext,
|
|
Json,
|
|
}
|
|
|
|
pub(crate) struct FetchSlashCommand;
|
|
|
|
impl FetchSlashCommand {
|
|
async fn build_message(http_client: Arc<HttpClientWithUrl>, url: &str) -> Result<String> {
|
|
let mut url = url.to_owned();
|
|
if !url.starts_with("https://") && !url.starts_with("http://") {
|
|
url = format!("https://{url}");
|
|
}
|
|
|
|
let mut response = http_client.get(&url, AsyncBody::default(), true).await?;
|
|
|
|
let mut body = Vec::new();
|
|
response
|
|
.body_mut()
|
|
.read_to_end(&mut body)
|
|
.await
|
|
.context("error reading response body")?;
|
|
|
|
if response.status().is_client_error() {
|
|
let text = String::from_utf8_lossy(body.as_slice());
|
|
bail!(
|
|
"status error {}, response: {text:?}",
|
|
response.status().as_u16()
|
|
);
|
|
}
|
|
|
|
let Some(content_type) = response.headers().get("content-type") else {
|
|
bail!("missing Content-Type header");
|
|
};
|
|
let content_type = content_type
|
|
.to_str()
|
|
.context("invalid Content-Type header")?;
|
|
let content_type = match content_type {
|
|
"text/html" => ContentType::Html,
|
|
"text/plain" => ContentType::Plaintext,
|
|
"application/json" => ContentType::Json,
|
|
_ => ContentType::Html,
|
|
};
|
|
|
|
match content_type {
|
|
ContentType::Html => {
|
|
let mut handlers: Vec<TagHandler> = vec![
|
|
Rc::new(RefCell::new(markdown::WebpageChromeRemover)),
|
|
Rc::new(RefCell::new(markdown::ParagraphHandler)),
|
|
Rc::new(RefCell::new(markdown::HeadingHandler)),
|
|
Rc::new(RefCell::new(markdown::ListHandler)),
|
|
Rc::new(RefCell::new(markdown::TableHandler::new())),
|
|
Rc::new(RefCell::new(markdown::StyledTextHandler)),
|
|
];
|
|
if url.contains("wikipedia.org") {
|
|
use html_to_markdown::structure::wikipedia;
|
|
|
|
handlers.push(Rc::new(RefCell::new(wikipedia::WikipediaChromeRemover)));
|
|
handlers.push(Rc::new(RefCell::new(wikipedia::WikipediaInfoboxHandler)));
|
|
handlers.push(Rc::new(
|
|
RefCell::new(wikipedia::WikipediaCodeHandler::new()),
|
|
));
|
|
} else {
|
|
handlers.push(Rc::new(RefCell::new(markdown::CodeHandler)));
|
|
}
|
|
|
|
convert_html_to_markdown(&body[..], &mut handlers)
|
|
}
|
|
ContentType::Plaintext => Ok(std::str::from_utf8(&body)?.to_owned()),
|
|
ContentType::Json => {
|
|
let json: serde_json::Value = serde_json::from_slice(&body)?;
|
|
|
|
Ok(format!(
|
|
"```json\n{}\n```",
|
|
serde_json::to_string_pretty(&json)?
|
|
))
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
impl SlashCommand for FetchSlashCommand {
|
|
fn name(&self) -> String {
|
|
"fetch".into()
|
|
}
|
|
|
|
fn description(&self) -> String {
|
|
"insert URL contents".into()
|
|
}
|
|
|
|
fn menu_text(&self) -> String {
|
|
"Insert fetched URL contents".into()
|
|
}
|
|
|
|
fn requires_argument(&self) -> bool {
|
|
true
|
|
}
|
|
|
|
fn complete_argument(
|
|
self: Arc<Self>,
|
|
_query: String,
|
|
_cancel: Arc<AtomicBool>,
|
|
_workspace: Option<WeakView<Workspace>>,
|
|
_cx: &mut AppContext,
|
|
) -> Task<Result<Vec<ArgumentCompletion>>> {
|
|
Task::ready(Ok(Vec::new()))
|
|
}
|
|
|
|
fn run(
|
|
self: Arc<Self>,
|
|
argument: Option<&str>,
|
|
workspace: WeakView<Workspace>,
|
|
_delegate: Option<Arc<dyn LspAdapterDelegate>>,
|
|
cx: &mut WindowContext,
|
|
) -> Task<Result<SlashCommandOutput>> {
|
|
let Some(argument) = argument else {
|
|
return Task::ready(Err(anyhow!("missing URL")));
|
|
};
|
|
let Some(workspace) = workspace.upgrade() else {
|
|
return Task::ready(Err(anyhow!("workspace was dropped")));
|
|
};
|
|
|
|
let http_client = workspace.read(cx).client().http_client();
|
|
let url = argument.to_string();
|
|
|
|
let text = cx.background_executor().spawn({
|
|
let url = url.clone();
|
|
async move { Self::build_message(http_client, &url).await }
|
|
});
|
|
|
|
let url = SharedString::from(url);
|
|
cx.foreground_executor().spawn(async move {
|
|
let text = text.await?;
|
|
if text.trim().is_empty() {
|
|
bail!("no textual content found");
|
|
}
|
|
|
|
let range = 0..text.len();
|
|
Ok(SlashCommandOutput {
|
|
text,
|
|
sections: vec![SlashCommandOutputSection {
|
|
range,
|
|
icon: IconName::AtSign,
|
|
label: format!("fetch {}", url).into(),
|
|
}],
|
|
run_commands_in_text: false,
|
|
})
|
|
})
|
|
}
|
|
}
|