-
Notifications
You must be signed in to change notification settings - Fork 1
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #5 from chenwanqq/rerank
add rerank model support
- Loading branch information
Showing
10 changed files
with
236 additions
and
5 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,36 @@ | ||
use erniebot_rs::reranker::{RerankerEndpoint, RerankerModel}; | ||
use tokio::runtime::Runtime; | ||
|
||
fn test_reranker() { | ||
let reranker = RerankerEndpoint::new(RerankerModel::BceRerankerBaseV1).unwrap(); | ||
let query = "你好".to_string(); | ||
let documents = vec![ | ||
"你好".to_string(), | ||
"你叫什么名字".to_string(), | ||
"你是谁".to_string(), | ||
]; | ||
let reranker_response = reranker.invoke(query, documents, None, None).unwrap(); | ||
let reranker_results = reranker_response.get_reranker_response().unwrap(); | ||
println!("{},{:?}", reranker_results.len(), reranker_results); | ||
} | ||
|
||
fn test_async_reranker() { | ||
let reranker = RerankerEndpoint::new(RerankerModel::BceRerankerBaseV1).unwrap(); | ||
let query = "你好".to_string(); | ||
let documents = vec![ | ||
"你好".to_string(), | ||
"你叫什么名字".to_string(), | ||
"你是谁".to_string(), | ||
]; | ||
let rt = Runtime::new().unwrap(); | ||
let reranker_response = rt | ||
.block_on(reranker.ainvoke(query, documents, None, None)) | ||
.unwrap(); | ||
let reranker_results = reranker_response.get_reranker_response().unwrap(); | ||
println!("{},{:?}", reranker_results.len(), reranker_results); | ||
} | ||
|
||
fn main() { | ||
test_reranker(); | ||
test_async_reranker(); | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,99 @@ | ||
use super::model::RerankerModel; | ||
use super::response::RerankerResponse; | ||
use crate::errors::ErnieError; | ||
use crate::utils::{build_url, get_access_token}; | ||
use json_value_merge::Merge; | ||
use serde_json::Value; | ||
use url::Url; | ||
|
||
/// Base URL of the reranker API; it is passed to `build_url` together with
/// the model name when a `RerankerEndpoint` is created.
static RERANKER_BASE_URL: &str =
    "https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/reranker/";
|
||
/** ChatEndpoint is a struct that represents the chat endpoint of erniebot API | ||
*/ | ||
pub struct RerankerEndpoint { | ||
url: Url, | ||
access_token: String, | ||
} | ||
|
||
impl RerankerEndpoint { | ||
// create a new embedding instance using pre-defined model | ||
pub fn new(model: RerankerModel) -> Result<Self, ErnieError> { | ||
Ok(RerankerEndpoint { | ||
url: build_url(RERANKER_BASE_URL, model.to_string().as_str())?, | ||
access_token: get_access_token()?, | ||
}) | ||
} | ||
/// sync invoke | ||
pub fn invoke( | ||
&self, | ||
query: String, | ||
documents: Vec<String>, | ||
top_n: Option<u64>, | ||
user_id: Option<String>, | ||
) -> Result<RerankerResponse, ErnieError> { | ||
let mut body = serde_json::json!({ | ||
"query": query, | ||
"documents": documents, | ||
}); | ||
if let Some(top_n) = top_n { | ||
body.merge(&serde_json::json!({"top_n": top_n})); | ||
} | ||
if let Some(user_id) = user_id { | ||
body.merge(&serde_json::json!({"user_id": user_id})); | ||
} | ||
let client = reqwest::blocking::Client::new(); | ||
let response: Value = client | ||
.post(self.url.as_str()) | ||
.query(&[("access_token", self.access_token.as_str())]) | ||
.json(&body) | ||
.send() | ||
.map_err(|e| ErnieError::InvokeError(e.to_string()))? | ||
.json() | ||
.map_err(|e| ErnieError::InvokeError(e.to_string()))?; | ||
|
||
//if error_code key in response, means RemoteAPIError | ||
if response.get("error_code").is_some() { | ||
return Err(ErnieError::RemoteAPIError(response.to_string())); | ||
} | ||
|
||
Ok(RerankerResponse::new(response)) | ||
} | ||
///async invoke | ||
pub async fn ainvoke( | ||
&self, | ||
query: String, | ||
documents: Vec<String>, | ||
top_n: Option<u64>, | ||
user_id: Option<String>, | ||
) -> Result<RerankerResponse, ErnieError> { | ||
let mut body = serde_json::json!({ | ||
"query": query, | ||
"documents": documents, | ||
}); | ||
if let Some(top_n) = top_n { | ||
body.merge(&serde_json::json!({"top_n": top_n})); | ||
} | ||
if let Some(user_id) = user_id { | ||
body.merge(&serde_json::json!({"user_id": user_id})); | ||
} | ||
let client = reqwest::Client::new(); | ||
let response: Value = client | ||
.post(self.url.as_str()) | ||
.query(&[("access_token", self.access_token.as_str())]) | ||
.json(&body) | ||
.send() | ||
.await | ||
.map_err(|e| ErnieError::InvokeError(e.to_string()))? | ||
.json() | ||
.await | ||
.map_err(|e| ErnieError::InvokeError(e.to_string()))?; | ||
|
||
//if error_code key in response, means RemoteAPIError | ||
if response.get("error_code").is_some() { | ||
return Err(ErnieError::RemoteAPIError(response.to_string())); | ||
} | ||
|
||
Ok(RerankerResponse::new(response)) | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,7 @@ | ||
mod endpoint; | ||
mod model; | ||
mod response; | ||
|
||
pub use endpoint::RerankerEndpoint; | ||
pub use model::RerankerModel; | ||
pub use response::RerankerResponse; |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,11 @@ | ||
use serde::{Deserialize, Serialize}; | ||
use strum_macros::{Display, EnumString}; | ||
|
||
#[derive(Debug, Default, Clone, Serialize, Deserialize, EnumString, Display, PartialEq, Eq)] | ||
#[non_exhaustive] | ||
pub enum RerankerModel { | ||
#[default] | ||
#[strum(serialize = "bce_reranker_base")] | ||
#[serde(rename = "bce_reranker_base")] | ||
BceRerankerBaseV1, | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,71 @@ | ||
use crate::errors::ErnieError; | ||
use serde::{Deserialize, Serialize}; | ||
use serde_json::value; | ||
|
||
/// Response is using for non-stream response | ||
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)] | ||
pub struct RerankerResponse { | ||
raw_response: value::Value, | ||
} | ||
|
||
impl RerankerResponse { | ||
pub fn new(raw_response: value::Value) -> Self { | ||
RerankerResponse { raw_response } | ||
} | ||
|
||
pub fn get_raw_response(&self) -> &value::Value { | ||
&self.raw_response | ||
} | ||
|
||
pub fn get(&self, key: &str) -> Option<&value::Value> { | ||
self.raw_response.get(key) | ||
} | ||
|
||
pub fn get_mut(&mut self, key: &str) -> Option<&mut value::Value> { | ||
self.raw_response.get_mut(key) | ||
} | ||
|
||
/// get the result of reranker response | ||
pub fn get_reranker_response(&self) -> Result<Vec<RerankData>, ErnieError> { | ||
match self.raw_response.get("results") { | ||
Some(data) => { | ||
let data_array = data | ||
.as_array() | ||
.ok_or(ErnieError::GetResponseError( | ||
"reranker results is not an array".to_string(), | ||
))? | ||
.clone(); | ||
let results = data_array | ||
.into_iter() | ||
.map(|x| { | ||
serde_json::from_value(x) | ||
.map_err(|e| ErnieError::GetResponseError(e.to_string())) | ||
}) | ||
.collect::<Result<Vec<RerankData>, ErnieError>>()?; | ||
Ok(results) | ||
} | ||
None => Err(ErnieError::GetResponseError( | ||
"reranker results is not found".to_string(), | ||
)), | ||
} | ||
} | ||
/// get tokens used by prompt | ||
pub fn get_prompt_tokens(&self) -> Option<u64> { | ||
let usage = self.get("usage")?.as_object()?; | ||
let prompt_tokens = usage.get("prompt_tokens")?.as_u64()?; | ||
Some(prompt_tokens) | ||
} | ||
/// get tokens used by completion | ||
pub fn get_total_tokens(&self) -> Option<u64> { | ||
let usage = self.get("usage")?.as_object()?; | ||
let total_tokens = usage.get("total_tokens")?.as_u64()?; | ||
Some(total_tokens) | ||
} | ||
} | ||
|
||
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)] | ||
pub struct RerankData { | ||
document: String, | ||
relevance_score: f64, | ||
index: u64, | ||
} |