queries.rs 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155
  1. use heed3::RoTxn;
  2. use get_routes::handler;
  3. use helix_db::{field_remapping, identifier_remapping, traversal_remapping, exclude_field, value_remapping};
  4. use helix_db::helix_engine::vector_core::vector::HVector;
  5. use helix_db::{
  6. helix_engine::graph_core::ops::{
  7. g::G,
  8. in_::{in_::InAdapter, in_e::InEdgesAdapter, to_n::ToNAdapter},
  9. out::{from_n::FromNAdapter, out::OutAdapter, out_e::OutEdgesAdapter},
  10. source::{
  11. add_e::{AddEAdapter, EdgeType},
  12. add_n::AddNAdapter,
  13. e_from_id::EFromIdAdapter,
  14. e_from_type::EFromTypeAdapter,
  15. n_from_id::NFromIdAdapter,
  16. n_from_type::NFromTypeAdapter,
  17. n_from_index::NFromIndexAdapter,
  18. },
  19. tr_val::{Traversable, TraversalVal},
  20. util::{
  21. dedup::DedupAdapter, filter_mut::FilterMut,
  22. filter_ref::FilterRefAdapter, range::RangeAdapter, update::UpdateAdapter,
  23. map::MapAdapter, paths::ShortestPathAdapter, props::PropsAdapter, drop::Drop,
  24. },
  25. vectors::{insert::InsertVAdapter, search::SearchVAdapter, brute_force_search::BruteForceSearchVAdapter},
  26. bm25::search_bm25::SearchBM25Adapter,
  27. },
  28. helix_engine::types::GraphError,
  29. helix_gateway::router::router::HandlerInput,
  30. node_matches, props,
  31. protocol::count::Count,
  32. protocol::remapping::{RemappingMap, ResponseRemapping},
  33. protocol::response::Response,
  34. protocol::{
  35. filterable::Filterable, remapping::Remapping, return_values::ReturnValue, value::Value, id::ID,
  36. },
  37. };
  38. use sonic_rs::{Deserialize, Serialize};
  39. use std::collections::{HashMap, HashSet};
  40. use std::sync::Arc;
  41. use std::time::Instant;
  42. use std::cell::RefCell;
  43. use chrono::{DateTime, Utc};
  44. pub struct Doc {
  45. pub content: String,
  46. pub number: i32,
  47. }
  48. pub struct Chunk {
  49. pub content: String,
  50. }
  51. pub struct EmbeddingOf {
  52. pub from: Doc,
  53. pub to: Embedding,
  54. }
  55. pub struct Embedding {
  56. pub chunk: String,
  57. pub chunk_id: i32,
  58. pub number: i32,
  59. pub reference: String,
  60. }
  61. #[derive(Serialize, Deserialize)]
  62. pub struct searchEmbeddingInput {
  63. pub query: Vec<f64>
  64. }
  65. #[handler]
  66. pub fn searchEmbedding (input: &HandlerInput, response: &mut Response) -> Result<(), GraphError> {
  67. let data: searchEmbeddingInput = match sonic_rs::from_slice(&input.request.body) {
  68. Ok(data) => data,
  69. Err(err) => return Err(GraphError::from(err)),
  70. };
  71. let mut remapping_vals = RemappingMap::new();
  72. let db = Arc::clone(&input.graph.storage);
  73. let txn = db.graph_env.read_txn().unwrap();
  74. let c = G::new(Arc::clone(&db), &txn)
  75. .n_from_index("number", &1).collect_to::<Vec<_>>();
  76. let embedding_search = G::new(Arc::clone(&db), &txn)
  77. .search_v::<fn(&HVector, &RoTxn) -> bool>(&data.query, 10, None).collect_to::<Vec<_>>();
  78. let mut return_vals: HashMap<String, ReturnValue> = HashMap::new();
  79. return_vals.insert("embedding_search".to_string(), ReturnValue::from_traversal_value_array_with_mixin(G::new_from(Arc::clone(&db), &txn, embedding_search.clone())
  80. .map_traversal(|item, txn| { traversal_remapping!(remapping_vals, item.clone(), "chunk" => G::new_from(Arc::clone(&db), &txn, vec![item.clone()])
  81. .check_property("chunk").collect_to::<Vec<_>>())?;
  82. traversal_remapping!(remapping_vals, item.clone(), "chunk_id" => G::new_from(Arc::clone(&db), &txn, vec![item.clone()])
  83. .check_property("chunk_id").collect_to::<Vec<_>>())?;
  84. traversal_remapping!(remapping_vals, item.clone(), "number" => G::new_from(Arc::clone(&db), &txn, vec![item.clone()])
  85. .check_property("number").collect_to::<Vec<_>>())?;
  86. traversal_remapping!(remapping_vals, item.clone(), "reference" => G::new_from(Arc::clone(&db), &txn, vec![item.clone()])
  87. .check_property("reference").collect_to::<Vec<_>>())?;
  88. Ok(item) }).collect_to::<Vec<_>>().clone(), remapping_vals.borrow_mut()));
  89. txn.commit().unwrap();
  90. response.body = sonic_rs::to_vec(&return_vals).unwrap();
  91. Ok(())
  92. }
  93. #[derive(Serialize, Deserialize)]
  94. pub struct addEmbeddingInput {
  95. pub vec: Vec<f64>
  96. }
  97. #[handler]
  98. pub fn addEmbedding (input: &HandlerInput, response: &mut Response) -> Result<(), GraphError> {
  99. let data: addEmbeddingInput = match sonic_rs::from_slice(&input.request.body) {
  100. Ok(data) => data,
  101. Err(err) => return Err(GraphError::from(err)),
  102. };
  103. let mut remapping_vals = RemappingMap::new();
  104. let db = Arc::clone(&input.graph.storage);
  105. let mut txn = db.graph_env.write_txn().unwrap();
  106. let doc = G::new_mut(Arc::clone(&db), &mut txn)
  107. .add_n("Doc", Some(props! { "number" => 1, "content" => "Hello, content!" }), Some(&["number"])).collect_to::<Vec<_>>();
  108. let embedding = G::new_mut(Arc::clone(&db), &mut txn)
  109. .insert_v::<fn(&HVector, &RoTxn) -> bool>(&data.vec, "Embedding", Some(props! { "chunk_id" => 1, "number" => 1, "chunk" => "Hello, chunk!", "reference" => "Hello, reference!" })).collect_to::<Vec<_>>();
  110. G::new_mut(Arc::clone(&db), &mut txn)
  111. .add_e("EmbeddingOf", None, doc.id(), embedding.id(), true, EdgeType::Node).collect_to::<Vec<_>>();
  112. let mut return_vals: HashMap<String, ReturnValue> = HashMap::new();
  113. return_vals.insert("embedding".to_string(), ReturnValue::from_traversal_value_array_with_mixin(embedding.clone(), remapping_vals.borrow_mut()));
  114. txn.commit().unwrap();
  115. response.body = sonic_rs::to_vec(&return_vals).unwrap();
  116. Ok(())
  117. }
  118. #[handler]
  119. pub fn getAllEmbedding (input: &HandlerInput, response: &mut Response) -> Result<(), GraphError> {
  120. let mut remapping_vals = RemappingMap::new();
  121. let db = Arc::clone(&input.graph.storage);
  122. let txn = db.graph_env.read_txn().unwrap();
  123. let c = G::new(Arc::clone(&db), &txn)
  124. .n_from_index("number", &1).collect_to::<Vec<_>>();
  125. let embeddings = G::new_from(Arc::clone(&db), &txn, c.clone())
  126. .out("EmbeddingOf",&EdgeType::Vec).collect_to::<Vec<_>>();
  127. let mut return_vals: HashMap<String, ReturnValue> = HashMap::new();
  128. return_vals.insert("embeddings".to_string(), ReturnValue::from_traversal_value_array_with_mixin(embeddings.clone(), remapping_vals.borrow_mut()));
  129. txn.commit().unwrap();
  130. response.body = sonic_rs::to_vec(&return_vals).unwrap();
  131. Ok(())
  132. }